# Launch ./main.py through the PyTorch distributed launcher, with a single
# worker process, on GPU 0 only.

# Restrict CUDA to device index 0. This must be its own statement: when the
# launcher command is written on the same line as `export`, the shell treats
# every following word as a variable name to export and never runs python.
export CUDA_VISIBLE_DEVICES=0

# --nproc_per_node=1 starts one worker process on this node.
# Standard output is appended to test.log; stderr is left on the terminal.
# The trailing backslash must be the last character on its line to act as a
# line continuation (a backslash followed by a space is an escaped space and
# would become part of the next argument).
python -m torch.distributed.run --nproc_per_node=1 \
  ./main.py >> test.log