#!/usr/bin/env bash
#
# Launch train.py through torch.distributed.run, one worker process per
# visible GPU, using a LAVIS YAML config.
#
# Optional environment overrides (defaults reproduce the original command):
#   GPU_IDS    comma-separated GPU indices exported as CUDA_VISIBLE_DEVICES
#              (default: 0,1,2,3)
#   DIST_PORT  port passed to --master_port (default: 10021)
#   CFG_PATH   config file passed to train.py via --cfg-path
#              (default: lavis/projects/blip2/train/RN50/pretrain_RN512_word.yaml)
#
# Exit status: that of the python launcher, or 1 if GPU_IDS yields no entries.

set -euo pipefail

gpu_ids="${GPU_IDS:-0,1,2,3}"
dist_port="${DIST_PORT:-10021}"
cfg_path="${CFG_PATH:-lavis/projects/blip2/train/RN50/pretrain_RN512_word.yaml}"

# Derive the worker count from the GPU list so --nproc_per_node can never
# drift out of sync with CUDA_VISIBLE_DEVICES.
IFS=',' read -r -a gpu_list <<< "${gpu_ids}"
nproc="${#gpu_list[@]}"

if (( nproc < 1 )); then
  printf 'error: GPU_IDS must list at least one GPU index (got: %s)\n' \
    "${gpu_ids}" >&2
  exit 1
fi

CUDA_VISIBLE_DEVICES="${gpu_ids}" python -m torch.distributed.run \
  --master_port="${dist_port}" \
  --nproc_per_node="${nproc}" \
  train.py \
  --cfg-path "${cfg_path}"