#!/usr/bin/env bash
#
# Launch train_second.py through `accelerate launch`, restricted to the GPU
# with index 7 via CUDA_VISIBLE_DEVICES.
#
# Usage: run from the directory that contains train_second.py (the script
# path below is relative).
#
# Argument layout:
#   * Options before `train_second.py` are consumed by `accelerate launch`.
#   * Options after it are forwarded to train_second.py.
#   * --mixed_precision is therefore given twice on purpose: once for the
#     launcher and once for the training script.
#
# NOTE(review): --multi_gpu is requested while only one device is visible;
#   confirm this is intended for the installed accelerate version.
# NOTE(review): --max_train_steps=30 and --num_train_epochs 2 are both set;
#   presumably the step limit takes precedence -- verify in train_second.py.
# NOTE(review): --checkpointing_steps 500 exceeds the 30-step limit, so an
#   intermediate checkpoint may never be written -- TODO confirm.
#
# The body is kept POSIX-compatible (no arrays, no pipelines), so only the
# portable strict-mode subset is enabled.
set -eu

CUDA_VISIBLE_DEVICES=7 accelerate launch \
  --mixed_precision="bf16" \
  --multi_gpu \
  train_second.py \
  --resolution=768 --center_crop --random_flip \
  --train_batch_size=1 \
  --gradient_accumulation_steps=4 \
  --gradient_checkpointing \
  --max_train_steps=30 \
  --learning_rate=1e-5 \
  --max_grad_norm=1 \
  --lr_scheduler="linear" --lr_warmup_steps=0 \
  --checkpointing_steps 500 \
  --num_train_epochs 2 \
  --mixed_precision bf16 \
  --checkpoints_total_limit 3 \
  --l 0.0 \
  --lambda_total 0.0 \
  --lambda_contrast 0.0

# Disabled option, kept for reference. It must stay outside the continued
# command: a backslash inside a comment does not continue the line. To
# re-enable it, add ` \` after `--lambda_contrast 0.0` and append:
#   --report_to "wandb"