# Launch train_clean.py through `accelerate launch` as 8 processes.
#
# CUDA_VISIBLE_DEVICES is set as a prefix assignment, so it applies to this
# one command only and lists device ids 0-7 (one per process).
#
# Everything after the script name is forwarded to train_clean.py: dataset
# "cifar10" at resolution 32 with center-crop and random-flip enabled, batch
# size 32, 100 epochs, checkpointing every 2000 steps, EMA enabled, mixed
# precision "no". The model config is read from ../cifar10-ddpmpp-deep-vp
# (relative to the directory the command is run from) and results go to
# ddpmpp-cifar10-100e-fintune-ema.
# NOTE(review): exact flag semantics (e.g. whether the batch size is
# per-process) are defined by train_clean.py, which is not visible here.
CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 \
  accelerate launch \
  --num_processes 8 \
  train_clean.py \
  --dataset_name="cifar10" \
  --resolution=32 \
  --center_crop \
  --random_flip \
  --output_dir="ddpmpp-cifar10-100e-fintune-ema" \
  --train_batch_size=32 \
  --num_epochs=100 \
  --checkpointing_steps=2000 \
  --model_config_name_or_path ../cifar10-ddpmpp-deep-vp \
  --use_ema \
  --mixed_precision no