# SVD: https://huggingface.co/stabilityai/stable-video-diffusion-img2vid-xt
# SVD 1.1:  https://huggingface.co/stabilityai/stable-video-diffusion-img2vid-xt-1-1

# Launch train_pose_on_latent.py through `accelerate launch`.
#
# - CUDA_VISIBLE_DEVICES exposes GPUs 0-7 to the launched process.
# - --video_folder and --ann_folder point at the same dataset directory.
# - --output_dir is a relative path, so it is resolved against the directory
#   this script is run from (assuming the training script does not chdir).
# - The exact meaning of each flag is defined by train_pose_on_latent.py.
#
# NOTE(review): the base model below is the non-"xt" img2vid checkpoint, while
# the reference links at the top of this file are for the "-xt" variants;
# confirm which one is intended.
#
# Continuation rules: every continued line ends in " \" (a space before the
# backslash, so adjacent flags can never fuse together), and the final
# argument must NOT end in a backslash, otherwise whatever line follows would
# be swallowed as an extra argument of this command.
CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 accelerate launch train_pose_on_latent.py \
  --pretrained_model_name_or_path="stabilityai/stable-video-diffusion-img2vid" \
  --output_dir="model_out/ControlSVD-2024.12.10_pose_on_latent" \
  --video_folder="/users/zeyuzhu/dataset_project/Datasets/fallowshow/datasets" \
  --ann_folder="/users/zeyuzhu/dataset_project/Datasets/fallowshow/datasets" \
  --width=384 \
  --height=256 \
  --num_frames=16 \
  --learning_rate=2e-5 \
  --per_gpu_batch_size=1 \
  --num_train_epochs=500 \
  --mixed_precision="fp16" \
  --gradient_accumulation_steps=2 \
  --checkpointing_steps=1000 \
  --gradient_checkpointing



