#!/usr/bin/env bash
#
# Launch encoder_based_method.py through `accelerate launch` with --task="train".
#
# Usage:
#   bash <this script> [extra flags...]
#
# Environment:
#   IMG_DIR  Image directory passed as --img_dir; the reference and target
#            image (1.jpg) are taken from the same directory.
#            Default: data/CelebAMask-HQ/CelebA-HQ-img
#
# Any arguments given to this script are appended verbatim after the flags
# listed below. All relative paths are resolved against the current working
# directory, so run this from the directory that contains `data/`.
set -euo pipefail

# Single source of truth for the dataset location (it was previously repeated
# in three separate flags).
readonly IMG_DIR="${IMG_DIR:-data/CelebAMask-HQ/CelebA-HQ-img}"

# Fail early with a clear message instead of a bare "command not found".
if ! command -v accelerate >/dev/null 2>&1; then
  printf 'error: "accelerate" not found on PATH\n' >&2
  exit 127
fi

# An array keeps every flag a separate, correctly quoted word and, unlike
# backslash continuations, allows comments between entries.
args=(
  # Model selection and loading.
  --model-path="llava-v1.5-7b"
  --load-8bit

  # Reference / target images and the query prompt.
  --ref_img "${IMG_DIR}/1.jpg"
  --tgt_img "${IMG_DIR}/1.jpg"
  --prompt="Can you spot <sks> in this photo?"

  # Output and logging locations.
  --output_dir="exp/encoder_pos_prob_0_7/"
  --logging_dir="log"

  # Run configuration.
  --task="train"
  --img_dir="${IMG_DIR}"
  --gradient_accumulation_steps=1
  --mixed_precision="fp16"
  --num_train_steps=90000
  --importance_weight=2.0
  --pos_prob=0.7
  --yes_no_ratio=0.6
  --num_query=16
)

accelerate launch encoder_based_method.py "${args[@]}" "$@"