# Run sft.py through `accelerate launch`.
#
# The meaning of each flag is defined by sft.py, which is not shown here;
# the notes below are read off the flag names only -- confirm against sft.py.
# NOTE(review): sft.py and the model location are written as relative paths,
# so this presumably expects to be started from the directory that contains
# sft.py -- confirm.

# Stage the script arguments as positional parameters. This is the
# POSIX-portable stand-in for an array and keeps the launch line short.
#   --base_model_name  base model location (looks like a local checkout)
#   --exp_type         experiment selector understood by sft.py
#   --wandb_name       presumably the Weights & Biases run name -- TODO confirm
set -- \
    --base_model_name '../ppo/meta-llama/Llama-2-7b-hf' \
    --exp_type 'summary' \
    --wandb_name sft_summary

# CUDA_VISIBLE_DEVICES is set as a prefix assignment, so it applies to this
# one command only and is not left behind in the shell's environment.
CUDA_VISIBLE_DEVICES=0,1 accelerate launch sft.py "$@"