#!/usr/bin/env bash
#
# Launches sft_sampling.py from $TAMPERING_HOME/tampering/rm/dataset against
# the hhrlhf_RM_5120 training file, writing to hhrlhf_RM_5120_ai_sft.json.
#
# Required environment variables:
#   TAMPERING_HOME  root directory containing tampering/ and datasets/
#   HF_NAME         prefix placed in front of the model name
#
# NOTE(review): intended to be executed (bash script.sh), not sourced -- the
# failure paths below terminate the shell.

# Abort early with a clear message instead of silently building paths such as
# "/tampering/rm/dataset" or a model name starting with "/".
: "${TAMPERING_HOME:?TAMPERING_HOME must be set}"
: "${HF_NAME:?HF_NAME must be set}"

# sft_sampling.py is invoked by relative name, so a failed cd must stop the
# script rather than run python from whatever directory we happen to be in.
cd -- "$TAMPERING_HOME/tampering/rm/dataset" || exit 1

export VLLM_TORCH_COMPILE=0
export CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7

# Directory holding both the input and the output JSON file.
train_dir="$TAMPERING_HOME/datasets/hhrlhf/rm/train"

# main experiment
# --gpus reuses the exported device list so the two cannot drift apart.
python sft_sampling.py --model_name "$HF_NAME/AT-qwen2.5-7b-hhrlhf-5120-sft-b3s3-ai" \
    --source_path "$train_dir/hhrlhf_RM_5120.json" \
    --target_path "$train_dir/hhrlhf_RM_5120_ai_sft.json" \
    --save_every 1 \
    --gpus "$CUDA_VISIBLE_DEVICES"