#!/usr/bin/env bash
#
# Launcher for the "phi2-code-sft-lr-6" run.
#
# Steps:
#   1. Install the pinned deepspeed release.
#   2. Change into the fastchat working directory.
#   3. Export RUN_CMD, OTHER and CODEFILE, then run dpo.code.a100.phi2.sh.
#
# NOTE(review): RUN_CMD / OTHER / CODEFILE are presumably read by
# dpo.code.a100.phi2.sh through the environment -- confirm against that script.

# Abort early if the pinned dependency cannot be installed, rather than
# launching the job against an unknown deepspeed version.
pip3 install deepspeed==0.14.0 || {
  printf 'error: failed to install deepspeed==0.14.0\n' >&2
  exit 1
}

# The child script is referenced by a relative path, so a failed cd must be
# fatal: otherwise we would look it up in the caller's directory.
cd /.../.../.../fastchat/ || {
  printf 'error: cannot cd to fastchat directory\n' >&2
  exit 1
}

# Launcher prefix: accelerate with the ZeRO-3 CPU-offload config, 8 processes.
export RUN_CMD="accelerate launch --config_file=/.../.../.../fastchat/accelerate_config/deepspeed_zero3_cpuoffload.yaml --num_processes=8  "

# Extra command-line flags for this run (task name, HDFS save path,
# gradient accumulation steps, learning rate).
export OTHER=" --my_task_name=phi2-code-sft-lr-6 --save_hdfs_path=....../home/.../.../user/.../metadata/generate/codedpo/phi2/phi2-code-sft-lr-6 --gradient_accumulation_steps=8 --learning_rate=1e-6 "

# Name of the Python entry file for this run.
export CODEFILE="code.sft.py"

# Hand off to the shared launch script; its exit status becomes ours.
bash dpo.code.a100.phi2.sh

