# python openrlhf/main/dpo_evaluating.py --ckpt_path /data/checkpoint/gemma3-1b-cpo --model_name google/gemma-3-1b-pt --save_path ./results/gemma-3-1b-cpo.csv
# python openrlhf/main/dpo_evaluating.py --ckpt_path /data/checkpoint/gemma3-1b-ppm --model_name google/gemma-3-1b-pt --save_path ./results/gemma-3-1b-ppm.csv
# Active run: invoke openrlhf/main/dpo_evaluating.py for the Qwen2.5-1.5B
# SimPO checkpoint. The commented-out commands around this one call the same
# script with other checkpoint / model / output combinations; swap which
# command is uncommented to switch runs.
# NOTE(review): presumably --ckpt_path is the fine-tuned checkpoint directory,
# --model_name the base model identifier, and --save_path the CSV the script
# writes its results to -- confirm against dpo_evaluating.py.
python openrlhf/main/dpo_evaluating.py \
  --ckpt_path /data/checkpoint/qwen2.5-1.5b-simpo \
  --model_name Qwen/Qwen2.5-1.5B-Instruct \
  --save_path ./results/qwen2.5-1.5b-simpo.csv
# python openrlhf/main/dpo_evaluating.py --ckpt_path /home/ubuntu/projects/trl/qwen2.5-1.5b-cpo --model_name Qwen/Qwen2.5-1.5B-Instruct --save_path ./results/qwen2.5-1.5b-cpo.csv