#!/bin/bash

# Model checkpoint locations on the shared filesystem.
# NOTE: ultracm_path and autoj_path are assigned twice. The first pair of
# values is captured into the `models` array; the second pair (assigned after
# the array is built) is what any later "$ultracm_path" / "$autoj_path"
# expansion sees.
ultracm_path=/cpfs02/llm/shared/public/lantian/exp/20240501_sft_7b_critique_ultracm_878/aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47_critic_ultracm/878_hf_ckpt
autoj_path=/cpfs02/llm/shared/public/lantian/exp/20240501_sft_7b_critique_autoj_26/aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47_critic_autoj/26_hf_ckpt
tigerscore_path=/cpfs02/llm/shared/public/lantian/hf_models/TIGER-Lab/TIGERScore-7B
d4_5_l1_resumm_path=/cpfs02/llm/shared/public/lantian/exp/20240618_sft_7b_critique_nips2024_d4_st_5_l1_resumm_385_epoch_2_0701/aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47_FINAL_critic_v4_st_5_l1_resumm/385_hf_ckpt
# Fixed: the original read `base_path=base_path=/...`, which stored the literal
# text "base_path=/..." as the value instead of the path itself.
base_path=/cpfs02/llm/shared/public/lantian/exp/20240418_aliyun_Ampere_7B_v1_1_FT_v1_0_0_s1_rc48_1660_hf_ckpt
# Snapshot of the paths assigned above; quoted so each path stays one element.
models=("$d4_5_l1_resumm_path" "$ultracm_path" "$autoj_path")
# Re-point the two names at the 13b checkpoints (does not affect `models`).
ultracm_path=/cpfs02/llm/shared/public/lantian/hf_models/openbmb/UltraCM-13b
autoj_path=/cpfs02/llm/shared/public/lantian/hf_models/GAIR/autoj-13b
prometheus=/cpfs02/llm/shared/public/lantian/exp/promethues/aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47_promethues/540_hf


# Launch evaluate.py with only GPU 0 visible, passing the checkpoint in
# $ultracm_path as --hf_critic_model and an existing critique file.
# The --existed_crit_file value is a relative path — presumably resolved
# against the current working directory; run from the expected directory.
# prompt_type: fs, zs-crit-cot, zs-crit-ao-1
CUDA_VISIBLE_DEVICES=0 python evaluate.py \
  --available_gpus 0 \
  --tasks Q \
  --prompt_type zs-crit-cot \
  --hf_critic_model "$ultracm_path" \
  --enable_code_execution \
  --existed_crit_file 20240903_jingduduiqi_20240925/_cpfs02_llm_shared_public_lantian_exp_step_train_exp_20240925_ultracm_1_aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47_critic_ultracm_14_hf/critique/result_09_27_10_26_56.jsonl

#--hf_critic_model $d4_5_l1_resumm_path \
#--existed_crit_file /cpfs02/llm/shared/public/lantian/NIPS_2024/evaluation/CriticBench-THU/src/20240903_jingduduiqi/_cpfs02_llm_shared_public_lantian_exp_20240618_sft_7b_critique_nips2024_d4_st_5_l1_resumm_no_criteria_275_epoch_2_0703_aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47_FINAL_critic_v4_st_5_l1_resumm_no_criteria_275_hf_ckpt/critique/result_09_04_16_41_18.jsonl
#--existed_crit_file /cpfs02/llm/shared/public/lantian/NIPS_2024/evaluation/CriticBench-THU/src/20240823_rlhf_relabel/_cpfs02_llm_shared_public_lantian_exp_internlm2_5_s1_d4_st_5_l1_resumm_20240906_internlm2_5_7b_s1_aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47_s1_d4_st_5_l1_resumm_20240906_internlm2_5_7b_s1_385_hf_ckpt/critique/result_09_07_23_13_37.jsonl
