#!/bin/bash

# Checkpoint directories that can be handed to evaluate.py through
# --hf_critic_model. The two fragments below are shared by most paths, so they
# are spelled out once and interpolated.
exp_root=/cpfs02/llm/shared/public/lantian/exp
sft_tag=aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47

ultracm_path="${exp_root}/20240501_sft_7b_critique_ultracm_878/${sft_tag}_critic_ultracm/878_hf_ckpt"
autoj_path="${exp_root}/20240501_sft_7b_critique_autoj_26/${sft_tag}_critic_autoj/26_hf_ckpt"

# d4 checkpoints; the run directories differ in the l1/l2/l4 marker (absent for
# the last one) and in the trailing date tag.
d4_5_l1_resumm_path="${exp_root}/20240618_sft_7b_critique_nips2024_d4_st_5_l1_resumm_385_epoch_2_0701/${sft_tag}_FINAL_critic_v4_st_5_l1_resumm/385_hf_ckpt"
d4_5_l2_resumm_path="${exp_root}/20240618_sft_7b_critique_nips2024_d4_st_5_l2_resumm_385_epoch_2_0702/${sft_tag}_FINAL_critic_v4_st_5_l2_resumm/385_hf_ckpt"
d4_5_l4_resumm_path="${exp_root}/20240618_sft_7b_critique_nips2024_d4_st_5_l4_resumm_385_epoch_2_0702/${sft_tag}_FINAL_critic_v4_st_5_l4_resumm/385_hf_ckpt"
d4_5_resumm_path="${exp_root}/20240618_sft_7b_critique_nips2024_d4_st_5_resumm_385_epoch_2_0701/${sft_tag}_FINAL_critic_v4_st_5_resumm/385_hf_ckpt"

base_path="${exp_root}/20240418_aliyun_Ampere_7B_v1_1_FT_v1_0_0_s1_rc48_1660_hf_ckpt"

# Model selection. `models` is reassigned repeatedly further down the file, so
# only the last uncommented assignment reaches the launch loop.
#models=($d4_5_l1_resumm_path $d4_5_l2_resumm_path $d4_5_l4_resumm_path $d4_5_resumm_path)
models=(Themis)
models=("$d4_5_l1_resumm_path")


#####################################################################################################
# metacritique_step_train_exp checkpoints at steps 64 / 128 / 256 / 512 / 1024.
# Each path has the shape
#   <mc_root>/<run>_step_<N>/<critic_v4>_<tag>_feedback/<N>_hf_ckpt
# where <run>/<tag> is one of: our_no_summarization/our, gpt4_feedback/gpt,
# claude_feedback/claude, qwen_feedback/qwen, internlm2_feedback/internlm.
exp_root=/cpfs02/llm/shared/public/lantian/exp
sft_tag=aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47
mc_root="${exp_root}/metacritique_step_train_exp"
critic_v4="${sft_tag}_FINAL_critic_v4_st_5_l1_resumm"

our_feedback_64="${mc_root}/our_no_summarization_step_64/${critic_v4}_our_feedback/64_hf_ckpt"
our_feedback_128="${mc_root}/our_no_summarization_step_128/${critic_v4}_our_feedback/128_hf_ckpt"
our_feedback_256="${mc_root}/our_no_summarization_step_256/${critic_v4}_our_feedback/256_hf_ckpt"
our_feedback_512="${mc_root}/our_no_summarization_step_512/${critic_v4}_our_feedback/512_hf_ckpt"
our_feedback_1024="${mc_root}/our_no_summarization_step_1024/${critic_v4}_our_feedback/1024_hf_ckpt"

gpt_feedback_64="${mc_root}/gpt4_feedback_step_64/${critic_v4}_gpt_feedback/64_hf_ckpt"
gpt_feedback_128="${mc_root}/gpt4_feedback_step_128/${critic_v4}_gpt_feedback/128_hf_ckpt"
gpt_feedback_256="${mc_root}/gpt4_feedback_step_256/${critic_v4}_gpt_feedback/256_hf_ckpt"
gpt_feedback_512="${mc_root}/gpt4_feedback_step_512/${critic_v4}_gpt_feedback/512_hf_ckpt"
gpt_feedback_1024="${mc_root}/gpt4_feedback_step_1024/${critic_v4}_gpt_feedback/1024_hf_ckpt"

claude_feedback_64="${mc_root}/claude_feedback_step_64/${critic_v4}_claude_feedback/64_hf_ckpt"
claude_feedback_128="${mc_root}/claude_feedback_step_128/${critic_v4}_claude_feedback/128_hf_ckpt"
claude_feedback_256="${mc_root}/claude_feedback_step_256/${critic_v4}_claude_feedback/256_hf_ckpt"
claude_feedback_512="${mc_root}/claude_feedback_step_512/${critic_v4}_claude_feedback/512_hf_ckpt"
claude_feedback_1024="${mc_root}/claude_feedback_step_1024/${critic_v4}_claude_feedback/1024_hf_ckpt"

qwen_feedback_64="${mc_root}/qwen_feedback_step_64/${critic_v4}_qwen_feedback/64_hf_ckpt"
qwen_feedback_128="${mc_root}/qwen_feedback_step_128/${critic_v4}_qwen_feedback/128_hf_ckpt"
qwen_feedback_256="${mc_root}/qwen_feedback_step_256/${critic_v4}_qwen_feedback/256_hf_ckpt"
qwen_feedback_512="${mc_root}/qwen_feedback_step_512/${critic_v4}_qwen_feedback/512_hf_ckpt"
qwen_feedback_1024="${mc_root}/qwen_feedback_step_1024/${critic_v4}_qwen_feedback/1024_hf_ckpt"

# Note: the run directory says "internlm2" while the inner directory says "internlm".
internlm2_feedback_64="${mc_root}/internlm2_feedback_step_64/${critic_v4}_internlm_feedback/64_hf_ckpt"
internlm2_feedback_128="${mc_root}/internlm2_feedback_step_128/${critic_v4}_internlm_feedback/128_hf_ckpt"
internlm2_feedback_256="${mc_root}/internlm2_feedback_step_256/${critic_v4}_internlm_feedback/256_hf_ckpt"
internlm2_feedback_512="${mc_root}/internlm2_feedback_step_512/${critic_v4}_internlm_feedback/512_hf_ckpt"
internlm2_feedback_1024="${mc_root}/internlm2_feedback_step_1024/${critic_v4}_internlm_feedback/1024_hf_ckpt"


# Selection for this group (overridden by later `models=` assignments).
#models=($internlm2_feedback_512 $gpt_feedback_512 $our_feedback_512 $qwen_feedback_512 $claude_feedback_512 $internlm2_feedback_256 $gpt_feedback_256 $our_feedback_256)
models=(
    "$qwen_feedback_256"
    "$claude_feedback_256"
    "$internlm2_feedback_128"
    "$gpt_feedback_128"
    "$our_feedback_128"
    "$qwen_feedback_128"
    "$claude_feedback_128"
)
#####################################################################################################
#models=($base_path)


#######################################################################
# d1 / d2 / d3 / d4 series (plus the d12, d13 and d23 checkpoints)
#######################################################################
exp_root=/cpfs02/llm/shared/public/lantian/exp
sft_tag=aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47
# Common stem of every run directory in this section; the dN marker follows it.
run_0705="${exp_root}/20240705_sft_7b_critique_nips2024"
# Common stem of the inner directory; the vN marker follows it.
critic_stem="${sft_tag}_FINAL_critic"

d12_5_l1_resumm_path="${run_0705}_d12_st_5_l1_resumm_step_247_epoch_2/${critic_stem}_v12_st_5_l1_resumm/247_hf_ckpt"
# The doubled "step_step" is part of the original directory name.
d13_5_l1_resumm_path="${run_0705}_d13_st_5_l1_resumm_step_step_273/${critic_stem}_v13_st_5_l1_resumm/273_hf_ckpt"
d23_5_l1_resumm_path="${run_0705}_d23_st_5_l1_resumm_step_253/${critic_stem}_v23_st_5_l1_resumm/253_hf_ckpt"

# d1: variants suffixed 1000 / 2000 / 4000 / 8000, then the unsuffixed run.
d1_5_l1_resumm_1000_path="${run_0705}_d1_st_5_l1_resumm_1000_step_22_epoch_2/${critic_stem}_v1_st_5_l1_resumm_1000/22_hf_ckpt"
d1_5_l1_resumm_2000_path="${run_0705}_d1_st_5_l1_resumm_2000_step_33/${critic_stem}_v1_st_5_l1_resumm_2000/33_hf_ckpt"
d1_5_l1_resumm_4000_path="${run_0705}_d1_st_5_l1_resumm_4000_step_55/${critic_stem}_v1_st_5_l1_resumm_4000/55_hf_ckpt"
d1_5_l1_resumm_8000_path="${run_0705}_d1_st_5_l1_resumm_8000_step_100/${critic_stem}_v1_st_5_l1_resumm_8000/100_hf_ckpt"
d1_5_l1_resumm_path="${run_0705}_d1_st_5_l1_resumm_step_138_epoch_2/${critic_stem}_v1_st_5_l1_resumm/138_hf_ckpt"

# d2
d2_5_l1_resumm_1000_path="${run_0705}_d2_st_5_l1_resumm_1000_step_22/${critic_stem}_v2_st_5_l1_resumm_1000/22_hf_ckpt"
d2_5_l1_resumm_2000_path="${run_0705}_d2_st_5_l1_resumm_2000_step_33/${critic_stem}_v2_st_5_l1_resumm_2000/33_hf_ckpt"
d2_5_l1_resumm_4000_path="${run_0705}_d2_st_5_l1_resumm_4000_step_56/${critic_stem}_v2_st_5_l1_resumm_4000/56_hf_ckpt"
d2_5_l1_resumm_8000_path="${run_0705}_d2_st_5_l1_resumm_8000_step_102/${critic_stem}_v2_st_5_l1_resumm_8000/102_hf_ckpt"
d2_5_l1_resumm_path="${run_0705}_d2_st_5_l1_resumm_step_119/${critic_stem}_v2_st_5_l1_resumm/119_hf_ckpt"

# d3
d3_5_l1_resumm_1000_path="${run_0705}_d3_st_5_l1_resumm_1000_step_23/${critic_stem}_v3_st_5_l1_resumm_1000/23_hf_ckpt"
d3_5_l1_resumm_2000_path="${run_0705}_d3_st_5_l1_resumm_2000_step_34/${critic_stem}_v3_st_5_l1_resumm_2000/34_hf_ckpt"
d3_5_l1_resumm_4000_path="${run_0705}_d3_st_5_l1_resumm_4000_step_58/${critic_stem}_v3_st_5_l1_resumm_4000/58_hf_ckpt"
d3_5_l1_resumm_8000_path="${run_0705}_d3_st_5_l1_resumm_8000_step_105/${critic_stem}_v3_st_5_l1_resumm_8000/105_hf_ckpt"
d3_5_l1_resumm_path="${run_0705}_d3_st_5_l1_resumm_step_145/${critic_stem}_v3_st_5_l1_resumm/145_hf_ckpt"

# d4 (only the suffixed variants are defined in this section)
d4_5_l1_resumm_1000_path="${run_0705}_d4_st_5_l1_resumm_1000_step_42/${critic_stem}_v4_st_5_l1_resumm_1000/42_hf_ckpt"
d4_5_l1_resumm_2000_path="${run_0705}_d4_st_5_l1_resumm_2000_step_75/${critic_stem}_v4_st_5_l1_resumm_2000/75_hf_ckpt"
d4_5_l1_resumm_4000_path="${run_0705}_d4_st_5_l1_resumm_4000_step_139/${critic_stem}_v4_st_5_l1_resumm_4000/139_hf_ckpt"
d4_5_l1_resumm_8000_path="${run_0705}_d4_st_5_l1_resumm_8000_step_268/${critic_stem}_v4_st_5_l1_resumm_8000/268_hf_ckpt"


# Selection for this group (overridden by later `models=` assignments).
models=("$d1_5_l1_resumm_path" "$d2_5_l1_resumm_path" "$d3_5_l1_resumm_path")
#models=($d4_5_l1_resumm_1000_path $d4_5_l1_resumm_2000_path $d4_5_l1_resumm_4000_path $d4_5_l1_resumm_8000_path $d3_5_l1_resumm_1000_path $d3_5_l1_resumm_2000_path $d3_5_l1_resumm_4000_path $d3_5_l1_resumm_8000_path)
#models=($d2_5_l1_resumm_1000_path $d2_5_l1_resumm_2000_path $d2_5_l1_resumm_4000_path $d2_5_l1_resumm_8000_path $d1_5_l1_resumm_1000_path $d1_5_l1_resumm_2000_path $d1_5_l1_resumm_4000_path $d1_5_l1_resumm_8000_path)

#########################################################################################

############################### d12
exp_root=/cpfs02/llm/shared/public/lantian/exp
sft_tag=aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47
# Inner-directory stem shared by all d12 checkpoints.
critic_v12="${sft_tag}_FINAL_critic_v12_st_5_l1_resumm"
step_train_root="${exp_root}/step_train_exp"

d12_5_l1_resumm_1000_path="${step_train_root}/our_d12_1000/${critic_v12}_1000/33_hf_ckpt"
d12_5_l1_resumm_2000_path="${step_train_root}/our_d12_2000/${critic_v12}_2000/56_hf_ckpt"
d12_5_l1_resumm_4000_path="${step_train_root}/our_d12_4000/${critic_v12}_4000/101_hf_ckpt"
d12_5_l1_resumm_8000_path="${step_train_root}/our_d12_8000/${critic_v12}_8000/191_hf_ckpt"
# Same value as the d12_5_l1_resumm_path assignment in the d-series section.
d12_5_l1_resumm_path="${exp_root}/20240705_sft_7b_critique_nips2024_d12_st_5_l1_resumm_step_247_epoch_2/${critic_v12}/247_hf_ckpt"

# Selection for this group (overridden by later `models=` assignments).
# d4_5_l1_resumm_path is assigned near the top of the file.
#models=($d12_5_l1_resumm_1000_path $d12_5_l1_resumm_2000_path $d12_5_l1_resumm_4000_path $d12_5_l1_resumm_8000_path)
models=($d4_5_l1_resumm_path)

##################################################################################
# metacritique_step_train_exp checkpoints at steps 300 / 400 / 500, one trio per
# run family (our_no_summarization, gpt4, claude, qwen, internlm2).
exp_root=/cpfs02/llm/shared/public/lantian/exp
sft_tag=aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47
mc_root="${exp_root}/metacritique_step_train_exp"
critic_v4="${sft_tag}_FINAL_critic_v4_st_5_l1_resumm"

d4_5_l1_resumm_our_step_300_path="${mc_root}/our_no_summarization_step_300/${critic_v4}_our_feedback/300_hf_ckpt"
d4_5_l1_resumm_our_step_400_path="${mc_root}/our_no_summarization_step_400/${critic_v4}_our_feedback/400_hf_ckpt"
d4_5_l1_resumm_our_step_500_path="${mc_root}/our_no_summarization_step_500/${critic_v4}_our_feedback/500_hf_ckpt"

d4_5_l1_resumm_gpt4_step_300_path="${mc_root}/gpt4_feedback_step_300/${critic_v4}_gpt_feedback/300_hf_ckpt"
d4_5_l1_resumm_gpt4_step_400_path="${mc_root}/gpt4_feedback_step_400/${critic_v4}_gpt_feedback/400_hf_ckpt"
d4_5_l1_resumm_gpt4_step_500_path="${mc_root}/gpt4_feedback_step_500/${critic_v4}_gpt_feedback/500_hf_ckpt"

d4_5_l1_resumm_claude_step_300_path="${mc_root}/claude_feedback_step_300/${critic_v4}_claude_feedback/300_hf_ckpt"
d4_5_l1_resumm_claude_step_400_path="${mc_root}/claude_feedback_step_400/${critic_v4}_claude_feedback/400_hf_ckpt"
d4_5_l1_resumm_claude_step_500_path="${mc_root}/claude_feedback_step_500/${critic_v4}_claude_feedback/500_hf_ckpt"

d4_5_l1_resumm_qwen_step_300_path="${mc_root}/qwen_feedback_step_300/${critic_v4}_qwen_feedback/300_hf_ckpt"
d4_5_l1_resumm_qwen_step_400_path="${mc_root}/qwen_feedback_step_400/${critic_v4}_qwen_feedback/400_hf_ckpt"
d4_5_l1_resumm_qwen_step_500_path="${mc_root}/qwen_feedback_step_500/${critic_v4}_qwen_feedback/500_hf_ckpt"

d4_5_l1_resumm_internlm2_step_300_path="${mc_root}/internlm2_feedback_step_300/${critic_v4}_internlm_feedback/300_hf_ckpt"
d4_5_l1_resumm_internlm2_step_400_path="${mc_root}/internlm2_feedback_step_400/${critic_v4}_internlm_feedback/400_hf_ckpt"
d4_5_l1_resumm_internlm2_step_500_path="${mc_root}/internlm2_feedback_step_500/${critic_v4}_internlm_feedback/500_hf_ckpt"

# Selection for this group (overridden by later `models=` assignments).
#models=($d4_5_l1_resumm_claude_step_300_path $d4_5_l1_resumm_claude_step_400_path $d4_5_l1_resumm_qwen_step_300_path $d4_5_l1_resumm_qwen_step_500_path $d4_5_l1_resumm_internlm2_step_300_path $d4_5_l1_resumm_internlm2_step_400_path $d4_5_l1_resumm_internlm2_step_500_path)
models=("$d4_5_l1_resumm_claude_step_500_path" "$d4_5_l1_resumm_qwen_step_400_path")

# our_template_test checkpoints (v2 / v3) and the no_ref checkpoint.
exp_root=/cpfs02/llm/shared/public/lantian/exp
sft_tag=aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47
critic_v4="${sft_tag}_FINAL_critic_v4_st_5_l1_resumm"
template_root="${exp_root}/our_template_test"

d4_5_l1_resumm_v2_path="${template_root}/5_l1_resumm_path/${critic_v4}/384_hf_ckpt"
d4_5_l1_resumm_v3_path="${template_root}/5_l1_resumm_res_after/${critic_v4}/384_hf_ckpt"
# Immediately superseded by the no_ref selection below.
models=("$d4_5_l1_resumm_v3_path")

d4_5_l1_resumm_no_ref_path="${exp_root}/20240618_sft_7b_critique_nips2024_d4_st_5_l1_resumm_no_ref_333_epoch_2_0703/${critic_v4}_no_ref/333_hf_ckpt"
models=("$d4_5_l1_resumm_no_ref_path")


############################################### task ablation
# task_rate checkpoints for rates 0.2 / 0.4 / 0.6 / 0.8 / 1.0. The 1.0 run lives
# in a differently named run directory and inner directory than the others.
exp_root=/cpfs02/llm/shared/public/lantian/exp
sft_tag=aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47
critic_v4="${sft_tag}_FINAL_critic_v4_st_5_l1_resumm"
task_run="${exp_root}/20240705_sft_7b_critique_nips2024_d4_st_5_l1_resumm_task_rate"

d4_5_l1_resumm_task_0_2_path="${task_run}_0_2_step_81/${critic_v4}_task_0.2/81_hf_ckpt"
d4_5_l1_resumm_task_0_4_path="${task_run}_0_4_step_89/${critic_v4}_task_0.4/89_hf_ckpt"
d4_5_l1_resumm_task_0_6_path="${task_run}_0_6_step_93/${critic_v4}_task_0.6/93_hf_ckpt"
d4_5_l1_resumm_task_0_8_path="${task_run}_0_8_step_73/${critic_v4}_task_0.8/73_hf_ckpt"
d4_5_l1_resumm_task_1_0_path="${exp_root}/20240716_d4_5_l1_resumm_task_rate_1_0_step_75/${critic_v4}_task_rate/75_hf_ckpt"

# Selection for this group (overridden by later `models=` assignments).
#models=($d4_5_l1_resumm_task_0_2_path $d4_5_l1_resumm_task_0_4_path $d4_5_l1_resumm_task_0_6_path $d4_5_l1_resumm_task_0_8_path)
models=("$d4_5_l1_resumm_task_1_0_path")


############################## scaling exp
# Defines the 20 variables d<V>_5_l1_resumm_<S>_400_step for
#   V in 1..4 and S in 1000 / 2000 / 4000 / 8000 / full.
# Every path has the shape
#   <scaling_root>/<label>_<S>_step_400/<sft_tag>_FINAL_critic_v<V>_st_5_l1_resumm_<S>/400_hf_ckpt
# where <label> is low (d1), medium (d2), high (d3) or our (d4).
exp_root=/cpfs02/llm/shared/public/lantian/exp
sft_tag=aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47
scaling_root="${exp_root}/scaling_exp"

for _scaling_pair in 1:low 2:medium 3:high 4:our; do
    _scaling_ver=${_scaling_pair%%:*}    # dataset number used in the variable name and vN
    _scaling_label=${_scaling_pair#*:}   # directory label paired with that number
    for _scaling_size in 1000 2000 4000 8000 full; do
        # printf -v assigns to the variable whose name is built from the loop values.
        printf -v "d${_scaling_ver}_5_l1_resumm_${_scaling_size}_400_step" '%s' \
            "${scaling_root}/${_scaling_label}_${_scaling_size}_step_400/${sft_tag}_FINAL_critic_v${_scaling_ver}_st_5_l1_resumm_${_scaling_size}/400_hf_ckpt"
    done
done
# Drop the loop temporaries so only the checkpoint variables remain.
unset _scaling_pair _scaling_ver _scaling_label _scaling_size

# Selection for this group (overridden by later `models=` assignments).
# server1
#models=($d1_5_l1_resumm_full_400_step $d1_5_l1_resumm_1000_400_step $d1_5_l1_resumm_2000_400_step $d1_5_l1_resumm_4000_400_step $d1_5_l1_resumm_8000_400_step $d2_5_l1_resumm_full_400_step $d2_5_l1_resumm_1000_400_step $d2_5_l1_resumm_2000_400_step)
# server2
#models=($d2_5_l1_resumm_4000_400_step $d2_5_l1_resumm_8000_400_step $d3_5_l1_resumm_full_400_step $d3_5_l1_resumm_1000_400_step $d3_5_l1_resumm_2000_400_step $d3_5_l1_resumm_4000_400_step $d3_5_l1_resumm_8000_400_step $d4_5_l1_resumm_full_400_step)
# server3
models=(
    "$d4_5_l1_resumm_1000_400_step"
    "$d4_5_l1_resumm_2000_400_step"
    "$d4_5_l1_resumm_4000_400_step"
    "$d4_5_l1_resumm_8000_400_step"
)


#################### s2 series
exp_root=/cpfs02/llm/shared/public/lantian/exp
sft_tag=aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47
s2_root="${exp_root}/s2_add_critictuning_v01rc1"

s2_add_critictuning="${s2_root}/s2_add_critic_530/${sft_tag}_s2_add_critictuning_v01rc1/530_hf_ckpt"
s2_no_critictuning="${s2_root}/s2_no_critic_344/${sft_tag}_s2_no_critictuning_v01rc1/344_hf_ckpt"
# NOTE(review): the run directory ends in 349 but the checkpoint is 359_hf_ckpt;
# the other s2 entries use matching numbers — confirm this path exists as written.
s2_add_autoj="${s2_root}/s2_add_autoj_critic_349/${sft_tag}_s2_add_critictuning_v01rc3/359_hf_ckpt"
s2_add_ultracm="${s2_root}/s2_add_ultrafeedback_critic_894/${sft_tag}_s2_add_critictuning_v01rc4/894_hf_ckpt"
# Immediately superseded by the debug selection below.
models=("$s2_add_autoj" "$s2_add_ultracm")


# Debug checkpoint (0_hf_ckpt).
d4_st_5_l1_resumm_debug="${exp_root}/20240727_d4_st_5_l1_resumm_debug/${sft_tag}_FINAL_critic_v4_st_5_l1_resumm/0_hf_ckpt"
models=("$d4_st_5_l1_resumm_debug")

####################### rlhf
exp_root=/cpfs02/llm/shared/public/lantian/exp
tos_root="${exp_root}/transfer_from_tos"

# policy_rm_v8 checkpoints; the number before "_hf" is the only varying part.
rm_v8_prefix="${tos_root}/20240820_warmup_80_bsz_64_prompt_len_32768_policy_rm_v8"
rlhf_120_hf="${rm_v8_prefix}_120_hf"
rlhf_160_hf="${rm_v8_prefix}_160_hf"
rlhf_200_hf="${rm_v8_prefix}_200_hf"
rlhf_240_hf="${rm_v8_prefix}_240_hf"
# Immediately superseded by the rm_v7_relabel selection below.
models=("$rlhf_120_hf" "$rlhf_160_hf" "$rlhf_200_hf" "$rlhf_240_hf")

# rm_v7_relabel checkpoints; the trailing number is the only varying part.
relabel_prefix="${tos_root}/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel"
rlhf_v7_relabel_64="${relabel_prefix}_64"
rlhf_v7_relabel_128="${relabel_prefix}_128"
rlhf_v7_relabel_192="${relabel_prefix}_192"
rlhf_v7_relabel_256="${relabel_prefix}_256"
rlhf_v7_relabel_320="${relabel_prefix}_320"
rlhf_v7_relabel_384="${relabel_prefix}_384"
rlhf_v7_relabel_400="${relabel_prefix}_400"
models=(
    "$rlhf_v7_relabel_64"
    "$rlhf_v7_relabel_128"
    "$rlhf_v7_relabel_192"
    "$rlhf_v7_relabel_256"
    "$rlhf_v7_relabel_320"
    "$rlhf_v7_relabel_384"
    "$rlhf_v7_relabel_400"
)



# rm_v7_relabel variants: add_mathcode, rm_reverse, rm_reverse_add_mathcode and
# three one-off checkpoints. All share relabel_prefix; each group's `models`
# assignment is superseded by the next one.
exp_root=/cpfs02/llm/shared/public/lantian/exp
tos_root="${exp_root}/transfer_from_tos"
relabel_prefix="${tos_root}/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel"

rlhf_v7_relabel_add_mathcode_64="${relabel_prefix}_add_mathcode_64"
rlhf_v7_relabel_add_mathcode_96="${relabel_prefix}_add_mathcode_96"
rlhf_v7_relabel_add_mathcode_128="${relabel_prefix}_add_mathcode_128"
rlhf_v7_relabel_add_mathcode_160="${relabel_prefix}_add_mathcode_160"
rlhf_v7_relabel_add_mathcode_192="${relabel_prefix}_add_mathcode_192"
rlhf_v7_relabel_add_mathcode_224="${relabel_prefix}_add_mathcode_224"
models=(
    "$rlhf_v7_relabel_add_mathcode_64"
    "$rlhf_v7_relabel_add_mathcode_96"
    "$rlhf_v7_relabel_add_mathcode_128"
    "$rlhf_v7_relabel_add_mathcode_160"
    "$rlhf_v7_relabel_add_mathcode_192"
    "$rlhf_v7_relabel_add_mathcode_224"
)

rlhf_v7_relabel_rm_reverse_64="${relabel_prefix}_rm_reverse_64"
rlhf_v7_relabel_rm_reverse_96="${relabel_prefix}_rm_reverse_96"
rlhf_v7_relabel_rm_reverse_128="${relabel_prefix}_rm_reverse_128"
rlhf_v7_relabel_rm_reverse_160="${relabel_prefix}_rm_reverse_160"
rlhf_v7_relabel_rm_reverse_192="${relabel_prefix}_rm_reverse_192"
models=(
    "$rlhf_v7_relabel_rm_reverse_64"
    "$rlhf_v7_relabel_rm_reverse_96"
    "$rlhf_v7_relabel_rm_reverse_128"
    "$rlhf_v7_relabel_rm_reverse_160"
    "$rlhf_v7_relabel_rm_reverse_192"
)


rlhf_v7_relabel_rm_reverse_add_mathcode_64="${relabel_prefix}_rm_reverse_add_mathcode_64"
rlhf_v7_relabel_rm_reverse_add_mathcode_96="${relabel_prefix}_rm_reverse_add_mathcode_96"
rlhf_v7_relabel_rm_reverse_add_mathcode_128="${relabel_prefix}_rm_reverse_add_mathcode_128"
rlhf_v7_relabel_rm_reverse_add_mathcode_160="${relabel_prefix}_rm_reverse_add_mathcode_160"
rlhf_v7_relabel_rm_reverse_add_mathcode_192="${relabel_prefix}_rm_reverse_add_mathcode_192"
models=(
    "$rlhf_v7_relabel_rm_reverse_add_mathcode_64"
    "$rlhf_v7_relabel_rm_reverse_add_mathcode_96"
    "$rlhf_v7_relabel_rm_reverse_add_mathcode_128"
    "$rlhf_v7_relabel_rm_reverse_add_mathcode_160"
    "$rlhf_v7_relabel_rm_reverse_add_mathcode_192"
)

rlhf_v7_relabel_rm_reverse_0_4_192="${relabel_prefix}_rm_reverse_0_4_192"
rlhf_v7_relabel_rm_reverse_add_mathcode_0_1_448="${relabel_prefix}_rm_reverse_add_mathcode_0_1_448"
rlhf_v7_relabel_rm_reverse_0_8_128="${relabel_prefix}_rm_reverse_0_8_128"
models=(
    "$rlhf_v7_relabel_rm_reverse_0_4_192"
    "$rlhf_v7_relabel_rm_reverse_add_mathcode_0_1_448"
    "$rlhf_v7_relabel_rm_reverse_0_8_128"
)

##################### 0903
# rm_reverse_add_mathcode checkpoints with a 0_2 / 0_4 / 0_8 marker followed by
# a trailing number. The variable names abbreviate
# "rm_reverse_add_mathcode_0_X" to "rm_amc_0X".
exp_root=/cpfs02/llm/shared/public/lantian/exp
tos_root="${exp_root}/transfer_from_tos"
amc_prefix="${tos_root}/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel_rm_reverse_add_mathcode"

rlhf_v7_relabel_rm_amc_02_48="${amc_prefix}_0_2_48"
rlhf_v7_relabel_rm_amc_02_64="${amc_prefix}_0_2_64"
rlhf_v7_relabel_rm_amc_02_128="${amc_prefix}_0_2_128"
rlhf_v7_relabel_rm_amc_02_192="${amc_prefix}_0_2_192"
rlhf_v7_relabel_rm_amc_02_256="${amc_prefix}_0_2_256"

rlhf_v7_relabel_rm_amc_04_64="${amc_prefix}_0_4_64"
rlhf_v7_relabel_rm_amc_04_128="${amc_prefix}_0_4_128"
rlhf_v7_relabel_rm_amc_04_192="${amc_prefix}_0_4_192"
rlhf_v7_relabel_rm_amc_04_256="${amc_prefix}_0_4_256"
rlhf_v7_relabel_rm_amc_04_320="${amc_prefix}_0_4_320"

rlhf_v7_relabel_rm_amc_08_64="${amc_prefix}_0_8_64"
rlhf_v7_relabel_rm_amc_08_96="${amc_prefix}_0_8_96"
rlhf_v7_relabel_rm_amc_08_128="${amc_prefix}_0_8_128"
rlhf_v7_relabel_rm_amc_08_160="${amc_prefix}_0_8_160"

# First batch of eight; replaced right away by the second batch of six.
models=(
    "$rlhf_v7_relabel_rm_amc_02_48"
    "$rlhf_v7_relabel_rm_amc_02_64"
    "$rlhf_v7_relabel_rm_amc_02_128"
    "$rlhf_v7_relabel_rm_amc_02_192"
    "$rlhf_v7_relabel_rm_amc_02_256"
    "$rlhf_v7_relabel_rm_amc_04_64"
    "$rlhf_v7_relabel_rm_amc_04_128"
    "$rlhf_v7_relabel_rm_amc_04_192"
)
models=(
    "$rlhf_v7_relabel_rm_amc_04_256"
    "$rlhf_v7_relabel_rm_amc_04_320"
    "$rlhf_v7_relabel_rm_amc_08_64"
    "$rlhf_v7_relabel_rm_amc_08_96"
    "$rlhf_v7_relabel_rm_amc_08_128"
    "$rlhf_v7_relabel_rm_amc_08_160"
)

# Local model directories for further evaluation candidates.
internlm2_5_7b_chat='/cpfs02/llm/shared/public/lantian/exp/internlm2_5/s1_d4_st_5_l1_resumm_20240906_internlm2_5_7b_s1/aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47_s1_d4_st_5_l1_resumm_20240906_internlm2_5_7b_s1/385_hf_ckpt'
llama3_1_8b_instruct='/cpfs01/shared/public/llmeval/model_weights/hf_hub/models--meta-llama--Meta-Llama-3.1-8B-Instruct/snapshots/5206a32e0bd3067aef1ce90f5528ade7d866253f'
llama3_1_70b_instruct='/cpfs01/shared/public/llmeval/model_weights/hf_hub/models--meta-llama--Meta-Llama-3.1-70B-Instruct/snapshots/846357c7ee5e3f50575fd4294edb3d898c8ea100'
qwen2_7b_instruct='/cpfs01/shared/public/llmeval/model_weights/hf_hub/models--Qwen--Qwen2-7B-Instruct/snapshots/f2826a00ceef68f0f2b946d945ecc0477ce4450c'
qwen2_72b_instruct='/cpfs02/llm/shared/public/lantian/hf_models/Qwen/Qwen2-72B-Instruct'

# Selection toggles: commented lines are disabled alternatives. Of the active
# assignments, the later one replaces the earlier one.
#models=($internlm2_5_7b_chat "qwen2-7b-instruct" "llama-3.1-8b-instruct" "llama-3.1-70b-instruct")
#models=($llama3_1_8b_instruct $qwen2_7b_instruct)
models=("$qwen2_72b_instruct")
#models=($llama3_1_70b_instruct)
models=(
    '/cpfs02/llm/shared/public/lantian/exp/202409_13_d4_st_5_l1_resumm_mix_mathcode_with_criteria_s1_model/aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47_FINAL_critic_v4_st_5_l1_resumm/300_hf'
)

# TIGERScore-7B model directory.
tigerscore_path='/cpfs02/llm/shared/public/lantian/hf_models/TIGER-Lab/TIGERScore-7B'

# Successive `models` selections; each assignment replaces the one before it,
# so the two-entry `with_reference` list at the bottom is the value left in
# `models` when this section ends.
models=("$tigerscore_path")
#models=(/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_4_mathcode_no_reference_256 /cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_6_mathcode_no_reference_160)
models=(
    '/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_4_mathcode_no_reference_256'
    '/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_6_mathcode_no_reference_160'
    '/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_8_mathcode_no_reference_96'
)
models=(
    '/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_1_0_mathcode_no_reference_144'
)
models=(
    '/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_2_mathcode_with_reference_128'
    '/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_2_mathcode_with_reference_256'
)

#######################################
# Launch one background `evaluate.py` run per entry of `models`, then wait for
# every run and report how it ended.
# Globals:   models (read) - array of critic model paths/names to evaluate
# Outputs:   progress lines on stdout; a failure line per failed run on stderr
# Returns:   0 if every evaluation exited successfully, 1 otherwise
#######################################
launch_evaluations() {
    local gpu_offset=0 # added to the array index to choose the GPU id
    local -a job_pids=() job_models=()
    local idx gpu model status=0

    # Walk the indices that actually exist in `models` instead of a fixed
    # `seq 0 1`, so the loop always matches the length of the list.
    for idx in "${!models[@]}"; do
        model=${models[$idx]}
        gpu=$((idx + gpu_offset))
        #gpu="0,1,2,3,4,5,6,7"
        echo "Evaluate for model: " "$model" "on GPU[$gpu]"
        # prompt_type: fs, zs-crit-cot, zs-crit-ao-1
        CUDA_VISIBLE_DEVICES=$gpu python evaluate.py --available_gpus "$gpu" --tasks Q --hf_critic_model "$model" --prompt_type zs-crit-cot --enable_code_execution --output_dir 20240823_rlhf_relabel &
        # Remember the job so its exit status can be collected below.
        job_pids+=("$!")
        job_models+=("$model")
        ## only for internlm2-7b-chat or internlm2-20b-chat
        #CUDA_VISIBLE_DEVICES=$gpu python evaluate.py --available_gpus $gpu --tasks Q --hf_model $model --prompt_type zs-crit-cot --enable_code_execution --output_dir 20240823_rlhf_relabel
    done

    # Only announce completion once the background job has really finished;
    # a non-zero exit is reported on stderr and reflected in the return code.
    for idx in "${!job_pids[@]}"; do
        if wait "${job_pids[$idx]}"; then
            echo "[!] inference ${job_models[$idx]} over"
        else
            echo "[!] inference ${job_models[$idx]} failed" >&2
            status=1
        fi
    done
    return "$status"
}

launch_evaluations
