#!/bin/bash

# rm_v9_from_pretrained family. The numeric suffix of each variable mirrors the
# numeric tag in its directory name (presumably a training step -- confirm).
ckpt_prefix=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v9_from_pretrained
rlhf_v9_from_pretrained_64="${ckpt_prefix}_64_hf"
rlhf_v9_from_pretrained_128="${ckpt_prefix}_128_hf"
rlhf_v9_from_pretrained_192="${ckpt_prefix}_192_hf"
rlhf_v9_from_pretrained_256="${ckpt_prefix}_256_hf"
rlhf_v9_from_pretrained_320="${ckpt_prefix}_320_hf"
# NOTE: `models` is assigned again further down this file; the last assignment wins.
# Elements are quoted so a path is never word-split or glob-expanded.
models=(
  "$rlhf_v9_from_pretrained_64"
  "$rlhf_v9_from_pretrained_128"
  "$rlhf_v9_from_pretrained_192"
  "$rlhf_v9_from_pretrained_256"
  "$rlhf_v9_from_pretrained_320"
)

# rm_v8_time_2 family. Unlike most other families in this file, the directory
# names carry `_hf` *before* the numeric tag.
ckpt_prefix=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v8_time_2_hf
rlhf_v8_time_2_64="${ckpt_prefix}_64"
rlhf_v8_time_2_96="${ckpt_prefix}_96"
rlhf_v8_time_2_128="${ckpt_prefix}_128"
rlhf_v8_time_2_160="${ckpt_prefix}_160"
# NOTE: `models` is assigned again further down this file; the last assignment wins.
models=(
  "$rlhf_v8_time_2_64"
  "$rlhf_v8_time_2_96"
  "$rlhf_v8_time_2_128"
  "$rlhf_v8_time_2_160"
)


# Earlier value of rlhf_v7_40_120, kept for reference:
#rlhf_v7_40_120=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240820_warmup_40_bsz_16_1_1_prompt_len_32768_policy_rm_v7_96_hf/
rlhf_v7_40_120=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240820_warmup_40_bsz_64_prompt_len_32768_policy_120_hf

# rm_v7_relabel family; variable suffix mirrors the numeric tag in the directory name.
ckpt_prefix=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel
rlhf_v7_relabel_64="${ckpt_prefix}_64"
rlhf_v7_relabel_128="${ckpt_prefix}_128"
rlhf_v7_relabel_192="${ckpt_prefix}_192"
rlhf_v7_relabel_256="${ckpt_prefix}_256"
rlhf_v7_relabel_320="${ckpt_prefix}_320"
rlhf_v7_relabel_384="${ckpt_prefix}_384"
rlhf_v7_relabel_400="${ckpt_prefix}_400"
# Only the three highest-numbered entries are selected here.
# NOTE: `models` is assigned again further down this file; the last assignment wins.
models=(
  "$rlhf_v7_relabel_320"
  "$rlhf_v7_relabel_384"
  "$rlhf_v7_relabel_400"
)

# rm_v7_relabel_add_mathcode family; variable suffix mirrors the numeric tag in
# the directory name.
ckpt_prefix=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel_add_mathcode
rlhf_v7_relabel_add_mathcode_64="${ckpt_prefix}_64"
rlhf_v7_relabel_add_mathcode_96="${ckpt_prefix}_96"
rlhf_v7_relabel_add_mathcode_128="${ckpt_prefix}_128"
rlhf_v7_relabel_add_mathcode_160="${ckpt_prefix}_160"
rlhf_v7_relabel_add_mathcode_192="${ckpt_prefix}_192"
rlhf_v7_relabel_add_mathcode_224="${ckpt_prefix}_224"
# NOTE: `models` is assigned again further down this file; the last assignment wins.
models=(
  "$rlhf_v7_relabel_add_mathcode_64"
  "$rlhf_v7_relabel_add_mathcode_96"
  "$rlhf_v7_relabel_add_mathcode_128"
  "$rlhf_v7_relabel_add_mathcode_160"
  "$rlhf_v7_relabel_add_mathcode_192"
  "$rlhf_v7_relabel_add_mathcode_224"
)


# rm_v7_relabel_rm_reverse family; variable suffix mirrors the numeric tag in
# the directory name.
ckpt_prefix=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel_rm_reverse
rlhf_v7_relabel_rm_reverse_64="${ckpt_prefix}_64"
rlhf_v7_relabel_rm_reverse_96="${ckpt_prefix}_96"
rlhf_v7_relabel_rm_reverse_128="${ckpt_prefix}_128"
rlhf_v7_relabel_rm_reverse_160="${ckpt_prefix}_160"
rlhf_v7_relabel_rm_reverse_192="${ckpt_prefix}_192"
# NOTE: `models` is assigned again further down this file; the last assignment wins.
models=(
  "$rlhf_v7_relabel_rm_reverse_64"
  "$rlhf_v7_relabel_rm_reverse_96"
  "$rlhf_v7_relabel_rm_reverse_128"
  "$rlhf_v7_relabel_rm_reverse_160"
  "$rlhf_v7_relabel_rm_reverse_192"
)

# rm_v7_relabel_rm_reverse_add_mathcode family; variable suffix mirrors the
# numeric tag in the directory name.
ckpt_prefix=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel_rm_reverse_add_mathcode
rlhf_v7_relabel_rm_reverse_add_mathcode_64="${ckpt_prefix}_64"
rlhf_v7_relabel_rm_reverse_add_mathcode_96="${ckpt_prefix}_96"
rlhf_v7_relabel_rm_reverse_add_mathcode_128="${ckpt_prefix}_128"
rlhf_v7_relabel_rm_reverse_add_mathcode_160="${ckpt_prefix}_160"
rlhf_v7_relabel_rm_reverse_add_mathcode_192="${ckpt_prefix}_192"
# Full-family selection, currently disabled:
#models=($rlhf_v7_relabel_rm_reverse_add_mathcode_64 $rlhf_v7_relabel_rm_reverse_add_mathcode_96 $rlhf_v7_relabel_rm_reverse_add_mathcode_128 $rlhf_v7_relabel_rm_reverse_add_mathcode_160 $rlhf_v7_relabel_rm_reverse_add_mathcode_192)
# Active selection: only the last two entries.
# NOTE: `models` is assigned again further down this file; the last assignment wins.
models=(
  "$rlhf_v7_relabel_rm_reverse_add_mathcode_160"
  "$rlhf_v7_relabel_rm_reverse_add_mathcode_192"
)


# rm_v7_relabel_from_pretrained family (`fp` in the variable names abbreviates
# the `from_pretrained` part of the directory names).
ckpt_prefix=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel_from_pretrained
rlhf_v7_relabel_fp_64="${ckpt_prefix}_64"
rlhf_v7_relabel_fp_96="${ckpt_prefix}_96"
rlhf_v7_relabel_fp_128="${ckpt_prefix}_128"
rlhf_v7_relabel_fp_160="${ckpt_prefix}_160"
rlhf_v7_relabel_fp_192="${ckpt_prefix}_192"
# NOTE: `models` is assigned again further down this file; the last assignment wins.
models=(
  "$rlhf_v7_relabel_fp_64"
  "$rlhf_v7_relabel_fp_96"
  "$rlhf_v7_relabel_fp_128"
  "$rlhf_v7_relabel_fp_160"
  "$rlhf_v7_relabel_fp_192"
)

# rm_v7_relabel_add_mathcode_from_pretrained family (`fp_amc` in the variable
# names abbreviates `add_mathcode_from_pretrained` in the directory names).
ckpt_prefix=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel_add_mathcode_from_pretrained
rlhf_v7_relabel_fp_amc_64="${ckpt_prefix}_64"
rlhf_v7_relabel_fp_amc_128="${ckpt_prefix}_128"
rlhf_v7_relabel_fp_amc_192="${ckpt_prefix}_192"
rlhf_v7_relabel_fp_amc_256="${ckpt_prefix}_256"
rlhf_v7_relabel_fp_amc_320="${ckpt_prefix}_320"
rlhf_v7_relabel_fp_amc_384="${ckpt_prefix}_384"
rlhf_v7_relabel_fp_amc_448="${ckpt_prefix}_448"
rlhf_v7_relabel_fp_amc_500="${ckpt_prefix}_500"
# NOTE: `models` is assigned again further down this file; the last assignment wins.
models=(
  "$rlhf_v7_relabel_fp_amc_64"
  "$rlhf_v7_relabel_fp_amc_128"
  "$rlhf_v7_relabel_fp_amc_192"
  "$rlhf_v7_relabel_fp_amc_256"
  "$rlhf_v7_relabel_fp_amc_320"
  "$rlhf_v7_relabel_fp_amc_384"
  "$rlhf_v7_relabel_fp_amc_448"
  "$rlhf_v7_relabel_fp_amc_500"
)

# rm_v7_relabel_rm_reverse_from_pretrained family (`fp_rr` in the variable
# names abbreviates `rm_reverse_from_pretrained` in the directory names).
ckpt_prefix=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel_rm_reverse_from_pretrained
rlhf_v7_relabel_fp_rr_64="${ckpt_prefix}_64"
rlhf_v7_relabel_fp_rr_96="${ckpt_prefix}_96"
rlhf_v7_relabel_fp_rr_128="${ckpt_prefix}_128"
rlhf_v7_relabel_fp_rr_160="${ckpt_prefix}_160"
rlhf_v7_relabel_fp_rr_192="${ckpt_prefix}_192"
rlhf_v7_relabel_fp_rr_224="${ckpt_prefix}_224"
# The first element, rlhf_v7_relabel_fp_amc_500, belongs to a different family
# and is defined earlier in this file.
# NOTE: `models` is assigned again further down this file; the last assignment wins.
models=(
  "$rlhf_v7_relabel_fp_amc_500"
  "$rlhf_v7_relabel_fp_rr_64"
  "$rlhf_v7_relabel_fp_rr_96"
  "$rlhf_v7_relabel_fp_rr_128"
  "$rlhf_v7_relabel_fp_rr_160"
  "$rlhf_v7_relabel_fp_rr_192"
  "$rlhf_v7_relabel_fp_rr_224"
)

# rm_v7_relabel_rm_reverse_add_mathcode_from_pretrained family (`fp_rr_amc` in
# the variable names abbreviates that directory-name suffix).
ckpt_prefix=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel_rm_reverse_add_mathcode_from_pretrained
rlhf_v7_relabel_fp_rr_amc_64="${ckpt_prefix}_64"
rlhf_v7_relabel_fp_rr_amc_96="${ckpt_prefix}_96"
rlhf_v7_relabel_fp_rr_amc_128="${ckpt_prefix}_128"
rlhf_v7_relabel_fp_rr_amc_160="${ckpt_prefix}_160"
# Only the last two entries are selected.
# NOTE: `models` is assigned again further down this file; the last assignment wins.
models=(
  "$rlhf_v7_relabel_fp_rr_amc_128"
  "$rlhf_v7_relabel_fp_rr_amc_160"
)


# re-inference
# rlhf_v7_relabel_add_mathcode_192 is re-assigned here with the same value it
# receives earlier in this file, so this section does not depend on that one.
rlhf_v7_relabel_add_mathcode_192=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel_add_mathcode_192
d4_st_5_l1_resumm=/cpfs02/llm/shared/public/lantian/exp/20240618_sft_7b_critique_nips2024_d4_st_5_l1_resumm_385_epoch_2_0701/aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47_FINAL_critic_v4_st_5_l1_resumm/385_hf_ckpt
# NOTE: `models` is assigned again further down this file; the last assignment wins.
# Elements are quoted so a path is never word-split or glob-expanded.
models=(
  "$rlhf_v7_relabel_add_mathcode_192"
  "$d4_st_5_l1_resumm"
)

# rm_v7_relabel_rm_reverse_0_2 and _0_4 families. In the variable names `rr`
# abbreviates `rm_reverse`, and `02` / `04` stand for the `0_2` / `0_4` tags in
# the directory names.
ckpt_prefix=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel_rm_reverse
rlhf_v7_relabel_rr_02_48="${ckpt_prefix}_0_2_48"
rlhf_v7_relabel_rr_02_64="${ckpt_prefix}_0_2_64"
rlhf_v7_relabel_rr_02_96="${ckpt_prefix}_0_2_96"
rlhf_v7_relabel_rr_02_128="${ckpt_prefix}_0_2_128"
rlhf_v7_relabel_rr_04_64="${ckpt_prefix}_0_4_64"
rlhf_v7_relabel_rr_04_96="${ckpt_prefix}_0_4_96"
rlhf_v7_relabel_rr_04_128="${ckpt_prefix}_0_4_128"
rlhf_v7_relabel_rr_04_160="${ckpt_prefix}_0_4_160"
rlhf_v7_relabel_rr_04_192="${ckpt_prefix}_0_4_192"
rlhf_v7_relabel_rr_04_224="${ckpt_prefix}_0_4_224"
# Alternative selections, currently disabled:
#models=($rlhf_v7_relabel_rr_02_48 $rlhf_v7_relabel_rr_02_64 $rlhf_v7_relabel_rr_02_96 $rlhf_v7_relabel_rr_02_128 $rlhf_v7_relabel_rr_04_64 $rlhf_v7_relabel_rr_04_96 $rlhf_v7_relabel_rr_04_128 $rlhf_v7_relabel_rr_04_160 $rlhf_v7_relabel_rr_04_192 $rlhf_v7_relabel_rr_04_224)
#models=($rlhf_v7_relabel_rr_02_48 $rlhf_v7_relabel_rr_02_64 $rlhf_v7_relabel_rr_02_96 $rlhf_v7_relabel_rr_02_128 $rlhf_v7_relabel_rr_04_64 $rlhf_v7_relabel_rr_04_96 $rlhf_v7_relabel_rr_04_128 $rlhf_v7_relabel_rr_04_160)
# Active selection: the two entries missing from the second disabled list above.
# NOTE: `models` is assigned again further down this file; the last assignment wins.
models=(
  "$rlhf_v7_relabel_rr_04_192"
  "$rlhf_v7_relabel_rr_04_224"
)


# rm_v7_relabel_rm_reverse_0_1 family (`rr_01` in the variable names stands for
# `rm_reverse_0_1` in the directory names).
ckpt_prefix=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel_rm_reverse_0_1
rlhf_v7_relabel_rr_01_64="${ckpt_prefix}_64"
rlhf_v7_relabel_rr_01_96="${ckpt_prefix}_96"
rlhf_v7_relabel_rr_01_128="${ckpt_prefix}_128"
rlhf_v7_relabel_rr_01_160="${ckpt_prefix}_160"
# NOTE: `models` is assigned again further down this file; the last assignment wins.
models=(
  "$rlhf_v7_relabel_rr_01_64"
  "$rlhf_v7_relabel_rr_01_96"
  "$rlhf_v7_relabel_rr_01_128"
  "$rlhf_v7_relabel_rr_01_160"
)

# rm_v7_relabel_rm_reverse_0_8 family (`rr_08` in the variable names stands for
# `rm_reverse_0_8` in the directory names).
ckpt_prefix=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel_rm_reverse_0_8
rlhf_v7_relabel_rr_08_64="${ckpt_prefix}_64"
rlhf_v7_relabel_rr_08_128="${ckpt_prefix}_128"
rlhf_v7_relabel_rr_08_192="${ckpt_prefix}_192"
rlhf_v7_relabel_rr_08_256="${ckpt_prefix}_256"
rlhf_v7_relabel_rr_08_320="${ckpt_prefix}_320"
rlhf_v7_relabel_rr_08_384="${ckpt_prefix}_384"
rlhf_v7_relabel_rr_08_448="${ckpt_prefix}_448"
rlhf_v7_relabel_rr_08_500="${ckpt_prefix}_500"
# NOTE: `models` is assigned again further down this file; the last assignment wins.
models=(
  "$rlhf_v7_relabel_rr_08_64"
  "$rlhf_v7_relabel_rr_08_128"
  "$rlhf_v7_relabel_rr_08_192"
  "$rlhf_v7_relabel_rr_08_256"
  "$rlhf_v7_relabel_rr_08_320"
  "$rlhf_v7_relabel_rr_08_384"
  "$rlhf_v7_relabel_rr_08_448"
  "$rlhf_v7_relabel_rr_08_500"
)

# rm_v7_relabel_rm_reverse_add_mathcode_0_1 family (`rr_amc_01` in the variable
# names stands for `rm_reverse_add_mathcode_0_1` in the directory names).
ckpt_prefix=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel_rm_reverse_add_mathcode_0_1
rlhf_v7_relabel_rr_amc_01_64="${ckpt_prefix}_64"
rlhf_v7_relabel_rr_amc_01_128="${ckpt_prefix}_128"
rlhf_v7_relabel_rr_amc_01_192="${ckpt_prefix}_192"
rlhf_v7_relabel_rr_amc_01_256="${ckpt_prefix}_256"
rlhf_v7_relabel_rr_amc_01_320="${ckpt_prefix}_320"
rlhf_v7_relabel_rr_amc_01_384="${ckpt_prefix}_384"
rlhf_v7_relabel_rr_amc_01_448="${ckpt_prefix}_448"
rlhf_v7_relabel_rr_amc_01_500="${ckpt_prefix}_500"
# NOTE: `models` is assigned again further down this file; the last assignment wins.
models=(
  "$rlhf_v7_relabel_rr_amc_01_64"
  "$rlhf_v7_relabel_rr_amc_01_128"
  "$rlhf_v7_relabel_rr_amc_01_192"
  "$rlhf_v7_relabel_rr_amc_01_256"
  "$rlhf_v7_relabel_rr_amc_01_320"
  "$rlhf_v7_relabel_rr_amc_01_384"
  "$rlhf_v7_relabel_rr_amc_01_448"
  "$rlhf_v7_relabel_rr_amc_01_500"
)

# rm_v7_relabel_rm_reverse_add_mathcode_0_2 / _0_4 / _0_8 families. In the
# variable names `02` / `04` / `08` stand for the `0_2` / `0_4` / `0_8` tags in
# the directory names.
ckpt_prefix=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel_rm_reverse_add_mathcode
rlhf_v7_relabel_rm_amc_02_48="${ckpt_prefix}_0_2_48"
rlhf_v7_relabel_rm_amc_02_64="${ckpt_prefix}_0_2_64"
rlhf_v7_relabel_rm_amc_02_128="${ckpt_prefix}_0_2_128"
rlhf_v7_relabel_rm_amc_02_192="${ckpt_prefix}_0_2_192"
rlhf_v7_relabel_rm_amc_02_256="${ckpt_prefix}_0_2_256"

rlhf_v7_relabel_rm_amc_04_64="${ckpt_prefix}_0_4_64"
rlhf_v7_relabel_rm_amc_04_128="${ckpt_prefix}_0_4_128"
rlhf_v7_relabel_rm_amc_04_192="${ckpt_prefix}_0_4_192"
rlhf_v7_relabel_rm_amc_04_256="${ckpt_prefix}_0_4_256"
rlhf_v7_relabel_rm_amc_04_320="${ckpt_prefix}_0_4_320"

rlhf_v7_relabel_rm_amc_08_64="${ckpt_prefix}_0_8_64"
rlhf_v7_relabel_rm_amc_08_96="${ckpt_prefix}_0_8_96"
rlhf_v7_relabel_rm_amc_08_128="${ckpt_prefix}_0_8_128"
rlhf_v7_relabel_rm_amc_08_160="${ckpt_prefix}_0_8_160"

# First batch. It used to be a live assignment that the next one overwrote
# immediately, so it is commented out here like the other batch toggles in
# this file; uncomment it (and disable the batch below) to run it.
#models=($rlhf_v7_relabel_rm_amc_02_48 $rlhf_v7_relabel_rm_amc_02_64 $rlhf_v7_relabel_rm_amc_02_128 $rlhf_v7_relabel_rm_amc_02_192 $rlhf_v7_relabel_rm_amc_02_256 $rlhf_v7_relabel_rm_amc_04_64 $rlhf_v7_relabel_rm_amc_04_128 $rlhf_v7_relabel_rm_amc_04_192)
# Second batch (active).
# NOTE: `models` is assigned again further down this file; the last assignment wins.
models=(
  "$rlhf_v7_relabel_rm_amc_04_256"
  "$rlhf_v7_relabel_rm_amc_04_320"
  "$rlhf_v7_relabel_rm_amc_08_64"
  "$rlhf_v7_relabel_rm_amc_08_96"
  "$rlhf_v7_relabel_rm_amc_08_128"
  "$rlhf_v7_relabel_rm_amc_08_160"
)

###
# rm_v7_relabel_add_mul_4_rm_reverse_0_0 family. Note that the variable names
# omit the `relabel` component that is present in the directory names.
ckpt_prefix=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel_add_mul_4_rm_reverse_0_0
rlhf_v7_add_mul_4_rm_reverse_0_0_64="${ckpt_prefix}_64"
rlhf_v7_add_mul_4_rm_reverse_0_0_96="${ckpt_prefix}_96"
rlhf_v7_add_mul_4_rm_reverse_0_0_128="${ckpt_prefix}_128"
rlhf_v7_add_mul_4_rm_reverse_0_0_160="${ckpt_prefix}_160"
# NOTE: `models` is assigned again further down this file; the last assignment wins.
models=(
  "$rlhf_v7_add_mul_4_rm_reverse_0_0_64"
  "$rlhf_v7_add_mul_4_rm_reverse_0_0_96"
  "$rlhf_v7_add_mul_4_rm_reverse_0_0_128"
  "$rlhf_v7_add_mul_4_rm_reverse_0_0_160"
)

# rm_v7_relabel_add_mul_4_rm_reverse_0_0_add_mathcode family; variable suffix
# mirrors the numeric tag in the directory name.
ckpt_prefix=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel_add_mul_4_rm_reverse_0_0_add_mathcode
rlhf_v7_add_mul_4_rm_reverse_0_0_add_mathcode_64="${ckpt_prefix}_64"
rlhf_v7_add_mul_4_rm_reverse_0_0_add_mathcode_96="${ckpt_prefix}_96"
rlhf_v7_add_mul_4_rm_reverse_0_0_add_mathcode_128="${ckpt_prefix}_128"
rlhf_v7_add_mul_4_rm_reverse_0_0_add_mathcode_160="${ckpt_prefix}_160"
# NOTE: `models` is assigned again further down this file; the last assignment wins.
models=(
  "$rlhf_v7_add_mul_4_rm_reverse_0_0_add_mathcode_64"
  "$rlhf_v7_add_mul_4_rm_reverse_0_0_add_mathcode_96"
  "$rlhf_v7_add_mul_4_rm_reverse_0_0_add_mathcode_128"
  "$rlhf_v7_add_mul_4_rm_reverse_0_0_add_mathcode_160"
)

# rm_v7_relabel_add_mul_4_rm_reverse_0_1_add_mathcode family; variable suffix
# mirrors the numeric tag in the directory name.
ckpt_prefix=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel_add_mul_4_rm_reverse_0_1_add_mathcode
rlhf_v7_add_mul_4_rm_reverse_0_1_add_mathcode_64="${ckpt_prefix}_64"
rlhf_v7_add_mul_4_rm_reverse_0_1_add_mathcode_128="${ckpt_prefix}_128"
rlhf_v7_add_mul_4_rm_reverse_0_1_add_mathcode_192="${ckpt_prefix}_192"
rlhf_v7_add_mul_4_rm_reverse_0_1_add_mathcode_256="${ckpt_prefix}_256"
rlhf_v7_add_mul_4_rm_reverse_0_1_add_mathcode_320="${ckpt_prefix}_320"
rlhf_v7_add_mul_4_rm_reverse_0_1_add_mathcode_384="${ckpt_prefix}_384"
rlhf_v7_add_mul_4_rm_reverse_0_1_add_mathcode_448="${ckpt_prefix}_448"
rlhf_v7_add_mul_4_rm_reverse_0_1_add_mathcode_500="${ckpt_prefix}_500"
# NOTE: `models` is assigned again further down this file; the last assignment wins.
models=(
  "$rlhf_v7_add_mul_4_rm_reverse_0_1_add_mathcode_64"
  "$rlhf_v7_add_mul_4_rm_reverse_0_1_add_mathcode_128"
  "$rlhf_v7_add_mul_4_rm_reverse_0_1_add_mathcode_192"
  "$rlhf_v7_add_mul_4_rm_reverse_0_1_add_mathcode_256"
  "$rlhf_v7_add_mul_4_rm_reverse_0_1_add_mathcode_320"
  "$rlhf_v7_add_mul_4_rm_reverse_0_1_add_mathcode_384"
  "$rlhf_v7_add_mul_4_rm_reverse_0_1_add_mathcode_448"
  "$rlhf_v7_add_mul_4_rm_reverse_0_1_add_mathcode_500"
)
# rm_v7_relabel_add_mul_4_rm_reverse_0_2_add_mathcode family; variable suffix
# mirrors the numeric tag in the directory name.
ckpt_prefix=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel_add_mul_4_rm_reverse_0_2_add_mathcode
rlhf_v7_add_mul_4_rm_reverse_0_2_add_mathcode_64="${ckpt_prefix}_64"
rlhf_v7_add_mul_4_rm_reverse_0_2_add_mathcode_96="${ckpt_prefix}_96"
rlhf_v7_add_mul_4_rm_reverse_0_2_add_mathcode_128="${ckpt_prefix}_128"
rlhf_v7_add_mul_4_rm_reverse_0_2_add_mathcode_160="${ckpt_prefix}_160"
rlhf_v7_add_mul_4_rm_reverse_0_2_add_mathcode_192="${ckpt_prefix}_192"
# NOTE: `models` is assigned again further down this file; the last assignment wins.
models=(
  "$rlhf_v7_add_mul_4_rm_reverse_0_2_add_mathcode_64"
  "$rlhf_v7_add_mul_4_rm_reverse_0_2_add_mathcode_96"
  "$rlhf_v7_add_mul_4_rm_reverse_0_2_add_mathcode_128"
  "$rlhf_v7_add_mul_4_rm_reverse_0_2_add_mathcode_160"
  "$rlhf_v7_add_mul_4_rm_reverse_0_2_add_mathcode_192"
)


##### internlm2_5 baseline
# Single-entry selection; the path lives outside the transfer_from_tos tree
# used by most other entries in this file.
internlm2_5_baseline=/cpfs02/llm/shared/public/lantian/exp/internlm2_5/s1_d4_st_5_l1_resumm_20240906_internlm2_5_7b_s1/aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47_s1_d4_st_5_l1_resumm_20240906_internlm2_5_7b_s1/385_hf_ckpt
# NOTE: `models` is assigned again further down this file; the last assignment wins.
# The element is quoted so the path is never word-split or glob-expanded.
models=("$internlm2_5_baseline")


# rm_v7_relabel_add_mul_4_rm_reverse families: plain 0_4, plain 0_8, and
# 0_4_add_mathcode. Variable suffixes mirror the tags in the directory names.
ckpt_prefix=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel_add_mul_4_rm_reverse
rlhf_v7_add_mul_4_rm_reverse_0_4_64="${ckpt_prefix}_0_4_64"
rlhf_v7_add_mul_4_rm_reverse_0_4_96="${ckpt_prefix}_0_4_96"
rlhf_v7_add_mul_4_rm_reverse_0_4_128="${ckpt_prefix}_0_4_128"

rlhf_v7_add_mul_4_rm_reverse_0_8_64="${ckpt_prefix}_0_8_64"
rlhf_v7_add_mul_4_rm_reverse_0_8_96="${ckpt_prefix}_0_8_96"
rlhf_v7_add_mul_4_rm_reverse_0_8_128="${ckpt_prefix}_0_8_128"
rlhf_v7_add_mul_4_rm_reverse_0_8_160="${ckpt_prefix}_0_8_160"

rlhf_v7_add_mul_4_rm_reverse_0_4_add_mathcode_64="${ckpt_prefix}_0_4_add_mathcode_64"
rlhf_v7_add_mul_4_rm_reverse_0_4_add_mathcode_128="${ckpt_prefix}_0_4_add_mathcode_128"
rlhf_v7_add_mul_4_rm_reverse_0_4_add_mathcode_192="${ckpt_prefix}_0_4_add_mathcode_192"
rlhf_v7_add_mul_4_rm_reverse_0_4_add_mathcode_256="${ckpt_prefix}_0_4_add_mathcode_256"
rlhf_v7_add_mul_4_rm_reverse_0_4_add_mathcode_320="${ckpt_prefix}_0_4_add_mathcode_320"

# First batch. It used to be a live assignment that the next one overwrote
# immediately, so it is commented out here like the other batch toggles in
# this file; uncomment it (and disable the batch below) to run it.
#models=($rlhf_v7_add_mul_4_rm_reverse_0_4_64 $rlhf_v7_add_mul_4_rm_reverse_0_4_96 $rlhf_v7_add_mul_4_rm_reverse_0_4_128 $rlhf_v7_add_mul_4_rm_reverse_0_8_64 $rlhf_v7_add_mul_4_rm_reverse_0_8_96 $rlhf_v7_add_mul_4_rm_reverse_0_8_128 $rlhf_v7_add_mul_4_rm_reverse_0_8_160 $rlhf_v7_add_mul_4_rm_reverse_0_4_add_mathcode_64)
# Second batch (active).
# NOTE: `models` is assigned again further down this file; the last assignment wins.
models=(
  "$rlhf_v7_add_mul_4_rm_reverse_0_4_add_mathcode_128"
  "$rlhf_v7_add_mul_4_rm_reverse_0_4_add_mathcode_192"
  "$rlhf_v7_add_mul_4_rm_reverse_0_4_add_mathcode_256"
  "$rlhf_v7_add_mul_4_rm_reverse_0_4_add_mathcode_320"
)

# rm_v7_relabel_add_mul_4_rm_reverse families: 0_8_add_mathcode, plain 1_0, and
# 1_0_add_mathcode. Variable suffixes mirror the tags in the directory names.
ckpt_prefix=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel_add_mul_4_rm_reverse
rlhf_v7_add_mul_4_rm_reverse_0_8_add_mathcode_64="${ckpt_prefix}_0_8_add_mathcode_64"
rlhf_v7_add_mul_4_rm_reverse_0_8_add_mathcode_96="${ckpt_prefix}_0_8_add_mathcode_96"
rlhf_v7_add_mul_4_rm_reverse_0_8_add_mathcode_128="${ckpt_prefix}_0_8_add_mathcode_128"
rlhf_v7_add_mul_4_rm_reverse_0_8_add_mathcode_160="${ckpt_prefix}_0_8_add_mathcode_160"
rlhf_v7_add_mul_4_rm_reverse_0_8_add_mathcode_192="${ckpt_prefix}_0_8_add_mathcode_192"

rlhf_v7_add_mul_4_rm_reverse_1_0_64="${ckpt_prefix}_1_0_64"
rlhf_v7_add_mul_4_rm_reverse_1_0_96="${ckpt_prefix}_1_0_96"
rlhf_v7_add_mul_4_rm_reverse_1_0_128="${ckpt_prefix}_1_0_128"
rlhf_v7_add_mul_4_rm_reverse_1_0_160="${ckpt_prefix}_1_0_160"


rlhf_v7_add_mul_4_rm_reverse_1_0_add_mathcode_64="${ckpt_prefix}_1_0_add_mathcode_64"
rlhf_v7_add_mul_4_rm_reverse_1_0_add_mathcode_96="${ckpt_prefix}_1_0_add_mathcode_96"
rlhf_v7_add_mul_4_rm_reverse_1_0_add_mathcode_128="${ckpt_prefix}_1_0_add_mathcode_128"
rlhf_v7_add_mul_4_rm_reverse_1_0_add_mathcode_160="${ckpt_prefix}_1_0_add_mathcode_160"
rlhf_v7_add_mul_4_rm_reverse_1_0_add_mathcode_192="${ckpt_prefix}_1_0_add_mathcode_192"

# First batch, currently disabled:
#models=($rlhf_v7_add_mul_4_rm_reverse_0_8_add_mathcode_64 $rlhf_v7_add_mul_4_rm_reverse_0_8_add_mathcode_96 $rlhf_v7_add_mul_4_rm_reverse_0_8_add_mathcode_128 $rlhf_v7_add_mul_4_rm_reverse_0_8_add_mathcode_160 $rlhf_v7_add_mul_4_rm_reverse_0_8_add_mathcode_192 $rlhf_v7_add_mul_4_rm_reverse_1_0_64 $rlhf_v7_add_mul_4_rm_reverse_1_0_96 $rlhf_v7_add_mul_4_rm_reverse_1_0_128)
# Second batch (active): the entries not covered by the disabled list above.
# NOTE: `models` is assigned again further down this file; the last assignment wins.
models=(
  "$rlhf_v7_add_mul_4_rm_reverse_1_0_160"
  "$rlhf_v7_add_mul_4_rm_reverse_1_0_add_mathcode_64"
  "$rlhf_v7_add_mul_4_rm_reverse_1_0_add_mathcode_96"
  "$rlhf_v7_add_mul_4_rm_reverse_1_0_add_mathcode_128"
  "$rlhf_v7_add_mul_4_rm_reverse_1_0_add_mathcode_160"
  "$rlhf_v7_add_mul_4_rm_reverse_1_0_add_mathcode_192"
)



# Checkpoint paths of the `internlm2_5_7b_sft_hf_rm_v7_relabel_add_mathcode`
# run; the numeric suffix tells the checkpoints apart.
internlm2_5_sft_rlhf_relabel_add_mathcode_64="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_add_mathcode_64"
internlm2_5_sft_rlhf_relabel_add_mathcode_128="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_add_mathcode_128"
internlm2_5_sft_rlhf_relabel_add_mathcode_192="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_add_mathcode_192"
internlm2_5_sft_rlhf_relabel_add_mathcode_256="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_add_mathcode_256"
internlm2_5_sft_rlhf_relabel_add_mathcode_320="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_add_mathcode_320"
internlm2_5_sft_rlhf_relabel_add_mathcode_384="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_add_mathcode_384"
internlm2_5_sft_rlhf_relabel_add_mathcode_448="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_add_mathcode_448"
internlm2_5_sft_rlhf_relabel_add_mathcode_500="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_add_mathcode_500"

# Selects only the 64 and 192 checkpoints. `models` is reassigned again
# further down the file.
models=(
    "$internlm2_5_sft_rlhf_relabel_add_mathcode_64"
    "$internlm2_5_sft_rlhf_relabel_add_mathcode_192"
)

# Checkpoint paths of the `internlm2_5_7b_sft_hf_rm_v7_relabel_rm_reverse_0_4` run.
internlm2_5_sft_rlhf_relabel_0_4_64="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_rm_reverse_0_4_64"
internlm2_5_sft_rlhf_relabel_0_4_128="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_rm_reverse_0_4_128"
internlm2_5_sft_rlhf_relabel_0_4_192="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_rm_reverse_0_4_192"
internlm2_5_sft_rlhf_relabel_0_4_256="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_rm_reverse_0_4_256"
internlm2_5_sft_rlhf_relabel_0_4_320="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_rm_reverse_0_4_320"
internlm2_5_sft_rlhf_relabel_0_4_384="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_rm_reverse_0_4_384"
internlm2_5_sft_rlhf_relabel_0_4_448="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_rm_reverse_0_4_448"
internlm2_5_sft_rlhf_relabel_0_4_500="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_rm_reverse_0_4_500"

# Checkpoint paths of the `internlm2_5_7b_sft_hf_rm_v7_relabel_rm_reverse_0_8` run.
internlm2_5_sft_rlhf_relabel_0_8_64="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_rm_reverse_0_8_64"
internlm2_5_sft_rlhf_relabel_0_8_128="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_rm_reverse_0_8_128"
internlm2_5_sft_rlhf_relabel_0_8_192="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_rm_reverse_0_8_192"
internlm2_5_sft_rlhf_relabel_0_8_256="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_rm_reverse_0_8_256"
internlm2_5_sft_rlhf_relabel_0_8_320="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_rm_reverse_0_8_320"
internlm2_5_sft_rlhf_relabel_0_8_384="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_rm_reverse_0_8_384"
internlm2_5_sft_rlhf_relabel_0_8_448="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_rm_reverse_0_8_448"
internlm2_5_sft_rlhf_relabel_0_8_500="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_5_7b_sft_hf_rm_v7_relabel_rm_reverse_0_8_500"

# Disabled selection of all eight `0_8` checkpoints:
#models=($internlm2_5_sft_rlhf_relabel_0_8_64 $internlm2_5_sft_rlhf_relabel_0_8_128 $internlm2_5_sft_rlhf_relabel_0_8_192 $internlm2_5_sft_rlhf_relabel_0_8_256 $internlm2_5_sft_rlhf_relabel_0_8_320 $internlm2_5_sft_rlhf_relabel_0_8_384 $internlm2_5_sft_rlhf_relabel_0_8_448 $internlm2_5_sft_rlhf_relabel_0_8_500)
# SFT checkpoints (steps 400 and 500 according to the directory names). These
# are absolute paths outside the transfer_from_tos directory.
internlm2_5_sft_step_400="/cpfs02/llm/shared/public/lantian/exp/internlm2_5/s1_d4_st_5_l1_resumm_20240906_internlm2_5_7b_s1/aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47_s1_d4_st_5_l1_resumm_20240906_internlm2_5_7b_s1_step_400/400_hf_ckpt"
internlm2_5_sft_step_500="/cpfs02/llm/shared/public/lantian/exp/internlm2_5/s1_d4_st_5_l1_resumm_20240906_internlm2_5_7b_s1/aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47_s1_d4_st_5_l1_resumm_20240906_internlm2_5_7b_s1_step_500/500_hf_ckpt"
models=(
    "$internlm2_5_sft_step_400"
    "$internlm2_5_sft_step_500"
)

# Baseline checkpoint; this assignment replaces the selection made just above.
s1_baseline="/cpfs02/llm/shared/public/lantian/exp/20240418_aliyun_Ampere_7B_v1_1_FT_v1_0_0_s1_rc48_1660_hf_ckpt"
models=("$s1_baseline")


# Checkpoint paths of the `internlm2_rm_reverse_bsz_16` run.
internlm2_rm_reverse_bsz_16_64="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_16_64"
internlm2_rm_reverse_bsz_16_96="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_16_96"
internlm2_rm_reverse_bsz_16_128="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_16_128"
internlm2_rm_reverse_bsz_16_160="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_16_160"
internlm2_rm_reverse_bsz_16_192="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_16_192"

# Checkpoint paths of the `internlm2_rm_reverse_bsz_48` run.
internlm2_rm_reverse_bsz_48_64="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_48_64"
internlm2_rm_reverse_bsz_48_128="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_48_128"
internlm2_rm_reverse_bsz_48_192="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_48_192"
internlm2_rm_reverse_bsz_48_256="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_48_256"
internlm2_rm_reverse_bsz_48_320="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_48_320"

# First batch of eight: every bsz_16 checkpoint plus the first three bsz_48
# ones. It is replaced immediately by the second batch below.
models=(
    "$internlm2_rm_reverse_bsz_16_64"
    "$internlm2_rm_reverse_bsz_16_96"
    "$internlm2_rm_reverse_bsz_16_128"
    "$internlm2_rm_reverse_bsz_16_160"
    "$internlm2_rm_reverse_bsz_16_192"
    "$internlm2_rm_reverse_bsz_48_64"
    "$internlm2_rm_reverse_bsz_48_128"
    "$internlm2_rm_reverse_bsz_48_192"
)
# Second batch: the two remaining bsz_48 checkpoints.
models=(
    "$internlm2_rm_reverse_bsz_48_256"
    "$internlm2_rm_reverse_bsz_48_320"
)

# Checkpoint paths of the `internlm2_rm_reverse_bsz_96` run.
internlm2_rm_reverse_bsz_96_64="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_96_64"
internlm2_rm_reverse_bsz_96_128="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_96_128"
internlm2_rm_reverse_bsz_96_192="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_96_192"
internlm2_rm_reverse_bsz_96_256="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_96_256"
internlm2_rm_reverse_bsz_96_320="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_96_320"
internlm2_rm_reverse_bsz_96_384="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_96_384"
internlm2_rm_reverse_bsz_96_448="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_96_448"

# Checkpoint paths of the `internlm2_rm_reverse_bsz_128` run.
internlm2_rm_reverse_bsz_128_64="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_128_64"
internlm2_rm_reverse_bsz_128_128="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_128_128"
internlm2_rm_reverse_bsz_128_192="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_128_192"
internlm2_rm_reverse_bsz_128_256="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_128_256"
internlm2_rm_reverse_bsz_128_320="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_128_320"
internlm2_rm_reverse_bsz_128_384="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_128_384"
internlm2_rm_reverse_bsz_128_448="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_128_448"
internlm2_rm_reverse_bsz_128_500="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/internlm2_rm_reverse_bsz_128_500"

# Disabled first batch (all bsz_96 checkpoints plus bsz_128_64):
#models=($internlm2_rm_reverse_bsz_96_64 $internlm2_rm_reverse_bsz_96_128 $internlm2_rm_reverse_bsz_96_192 $internlm2_rm_reverse_bsz_96_256 $internlm2_rm_reverse_bsz_96_320 $internlm2_rm_reverse_bsz_96_384 $internlm2_rm_reverse_bsz_96_448 $internlm2_rm_reverse_bsz_128_64)

# Second batch: the remaining seven bsz_128 checkpoints. `models` is
# reassigned again further down the file.
models=(
    "$internlm2_rm_reverse_bsz_128_128"
    "$internlm2_rm_reverse_bsz_128_192"
    "$internlm2_rm_reverse_bsz_128_256"
    "$internlm2_rm_reverse_bsz_128_320"
    "$internlm2_rm_reverse_bsz_128_384"
    "$internlm2_rm_reverse_bsz_128_448"
    "$internlm2_rm_reverse_bsz_128_500"
)

# Checkpoint paths of the
# `sft_hf_rm_v7_relabel_rm_reverse_add_mathcode_0_1_no_criteria` run. The
# paths contain "no_criteria", which the launch loop at the end of the file
# matches to pass `--criteria False`.
no_criteria_v7_relabel_rm_reverse_add_mathcode_0_1_64="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/sft_hf_rm_v7_relabel_rm_reverse_add_mathcode_0_1_no_criteria_64"
no_criteria_v7_relabel_rm_reverse_add_mathcode_0_1_128="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/sft_hf_rm_v7_relabel_rm_reverse_add_mathcode_0_1_no_criteria_128"
no_criteria_v7_relabel_rm_reverse_add_mathcode_0_1_192="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/sft_hf_rm_v7_relabel_rm_reverse_add_mathcode_0_1_no_criteria_192"
no_criteria_v7_relabel_rm_reverse_add_mathcode_0_1_256="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/sft_hf_rm_v7_relabel_rm_reverse_add_mathcode_0_1_no_criteria_256"
no_criteria_v7_relabel_rm_reverse_add_mathcode_0_1_320="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/sft_hf_rm_v7_relabel_rm_reverse_add_mathcode_0_1_no_criteria_320"
no_criteria_v7_relabel_rm_reverse_add_mathcode_0_1_384="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/sft_hf_rm_v7_relabel_rm_reverse_add_mathcode_0_1_no_criteria_384"
no_criteria_v7_relabel_rm_reverse_add_mathcode_0_1_448="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/sft_hf_rm_v7_relabel_rm_reverse_add_mathcode_0_1_no_criteria_448"
no_criteria_v7_relabel_rm_reverse_add_mathcode_0_1_500="/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/sft_hf_rm_v7_relabel_rm_reverse_add_mathcode_0_1_no_criteria_500"

# Selects the four latest checkpoints (320..500). `models` is reassigned again
# further down the file.
models=(
    "$no_criteria_v7_relabel_rm_reverse_add_mathcode_0_1_320"
    "$no_criteria_v7_relabel_rm_reverse_add_mathcode_0_1_384"
    "$no_criteria_v7_relabel_rm_reverse_add_mathcode_0_1_448"
    "$no_criteria_v7_relabel_rm_reverse_add_mathcode_0_1_500"
)

# Disabled `rm_reverse_0_4_no_criteria` family:
#no_criteria_v7_relabel_rm_reverse_0_4_64=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/sft_hf_rm_v7_relabel_rm_reverse_0_4_no_criteria_64
#no_criteria_v7_relabel_rm_reverse_0_4_128=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/sft_hf_rm_v7_relabel_rm_reverse_0_4_no_criteria_128
#no_criteria_v7_relabel_rm_reverse_0_4_192=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/sft_hf_rm_v7_relabel_rm_reverse_0_4_no_criteria_192
#no_criteria_v7_relabel_rm_reverse_0_4_256=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/sft_hf_rm_v7_relabel_rm_reverse_0_4_no_criteria_256
#models=($no_criteria_v7_relabel_rm_reverse_0_4_64 $no_criteria_v7_relabel_rm_reverse_0_4_128 $no_criteria_v7_relabel_rm_reverse_0_4_192 $no_criteria_v7_relabel_rm_reverse_0_4_256)

# Model selections given as bare checkpoint directory names, written with
# brace expansion (entries are generated in the listed order). Each
# assignment replaces the previous one, so only the last survives.

# Batch 1: six rloo checkpoints plus the first two `add_mathcode_0_2` ones.
models=(
    20240912_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel_rm_reverse_add_mathcode_0_1_rloo_{20,40,60,100,140,160}
    sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_2_{64,96}
)
# Batch 2.
models=(
    sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_2_{128,160,192}
    sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_4_{64,96,128,160}
    sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_6_64
)
# Batch 3.
models=(
    sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_6_{96,128,160}
    sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_8_{64,96,128,160}
    sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_1_0_64
)
# Batch 4.
models=(
    sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_1_0_{96,128}
)

# Single-checkpoint selections, all given as absolute paths. Each `models=`
# assignment replaces the previous one.
d4_st_5_l1_resumm="/cpfs02/llm/shared/public/lantian/exp/20240618_sft_7b_critique_nips2024_d4_st_5_l1_resumm_385_epoch_2_0701/aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47_FINAL_critic_v4_st_5_l1_resumm/385_hf_ckpt"
models=("$d4_st_5_l1_resumm")

# Disabled alternatives:
#models=(/cpfs02/llm/shared/public/lantian/exp/202409_13_d4_st_5_l1_resumm_mix/aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47_FINAL_critic_v4_st_5_l1_resumm/300_hf_ckpt)
#models=(sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_2_64 sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_2_128 sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_2_192 sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_2_256 sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_2_320 sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_4_64 sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_4_96 sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_4_128)
#models=(sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_4_160 sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_4_192 sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_6_64 sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_6_128 sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_6_192 sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_6_256 sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_6_320 sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_6_384)
#models=(/cpfs02/llm/shared/public/lantian/exp/202409_13_d4_st_5_l1_resumm_mix/aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47_FINAL_critic_v4_st_5_l1_resumm_mathcode_without_criteria_but_other_with/370_hf)
#models=(/cpfs02/llm/shared/public/lantian/exp/202409_13_d4_st_5_l1_resumm_mix_mathcode_without_criteria_s1_model/aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47_FINAL_critic_v4_st_5_l1_resumm/370_hf)
#models=(/cpfs02/llm/shared/public/lantian/exp/202409_13_d4_st_5_l1_resumm_mix_mathcode_with_criteria_s1_model/aliyun_Ampere_7B_v1.1_enchance_FT_v1.0.0_s1_rc47_FINAL_critic_v4_st_5_l1_resumm/300_hf)

# Checkpoint 448 of the `rm_v7_relabel_rm_reverse_add_mathcode_0_1` run.
models=(
    "/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos/20240826_warmup_40_bsz_64_1_1_prompt_len_32768_rm_v7_relabel_rm_reverse_add_mathcode_0_1_448"
)


# `rm_reverse_0_1 ... mathcode_no_reference` selections (bare directory
# names, generated by brace expansion in the listed order). Each assignment
# replaces the previous one, so only the last survives.

# add_mathcode_0_2 checkpoints (no 256 in this list) + first 0_4 checkpoint.
models=(
    sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_2_mathcode_no_reference_{64,128,192,320,384,448,500}
    sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_4_mathcode_no_reference_64
)
# Remaining add_mathcode_0_4 checkpoints + first 0_6 checkpoint.
models=(
    sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_4_mathcode_no_reference_{128,192,256,320,384,448,500}
    sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_6_mathcode_no_reference_64
)
# Remaining add_mathcode_0_6 checkpoints.
models=(
    sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_6_mathcode_no_reference_{96,128,160,192,224,256}
)

# add_mathcode_0_8 checkpoints.
models=(
    sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_8_mathcode_no_reference_{64,80,96,112,128,144}
)
# Only checkpoint 144 of add_mathcode_0_8.
models=(
    sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_8_mathcode_no_reference_144
)
# add_mathcode_1_0 checkpoints.
models=(
    sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_1_0_mathcode_no_reference_{64,80,96,112,128,144,160}
)


# `rm_reverse_0_4 ... mathcode_no_reference` selections (bare directory
# names, generated by brace expansion in the listed order). Each assignment
# replaces the previous one, so only the last survives.

# add_mathcode_0_2 checkpoints + first two 0_4 checkpoints.
models=(
    sft_hf_rm_v7_relabel_rm_reverse_0_4_relabel_add_mathcode_0_2_mathcode_no_reference_{64,96,128,160,192,224}
    sft_hf_rm_v7_relabel_rm_reverse_0_4_relabel_add_mathcode_0_4_mathcode_no_reference_{64,96}
)
# Remaining add_mathcode_0_4 checkpoints + first four 0_6 checkpoints.
models=(
    sft_hf_rm_v7_relabel_rm_reverse_0_4_relabel_add_mathcode_0_4_mathcode_no_reference_{128,160,192}
    sft_hf_rm_v7_relabel_rm_reverse_0_4_relabel_add_mathcode_0_6_mathcode_no_reference_{64,96,128,160}
)
# Remaining add_mathcode_0_6 checkpoints.
models=(
    sft_hf_rm_v7_relabel_rm_reverse_0_4_relabel_add_mathcode_0_6_mathcode_no_reference_{192,224,256}
)


# Four `rm_reverse_0_1 ... rloo` checkpoints followed by four
# `rm_reverse_0_4 ... add_mathcode_0_8` checkpoints.
models=(
    sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_6_mathcode_no_reference_rloo_{20,40,60,80}
    sft_hf_rm_v7_relabel_rm_reverse_0_4_relabel_add_mathcode_0_8_mathcode_no_reference_{64,96,128,160}
)
# Disabled follow-up batch:
#models=(sft_hf_rm_v7_relabel_rm_reverse_0_4_relabel_add_mathcode_0_8_mathcode_no_reference_192 sft_hf_rm_v7_relabel_rm_reverse_0_4_relabel_add_mathcode_1_0_mathcode_no_reference_64 sft_hf_rm_v7_relabel_rm_reverse_0_4_relabel_add_mathcode_1_0_mathcode_no_reference_96 sft_hf_rm_v7_relabel_rm_reverse_0_4_relabel_add_mathcode_1_0_mathcode_no_reference_128 sft_hf_rm_v7_relabel_rm_reverse_0_4_relabel_add_mathcode_1_0_mathcode_no_reference_160)


# `rm_reverse_0_0 ... mathcode_no_reference` selections (bare directory
# names, generated by brace expansion in the listed order). Each assignment
# replaces the previous one, so only the last survives.

# add_mathcode_0_2 checkpoints + first 0_4 checkpoint.
models=(
    sft_hf_rm_v7_relabel_rm_reverse_0_0_relabel_add_mathcode_0_2_mathcode_no_reference_{64,128,192,256,320,384,448}
    sft_hf_rm_v7_relabel_rm_reverse_0_0_relabel_add_mathcode_0_4_mathcode_no_reference_64
)
# Remaining add_mathcode_0_4 checkpoints + first three 0_6 checkpoints.
models=(
    sft_hf_rm_v7_relabel_rm_reverse_0_0_relabel_add_mathcode_0_4_mathcode_no_reference_{128,192,256,320,384}
    sft_hf_rm_v7_relabel_rm_reverse_0_0_relabel_add_mathcode_0_6_mathcode_no_reference_{64,128,192}
)
# Remaining add_mathcode_0_6 checkpoints + first three 0_8 checkpoints.
models=(
    sft_hf_rm_v7_relabel_rm_reverse_0_0_relabel_add_mathcode_0_6_mathcode_no_reference_{256,320,384,448,500}
    sft_hf_rm_v7_relabel_rm_reverse_0_0_relabel_add_mathcode_0_8_mathcode_no_reference_{64,96,128}
)
# Last add_mathcode_0_8 checkpoint + add_mathcode_1_0 checkpoints.
# NOTE(review): suffix 129 breaks the 64/96/.../160 spacing used elsewhere and
# may be a typo for 128 -- verify against the checkpoint directory.
models=(
    sft_hf_rm_v7_relabel_rm_reverse_0_0_relabel_add_mathcode_0_8_mathcode_no_reference_160
    sft_hf_rm_v7_relabel_rm_reverse_0_0_relabel_add_mathcode_1_0_mathcode_no_reference_{64,96,129,160}
)


# `rm_reverse_0_1` selections with and without reference (bare directory
# names, generated by brace expansion in the listed order). Each assignment
# replaces the previous one; the final one in this group is the last `models`
# assignment before the launch loop.

# with_reference: add_mathcode_0_2 checkpoints + first two 0_6 checkpoints.
models=(
    sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_2_mathcode_with_reference_{64,128,192,256,320,352}
    sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_6_mathcode_with_reference_{64,128}
)
# with_reference: remaining add_mathcode_0_6 checkpoints.
models=(
    sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_6_mathcode_with_reference_{192,256,320}
)


# add_mathcode_0_1, with_reference.
models=(
    sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_1_mathcode_with_reference_{64,128,192,256,320,384,448,500}
)
# add_mathcode_0_1, no_reference.
models=(
    sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_1_mathcode_no_reference_{64,128,192,256,320,384,448,500}
)
# add_mathcode_0_6, no_reference, rloo_20240919 (seven checkpoints).
models=(
    sft_hf_rm_v7_relabel_rm_reverse_0_1_relabel_add_mathcode_0_6_mathcode_no_reference_rloo_20240919_{40,60,80,100,120,140,160}
)

# Launch one background inference job per selected model, one GPU slot each.
#
# Reads:   models - array of checkpoints. An entry is either a bare directory
#                   name (resolved under $ckpt_root) or an absolute path
#                   (used unchanged).
# Effects: starts `python feedback_models.py ...` in the background for each
#          model with CUDA_VISIBLE_DEVICES set to the job's GPU id. The script
#          does not wait for the jobs to finish.
#
# Prompt sections are switched off by substrings of the resolved model path:
#   *no_criteria* -> --criteria False
#   *no_task*     -> --task False
#   *no_all*      -> task, criteria and reference all False
ckpt_root=/cpfs02/llm/shared/public/lantian/exp/transfer_from_tos
num_gpus=8      # GPU slots 0..7, the range this loop has always covered
gpu_offset=0    # added to the slot number to obtain the GPU id

if (( ${#models[@]} > num_gpus )); then
    echo "Warning: ${#models[@]} models selected but only $num_gpus GPU slots; the extra models are skipped" >&2
fi

# Bound the loop by the number of models as well as the number of GPU slots:
# iterating a fixed 0..7 over a shorter list launched jobs on the bare
# checkpoint root directory for every missing entry.
for ((slot = 0; slot < num_gpus && slot < ${#models[@]}; slot++))
do
    entry=${models[$slot]}
    # Skip holes/empty entries instead of launching on an empty model name.
    [[ -n $entry ]] || continue

    # Absolute paths are used as-is; bare names live under $ckpt_root.
    if [[ $entry == /* ]]; then
        model=$entry
    else
        model=$ckpt_root/$entry
    fi
    index=$((slot + gpu_offset))

    if [[ $model == *"no_ref"* ]]; then
        # inference does not contain the reference prompt
        reference=False
    else
        reference=True
    fi
    # NOTE(review): this override makes the "no_ref" check above ineffective,
    # so the reference prompt is always included unless the name contains
    # "no_all". It is kept to preserve current behavior; remove this line to
    # re-enable the name-based detection.
    reference=True

    if [[ $model == *"no_criteria"* ]]; then
        # inference does not contain the criteria prompt
        criteria=False
    else
        criteria=True
    fi

    if [[ $model == *"no_task"* ]]; then
        # inference does not contain the task prompt
        task=False
    else
        task=True
    fi

    if [[ $model == *"no_all"* ]]; then
        # inference contains none of the task / criteria / reference prompts
        task=False
        criteria=False
        reference=False
    fi

    echo "Inference $model on GPU[$index] | task [$task] | criteria [$criteria] | reference [$reference]"
    CUDA_VISIBLE_DEVICES=$index python feedback_models.py --model_name "$model" --output_dir 20240823_rlhf_singleturn_temp_07 --reference "$reference" --task "$task" --criteria "$criteria" --split dev &
    #CUDA_VISIBLE_DEVICES=$(($index+1)) python feedback_models.py --model_name $model --output_dir 20240811_resumm_debug --reference $reference --task $task --criteria $criteria --split test &
done
