#!/usr/bin/env bash
# Settings for the BBH evaluation runs below.
#
# The three *_root values may be supplied through the environment; when they
# are not, the defaults below are used. data_root defaults to the empty
# string, in which case every path derived from it starts at "/".
data_root="${data_root:-}"
model_root1="${model_root1:-/data3/MODELS}"
model_root2="${model_root2:-/data2/MODELS}"
# Directory holding the PEFT adapter outputs, one sub-directory per
# <model>_<peft name> pair.
peft_root="${data_root}/output"

BATCH_SIZE=10
NUM_SAMPLE=200
MAX_NEW_TOKENS=128

# Model directory names, resolved against a model root.
MODELS=(
    Llama-2-7b-hf
    gemma-7b
    Mistral-7B-v0.1
)
# Adapter name suffixes; combined with each model name to locate adapters
# under peft_root.
PEFT_NAME=(
    sharegpt_ia3_ff_1
    sharegpt_ia3_ff_1_hh_harmless_dpo_ia3_ff
)

#######################################
# Runs eval.bbh.run_eval once with the options shared by every BBH run in
# this script.
# Globals:   data_root, model_root2, BATCH_SIZE (read)
# Arguments: $1 - model directory name under model_root2
#            $2 - suffix appended to "<model>-" to form the save_dir name
#            remaining - extra options, placed just before --hooked
# Returns:   exit status of the python invocation
#######################################
_run_bbh_eval() {
    local model=$1 tag=$2
    shift 2
    python -m eval.bbh.run_eval \
        --data_dir "${data_root}/data/eval/bbh" \
        --save_dir "results/bbh/${model}-${tag}" \
        --model "${model_root2}/${model}" \
        --tokenizer "${model_root2}/${model}" \
        --eval_batch_size "${BATCH_SIZE}" \
        --max_num_examples_per_task 40 \
        --use_chat_format \
        "$@" \
        --hooked
}

for MODEL in "${MODELS[@]}"
do
    # Adapter directories for this model, in PEFT_NAME order.
    PEFT_PATH=(
        "${peft_root}/${MODEL}_${PEFT_NAME[0]}"
        "${peft_root}/${MODEL}_${PEFT_NAME[1]}"
    )

    # Last PEFT_NAME entry, addressed by explicit index because negative
    # subscripts such as ${PEFT_NAME[-1]} need bash >= 4.3.
    last_peft_name=${PEFT_NAME[${#PEFT_NAME[@]}-1]}
    index_path="${data_root}/hooked_llama/neuron_activation/${MODEL}_${last_peft_name}_sft_vs_dpo_on_hh_harmless_sft_completion.pt"

    # Disabled runs (chain-of-thought BBH, no --index_path). Uncomment to
    # re-enable.
    # Base model only:
    # _run_bbh_eval "${MODEL}" cot
    # Base model with the first adapter as --red_peft_path:
    # _run_bbh_eval "${MODEL}" sft-cot --red_peft_path "${PEFT_PATH[0]}"
    # Base model with both adapters as --red_peft_path:
    # _run_bbh_eval "${MODEL}" dpo-cot --red_peft_path "${PEFT_PATH[@]}"

    # First adapter as --red_peft_path, both adapters as --blue_peft_path
    # (each path is passed as its own argument).
    _run_bbh_eval "${MODEL}" sft-patch-cot \
        --red_peft_path "${PEFT_PATH[0]}" \
        --blue_peft_path "${PEFT_PATH[@]}" \
        --index_path "${index_path}"

    # Same as above but without --red_peft_path.
    _run_bbh_eval "${MODEL}" patch-cot \
        --blue_peft_path "${PEFT_PATH[@]}" \
        --index_path "${index_path}"
done