#!/usr/bin/env bash
# Configuration for the TruthfulQA evaluation runs below.
#
# data_root: directory under which this script looks for `output/` (PEFT
# checkpoints), `data/eval/truthfulqa`, and `hooked_llama/neuron_activation/`.
# It can be overridden from the environment: `data_root=/some/dir bash <script>`.
# NOTE(review): this line used to be the bare word `data_root`, which the shell
# executed as a command ("command not found") and which left the variable
# empty, so every derived path started at `/`. The current-directory default
# is an assumption (result directories are already relative) -- confirm the
# intended location.
data_root="${data_root:-.}"

# Roots of the base-model checkpoints. Only model_root2 is referenced by the
# active commands in this script; model_root1 is kept for compatibility.
model_root1=/data3/MODELS
model_root2=/data2/MODELS

# Directory that holds the PEFT checkpoints, one sub-directory per
# "<model>_<peft name>" combination.
peft_root="${data_root}/output"

# BATCH_SIZE is passed as --eval_batch_size. NUM_SAMPLE and MAX_NEW_TOKENS are
# not referenced in the visible part of this script; kept in case other code
# relies on them.
BATCH_SIZE=100
NUM_SAMPLE=200
MAX_NEW_TOKENS=128

# Model directory names (resolved under model_root2) and PEFT checkpoint name
# suffixes (resolved under peft_root as "<model>_<suffix>").
MODELS=(Llama-2-7b-hf gemma-7b Mistral-7B-v0.1)
PEFT_NAME=(sharegpt_ia3_ff_1 sharegpt_ia3_ff_1_hh_harmless_dpo_ia3_ff)

# For every model in MODELS, run the TruthfulQA multiple-choice evaluation
# (--metrics mc, --preset qa) in two "patch" configurations:
#   1. sft_patch  : --red_peft_path = first PEFT path, --blue_peft_path = both
#   2. base_patch : no --red_peft_path,                --blue_peft_path = both
# Both runs share the same --index_path file.
#
# All expansions are quoted so that root directories containing whitespace or
# glob characters are passed through as single arguments.
# A failing run does not stop the loop; the remaining runs are still attempted.
for MODEL in "${MODELS[@]}"
do
    # PEFT checkpoint directories for this model, in PEFT_NAME order.
    PEFT_PATH=(
        "${peft_root}/${MODEL}_${PEFT_NAME[0]}"
        "${peft_root}/${MODEL}_${PEFT_NAME[1]}"
    )

    # Index file used by both patch runs; its name embeds the LAST PEFT_NAME
    # entry (negative subscripts need a reasonably recent bash).
    index_path="${data_root}/hooked_llama/neuron_activation/${MODEL}_${PEFT_NAME[-1]}_sft_vs_dpo_on_hh_harmless_sft_completion.pt"

    # --- Disabled reference runs (base / sft / dpo without patching) ---------
    # NOTE(review): these use the module path `src.eval...` while the active
    # commands use `eval...`; adjust before re-enabling.

    # python -m src.eval.truthfulqa.run_eval \
    #     --data_dir ${data_root}/data/eval/truthfulqa \
    #     --save_dir results/trutufulqa_base/${MODEL} \
    #     --model_name_or_path ${model_root2}/${MODEL} \
    #     --tokenizer_name_or_path ${model_root2}/${MODEL} \
    #     --metrics mc \
    #     --preset qa \
    #     --eval_batch_size ${BATCH_SIZE} \
    #     --use_chat_format \
    #     --hooked

    # python -m src.eval.truthfulqa.run_eval \
    #     --data_dir ${data_root}/data/eval/truthfulqa \
    #     --save_dir results/trutufulqa_sft/${MODEL} \
    #     --model_name_or_path ${model_root2}/${MODEL} \
    #     --tokenizer_name_or_path ${model_root2}/${MODEL} \
    #     --metrics mc \
    #     --preset qa \
    #     --eval_batch_size ${BATCH_SIZE} \
    #     --use_chat_format \
    #     --red_peft_path ${PEFT_PATH[0]} \
    #     --hooked

    # python -m src.eval.truthfulqa.run_eval \
    #     --data_dir ${data_root}/data/eval/truthfulqa \
    #     --save_dir results/trutufulqa_dpo/${MODEL} \
    #     --model_name_or_path ${model_root2}/${MODEL} \
    #     --tokenizer_name_or_path ${model_root2}/${MODEL} \
    #     --metrics mc \
    #     --preset qa \
    #     --eval_batch_size ${BATCH_SIZE} \
    #     --use_chat_format \
    #     --red_peft_path ${PEFT_PATH[@]} \
    #     --hooked

    # --- Active run 1: sft_patch ---------------------------------------------
    # The "trutufulqa" spelling in the save directory is kept as-is so that
    # existing result directories keep matching.
    python -m eval.truthfulqa.run_eval \
        --data_dir "${data_root}/data/eval/truthfulqa" \
        --save_dir "results/trutufulqa_sft_patch/${MODEL}" \
        --model_name_or_path "${model_root2}/${MODEL}" \
        --tokenizer_name_or_path "${model_root2}/${MODEL}" \
        --metrics mc \
        --preset qa \
        --eval_batch_size "${BATCH_SIZE}" \
        --use_chat_format \
        --red_peft_path "${PEFT_PATH[0]}" \
        --blue_peft_path "${PEFT_PATH[@]}" \
        --index_path "${index_path}" \
        --hooked

    # --- Active run 2: base_patch (same as above, without --red_peft_path) ---
    python -m eval.truthfulqa.run_eval \
        --data_dir "${data_root}/data/eval/truthfulqa" \
        --save_dir "results/trutufulqa_base_patch/${MODEL}" \
        --model_name_or_path "${model_root2}/${MODEL}" \
        --tokenizer_name_or_path "${model_root2}/${MODEL}" \
        --metrics mc \
        --preset qa \
        --eval_batch_size "${BATCH_SIZE}" \
        --use_chat_format \
        --blue_peft_path "${PEFT_PATH[@]}" \
        --index_path "${index_path}" \
        --hooked

done