
# Sweep driver for `python -m hooked_models.output_comparison`.
#
# For every (model, seed, dataset, neuron-index file) combination listed below,
# the comparison module is launched once with the full list of --topk_ablate
# values. A failing run does not stop the sweep; the next combination is tried.
#
# Configuration:
#   data_root    root that holds data/, output/ and hooked_llama/
#   model_root1  directory that contains the base model checkpoint
# Both are left empty here and must be filled in before running; with an empty
# value the derived paths simply start at "/".
data_root=
DATA_SET=(beavertails flan harmfulqa)
model_root1=
peft_root=${data_root}/output
DATASET=data/raw_train/BeaverTails/test.jsonl
# DATASET=data/eval/bbh

# Values handed to --topk_ablate, kept in one array so the list is defined once.
TOPK_ABLATE=(
    0 200 400 600 800 1000 1200 1500 2000 3000 4000 5000 6000 7000 8000 9000
    10000 12000 14000 16000 18000 20000
)

for model in hh_harmless; do
for seed in 1; do
    PEFT_NAME=("sharegpt_ia3_ff_${seed}" "sharegpt_ia3_ff_${seed}_${model}_dpo_ia3_ff")
    GUIDED_PEFT_NAME=("sharegpt_ia3_ff_${seed}" "sharegpt_ia3_ff_${seed}_hh_helpful_dpo_ia3_ff")
    MODEL=Llama-2-7b-hf

    # Reset both path arrays so no entry from a previous iteration can leak in.
    PEFT_PATH=()
    GUIDED_PEFT_PATH=()
    for i in "${!PEFT_NAME[@]}"; do
        PEFT_PATH[i]="${peft_root}/${MODEL}_${PEFT_NAME[i]}"
        GUIDED_PEFT_PATH[i]="${peft_root}/${MODEL}_${GUIDED_PEFT_NAME[i]}"
    done

    # Last adapter name in the chain; it is part of the neuron-activation file
    # name. Computed from the array length instead of using [-1] so that bash
    # releases without negative subscripts (e.g. 3.2 on macOS) also work.
    last_peft_name=${PEFT_NAME[${#PEFT_NAME[@]}-1]}

    for dataset in beavertails; do
        INDEX_PATH=(
            "base_vs_dpo_on_${dataset}_base_completion"
            "base_vs_dpo_on_${dataset}_dpo_completion"
            "sft_vs_dpo_on_${dataset}_sft_completion"
            "sft_vs_dpo_on_${dataset}_dpo_completion"
            # chat_vs_sft_on_${dataset}_sft_completion
            # chat_vs_sft_on_${dataset}_chat_completion
            # hh_harmless_prompt_last_token
        )
        #  800 1200 2000 3000 4000 5000
        for index_path in "${INDEX_PATH[@]}"; do
            # The same .pt file is passed as both --index_path and --value_path.
            neuron_file="${data_root}/hooked_llama/neuron_activation/${MODEL}_${last_peft_name}_${index_path}.pt"

            python -m hooked_models.output_comparison \
                --dataset "${data_root}/${DATASET}" \
                --save_dir results/output_comparison \
                --model_name_or_path "${model_root1}/${MODEL}" \
                --tokenizer_name_or_path "${model_root1}/${MODEL}" \
                --eval_batch_size 50 \
                --num_samples 1000 \
                --max_new_tokens 128 \
                --topk_ablate "${TOPK_ABLATE[@]}" \
                --use_chat_format \
                --red_peft_path "${PEFT_PATH[@]}" \
                --index_path "${neuron_file}" \
                --value_path "${neuron_file}"

            # ---- Disabled invocation variants, kept for reference ----
            # NOTE(review): some of these reference ${model_root2}, which is not
            # assigned anywhere in the visible part of this script; define it
            # before re-enabling them.

            # python -m eval.arena.run_eval \
            #     --dataset ${data_root}/${DATASET} \
            #     --save_dir results/arena \
            #     --model_name_or_path ${model_root2}/${MODEL} \
            #     --tokenizer_name_or_path ${model_root2}/${MODEL} \
            #     --cost_model_name_or_path ${model_root1}/beaver-7b-v1.0-cost \
            #     --eval_batch_size 200 \
            #     --num_samples 1000 \
            #     --max_new_tokens 128 \
            #     --topk_ablate 0 200 400 600 800 1000 1200 1500 2000 3000 4000 5000 6000 7000 8000 9000 10000 12000 14000 16000 18000 20000 \
            #     --use_chat_format \
            #     --patch_mean \
            #     --index_path ${data_root}/hooked_llama/neuron_activation/${MODEL}_${PEFT_NAME[-1]}_${index_path}.pt \
            #     --value_path ${data_root}/hooked_llama/neuron_activation/${MODEL}_${PEFT_NAME[-1]}_${index_path}.pt

            # python -m eval.arena.run_eval \
            #     --dataset ${data_root}/${DATASET} \
            #     --save_dir results/arena \
            #     --model_name_or_path ${model_root2}/${MODEL} \
            #     --tokenizer_name_or_path ${model_root2}/${MODEL} \
            #     --cost_model_name_or_path ${model_root1}/beaver-7b-v1.0-cost \
            #     --eval_batch_size 200 \
            #     --num_samples 200 \
            #     --max_new_tokens 128 \
            #     --topk_ablate 10000 \
            #     --use_chat_format \
            #     --blue_peft_path ${PEFT_PATH[@]} \
            #     --generation_startswith Sure


            # python -m eval.arena.run_eval \
            #     --dataset ${data_root}/${DATASET} \
            #     --save_dir results/arena \
            #     --model_name_or_path ${model_root1}/${MODEL} \
            #     --tokenizer_name_or_path ${model_root1}/${MODEL} \
            #     --cost_model_name_or_path ${model_root1}/beaver-7b-v1.0-cost \
            #     --eval_batch_size 200 \
            #     --num_samples 200 \
            #     --max_new_tokens 128 \
            #     --topk_ablate 0 200 400 600 800 1000 1200 1500 2000 3000 4000 5000 6000 7000 8000 9000 10000 12000 14000 16000 18000 20000 \
            #     --use_chat_format \
            #     --blue_peft_path ${PEFT_PATH[@]} \
            #     --red_peft_path ${GUIDED_PEFT_PATH[@]} \
            #     --index_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_${PEFT_NAME[-1]}_${index_path}.pt \
            #     --value_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_${PEFT_NAME[-1]}_${index_path}.pt \
            #     --guided_generation
                # --cache_difference

            # python -m eval.arena.run_eval \
            #     --dataset ${data_root}/${DATASET} \
            #     --save_dir results/arena \
            #     --model_name_or_path ${model_root1}/${MODEL} \
            #     --tokenizer_name_or_path ${model_root1}/${MODEL} \
            #     --cost_model_name_or_path ${model_root1}/beaver-7b-v1.0-reward \
            #     --eval_batch_size 200 \
            #     --num_samples 200 \
            #     --max_new_tokens 128 \
            #     --topk_ablate 0 200 400 600 800 1000 1200 1500 2000 3000 4000 5000 6000 7000 8000 9000 10000 12000 14000 16000 18000 20000 \
            #     --use_chat_format \
            #     --blue_peft_path ${PEFT_PATH[@]} \
            #     --index_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_sharegpt_ia3_ff_${seed}_hh_harmless_dpo_ia3_ff_${index_path}.pt \
            #     --value_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_sharegpt_ia3_ff_${seed}_hh_harmless_dpo_ia3_ff_${index_path}.pt \
            #     --guided_generation

            # python -m eval.arena.run_eval \
            #     --dataset ${data_root}/${DATASET} \
            #     --save_dir results/arena \
            #     --model_name_or_path ${model_root1}/${MODEL} \
            #     --tokenizer_name_or_path ${model_root1}/${MODEL} \
            #     --cost_model_name_or_path ${model_root1}/beaver-7b-v1.0-reward \
            #     --eval_batch_size 200 \
            #     --num_samples 200 \
            #     --max_new_tokens 128 \
            #     --topk_ablate 0 200 400 600 800 1000 1200 1500 2000 3000 4000 5000 6000 7000 8000 9000 10000 12000 14000 16000 18000 20000 \
            #     --use_chat_format \
            #     --red_peft_path ${PEFT_PATH[0]} \
            #     --blue_peft_path ${PEFT_PATH[@]} \
            #     --index_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_sharegpt_ia3_ff_${seed}_hh_harmless_dpo_ia3_ff_${index_path}.pt \
            #     --value_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_sharegpt_ia3_ff_${seed}_hh_harmless_dpo_ia3_ff_${index_path}.pt \
            #     --guided_generation
        done
    done
done
done

# for model in hh_harmless hh_helpful
# do
# for seed in 1
# do
#     PEFT_NAME=(sharegpt_ia3_ff_${seed} sharegpt_ia3_ff_${seed}_${model}_dpo_ia3_ff)
#     # PEFT_NAME=(sharegpt_lora_qv sharegpt_lora_qv_merged_hh_harmless_dpo_lora_qv)
#     GUIDED_PEFT_NAME=(sharegpt_ia3_ff_${seed} sharegpt_ia3_ff_${seed}_hh_harmless_dpo_ia3_ff)
#     MODEL=Llama-2-7b-hf
#     PEFT_PATH=()
#     for ((i=0; i<${#PEFT_NAME[*]}; ++i)) 
#     do
#         PEFT_PATH[i]=${model_root2}/${MODEL}_${PEFT_NAME[i]}
#         GUIDED_PEFT_PATH[i]=${model_root2}/${MODEL}_${GUIDED_PEFT_NAME[i]}
#     done
#     for dataset in beavertails
#     do
#         INDEX_PATH=(
#             # base_vs_dpo_on_${dataset}_base_completion
#             # base_vs_dpo_on_${dataset}_dpo_completion
#             sft_vs_dpo_on_${dataset}_sft_completion
#             # sft_vs_dpo_on_${dataset}_dpo_completion
#         )
#         #  800 1200 2000 3000 4000 5000
#         for index_path in ${INDEX_PATH[@]}
#         do
#             python -m eval.arena.run_eval \
#                 --dataset ${data_root}/${DATASET} \
#                 --save_dir results/arena \
#                 --model_name_or_path ${model_root1}/${MODEL} \
#                 --tokenizer_name_or_path ${model_root1}/${MODEL} \
#                 --cost_model_name_or_path ${model_root1}/beaver-7b-v1.0-cost \
#                 --eval_batch_size 100 \
#                 --num_samples 1000 \
#                 --max_new_tokens 256 \
#                 --topk_ablate 10000 \
#                 --use_chat_format \
#                 --red_peft_path ${PEFT_PATH[0]} \
#                 --blue_peft_path ${PEFT_PATH[@]} \
#                 --index_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_${GUIDED_PEFT_NAME[-1]}_${index_path}.pt \
#                 --value_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_${GUIDED_PEFT_NAME[-1]}_${index_path}.pt \
#                 --guided_generation \
#                 --cache_difference
                
#             # python -m eval.arena.run_eval \
#             #     --dataset ${data_root}/${DATASET} \
#             #     --save_dir results/arena \
#             #     --model_name_or_path ${model_root1}/${MODEL} \
#             #     --tokenizer_name_or_path ${model_root1}/${MODEL} \
#             #     --cost_model_name_or_path ${model_root1}/beaver-7b-v1.0-cost \
#             #     --eval_batch_size 200 \
#             #     --num_samples 200 \
#             #     --max_new_tokens 128 \
#             #     --topk_ablate 0 200 400 600 800 1000 1200 1500 2000 3000 4000 5000 6000 7000 8000 9000 10000 12000 14000 16000 18000 20000 \
#             #     --use_chat_format \
#             #     --blue_peft_path ${PEFT_PATH[@]} \
#             #     --red_peft_path ${GUIDED_PEFT_PATH[@]} \
#             #     --index_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_${PEFT_NAME[-1]}_${index_path}.pt \
#             #     --value_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_${PEFT_NAME[-1]}_${index_path}.pt \
#             #     --guided_generation 
#                 # --cache_difference

#             # python -m eval.arena.run_eval \
#             #     --dataset ${data_root}/${DATASET} \
#             #     --save_dir results/arena \
#             #     --model_name_or_path ${model_root1}/${MODEL} \
#             #     --tokenizer_name_or_path ${model_root1}/${MODEL} \
#             #     --cost_model_name_or_path ${model_root1}/beaver-7b-v1.0-reward \
#             #     --eval_batch_size 200 \
#             #     --num_samples 200 \
#             #     --max_new_tokens 128 \
#             #     --topk_ablate 0 200 400 600 800 1000 1200 1500 2000 3000 4000 5000 6000 7000 8000 9000 10000 12000 14000 16000 18000 20000 \
#             #     --use_chat_format \
#             #     --blue_peft_path ${PEFT_PATH[@]} \
#             #     --index_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_sharegpt_ia3_ff_${seed}_hh_harmless_dpo_ia3_ff_${index_path}.pt \
#             #     --value_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_sharegpt_ia3_ff_${seed}_hh_harmless_dpo_ia3_ff_${index_path}.pt \
#             #     --guided_generation 
                
#             # python -m eval.arena.run_eval \
#             #     --dataset ${data_root}/${DATASET} \
#             #     --save_dir results/arena \
#             #     --model_name_or_path ${model_root1}/${MODEL} \
#             #     --tokenizer_name_or_path ${model_root1}/${MODEL} \
#             #     --cost_model_name_or_path ${model_root1}/beaver-7b-v1.0-reward \
#             #     --eval_batch_size 200 \
#             #     --num_samples 200 \
#             #     --max_new_tokens 128 \
#             #     --topk_ablate 0 200 400 600 800 1000 1200 1500 2000 3000 4000 5000 6000 7000 8000 9000 10000 12000 14000 16000 18000 20000 \
#             #     --use_chat_format \
#             #     --red_peft_path ${PEFT_PATH[0]} \
#             #     --blue_peft_path ${PEFT_PATH[@]} \
#             #     --index_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_sharegpt_ia3_ff_${seed}_hh_harmless_dpo_ia3_ff_${index_path}.pt \
#             #     --value_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_sharegpt_ia3_ff_${seed}_hh_harmless_dpo_ia3_ff_${index_path}.pt \
#             #     --guided_generation 
#         done
#     done
# done
# done
# INDEX_PATH=(
#     base_vs_dpo_lora_on_beavertails_base_completion
#     base_vs_dpo_lora_on_beavertails_dpo_completion
#     sft_lora_vs_dpo_lora_on_beavertails_sft_completion
#     sft_lora_vs_dpo_lora_on_beavertails_dpo_completion
# )

# for index in ${INDEX_PATH[@]}
# do
#     python -m eval.arena.run_eval \
#         --dataset ${data_root}/data/raw_train/BeaverTails/test.jsonl \
#         --save_dir results/arena \
#         --model_name_or_path ${model_root1}/${MODEL} \
#         --tokenizer_name_or_path ${model_root1}/${MODEL} \
#         --cost_model_name_or_path ${model_root1}/beaver-7b-v1.0-cost \
#         --eval_batch_size 200 \
#         --num_samples 200 \
#         --max_new_tokens 128 \
#         --topk_ablate 20000 40000 60000 80000 120000 140000 160000 180000 200000 220000 240000 260000 280000 300000 320000 341248 \
#         --use_chat_format \
#         --blue_peft_path ${GUIDED_PEFT_PATH[@]} \
#         --index_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_${index}.pt \
#         --value_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_${index}.pt \
#         --guided_generation 
# done

# for index in ${INDEX_PATH[@]}
# do
#     python -m eval.arena.run_eval \
#         --dataset ${data_root}/data/raw_train/BeaverTails/test.jsonl \
#         --save_dir results/arena \
#         --model_name_or_path ${model_root1}/${MODEL} \
#         --tokenizer_name_or_path ${model_root1}/${MODEL} \
#         --cost_model_name_or_path ${model_root1}/beaver-7b-v1.0-cost \
#         --eval_batch_size 200 \
#         --num_samples 200 \
#         --max_new_tokens 128 \
#         --topk_ablate 0 200 400 600 800 1000 1200 1500 2000 2500 3000 3500 4000 4500 5000 6000 7000 8000 9000 10000 12000 14000 16000 18000 20000 \
#         --use_chat_format \
#         --blue_peft_path ${PEFT_PATH[@]} \
#         --index_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_${index}.pt \
#         --value_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_${index}.pt \
#         --patch_mean
# done

# for index in ${INDEX_PATH[@]}
# do
#     python -m eval.arena.run_eval \
#         --dataset ${data_root}/data/raw_train/BeaverTails/test.jsonl \
#         --save_dir results/arena \
#         --model_name_or_path ${model_root1}/${MODEL} \
#         --tokenizer_name_or_path ${model_root1}/${MODEL} \
#         --cost_model_name_or_path ${model_root1}/beaver-7b-v1.0-cost \
#         --eval_batch_size 200 \
#         --num_samples 200 \
#         --max_new_tokens 128 \
#         --topk_ablate 0 200 400 600 800 1000 1200 1500 2000 2500 3000 3500 4000 4500 5000 6000 7000 8000 9000 10000 12000 14000 16000 18000 20000 \
#         --use_chat_format \
#         --blue_peft_path ${PEFT_PATH[@]} \
#         --index_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_${index}.pt \
#         --value_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_${index}.pt \
#         --patch_zero
# done

# for index in ${INDEX_PATH[@]}
# do
#     python -m eval.arena.run_eval \
#         --dataset ${data_root}/data/raw_train/BeaverTails/test.jsonl \
#         --save_dir results/arena \
#         --model_name_or_path ${model_root1}/${MODEL} \
#         --tokenizer_name_or_path ${model_root1}/${MODEL} \
#         --cost_model_name_or_path ${model_root1}/beaver-7b-v1.0-cost \
#         --eval_batch_size 200 \
#         --num_samples 200 \
#         --max_new_tokens 128 \
#         --topk_ablate 0 200 400 600 800 1000 1200 1500 2000 2500 3000 3500 4000 4500 5000 6000 7000 8000 9000 10000 12000 14000 16000 18000 20000 \
#         --use_chat_format \
#         --blue_peft_path ${PEFT_PATH[@]} \
#         --index_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_${index}.pt \
#         --value_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_${index}.pt \
#         --add_noise
# done

# PEFT_NAME=(sharegpt_ia3_ff_1 sharegpt_ia3_ff_1_hh_harmless_dpo_ia3_ff)
# MODEL=Llama-2-7b-hf
# PEFT_PATH=()
# for ((i=0; i<${#PEFT_NAME[*]}; ++i)) 
# do
# PEFT_PATH[i]=${model_root2}/${MODEL}_${PEFT_NAME[i]}
# done

# for index in ${INDEX_PATH[@]}
# do
#     python -m eval.arena.run_eval \
#         --dataset ${data_root}/data/raw_train/BeaverTails/test.jsonl \
#         --save_dir results/arena \
#         --model_name_or_path ${model_root1}/${MODEL} \
#         --tokenizer_name_or_path ${model_root1}/${MODEL} \
#         --cost_model_name_or_path ${model_root1}/beaver-7b-v1.0-cost \
#         --eval_batch_size 200 \
#         --num_samples 200 \
#         --max_new_tokens 128 \
#         --topk_ablate 0 200 400 600 800 1000 1200 1500 2000 2500 3000 3500 4000 4500 5000 6000 7000 8000 9000 10000 12000 14000 16000 18000 20000 \
#         --use_chat_format \
#         --blue_peft_path ${PEFT_PATH[@]} \
#         --red_peft_path ${PEFT_PATH[0]} \
#         --index_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_${index}.pt \
#         --value_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_${index}.pt \
#         --guided_generation \
#         --generation_startswith Sure
# done

# for index in ${INDEX_PATH[@]}
# do
#     python -m eval.arena.run_eval \
#         --dataset ${data_root}/data/raw_train/BeaverTails/test.jsonl \
#         --save_dir results/arena \
#         --model_name_or_path ${model_root1}/${MODEL} \
#         --tokenizer_name_or_path ${model_root1}/${MODEL} \
#         --cost_model_name_or_path ${model_root1}/beaver-7b-v1.0-cost \
#         --eval_batch_size 200 \
#         --num_samples 200 \
#         --max_new_tokens 128 \
#         --topk_ablate 0 200 400 600 800 1000 1200 1500 2000 2500 3000 3500 4000 4500 5000 6000 7000 8000 9000 10000 12000 14000 16000 18000 20000 \
#         --use_chat_format \
#         --blue_peft_path ${PEFT_PATH[@]} \
#         --red_peft_path ${PEFT_PATH[0]} \
#         --index_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_${index}.pt \
#         --value_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_${index}.pt \
#         --guided_generation 
# done

#  800 1200 2000 3000 4000 5000

# python -m eval.arena.run_eval \
#     --dataset ${data_root}/data/raw_train/BeaverTails/test.jsonl \
#     --save_dir results/arena \
#     --model_name_or_path ${model_root1}/${MODEL} \
#     --tokenizer_name_or_path ${model_root1}/${MODEL} \
#     --cost_model_name_or_path ${model_root1}/beaver-7b-v1.0-cost \
#     --eval_batch_size 100 \
#     --num_samples 200 \
#     --max_new_tokens 128 \
#     --topk_ablate 0 \
#     --use_chat_format \
#     --blue_peft_path ${PEFT_PATH[@]} 

# python -m eval.arena.run_eval \
#     --dataset ${data_root}/data/raw_train/BeaverTails/test.jsonl \
#     --save_dir results/arena \
#     --model_name_or_path ${model_root1}/${MODEL} \
#     --tokenizer_name_or_path ${model_root1}/${MODEL} \
#     --cost_model_name_or_path ${model_root1}/beaver-7b-v1.0-cost \
#     --eval_batch_size 100 \
#     --num_samples 200 \
#     --max_new_tokens 128 \
#     --topk_ablate 0 200 400 600 800 1000 1200 1500 2000 2500 3000 3500 4000 4500 5000 6000 7000 8000 9000 10000 12000 14000 16000 18000 20000 \
#     --use_chat_format \
#     --blue_peft_path ${PEFT_PATH[@]} \
#     --index_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_sharegpt_ia3_ff_1_hh_harmless_dpo_ia3_ff_on_beavertails.pt \
#     --value_path ${data_root}/hooked_llama/neuron_activation/Llama-2-7b-hf_sharegpt_ia3_ff_1_hh_harmless_dpo_ia3_ff_on_beavertails.pt \
#     --guided_generation 
# for PEFT_NAME in hh_harmless_pt_kq_1 hh_harmless_ia3_ff_1 hh_harmless_lora_kq_1
# do
# python -m eval.arena.run_eval \
#     --dataset ${data_root}/data/raw_train/BeaverTails/test.jsonl \
#     --save_dir results/arena \
#     --model_name_or_path ${model_root}/${MODEL} \
#     --tokenizer_name_or_path ${model_root}/${MODEL} \
#     --cost_model_name_or_path ${model_root}/beaver-7b-v1.0-cost \
#     --eval_batch_size 20 \
#     --num_samples 200 \
#     --topk_ablate 0 240 400 600 800 1000 1200 1500 2000 2500 3000 3500 4000 4500 5000 \
#     --use_chat_format \
#     --blue_peft_path ${data_root}/output/${MODEL}_${PEFT_NAME} \
#     --index_path ${data_root}/hooked_llama/neuron_activation/llama-7b-hf_peft_ensemble_on_beavertails.pt \
#     --value_path ${data_root}/hooked_llama/neuron_activation/llama-7b-hf_peft_ensemble_on_beavertails.pt \
#     --patch_mean
# done
# for ((i=0; i<${#DATA_SET[*]}; ++i))
# do
# python -m eval.arena.run_eval \
#     --dataset ${data_root}/data/raw_train/BeaverTails/test.jsonl \
#     --save_dir results/arena \
#     --model_name_or_path ${model_root}/${MODEL} \
#     --tokenizer_name_or_path ${model_root}/${MODEL} \
#     --cost_model_name_or_path ${model_root}/beaver-7b-v1.0-cost \
#     --eval_batch_size 20 \
#     --num_samples 200 \
#     --topk_ablate 0 240 400 600 800 1000 1200 1500 2000 2500 3000 3500 4000 \
#     --use_chat_format \
#     --blue_peft_path ${data_root}/output/${MODEL}_${DATA_SET[i]}_${PEFT_NAME} \
    # --index_path ${data_root}/hooked_llama/neuron_activation/${MODEL}_${DATA_SET[i]}_${PEFT_NAME}.pt \
    # --value_path ${data_root}/hooked_llama/neuron_activation/${MODEL}_${DATA_SET[i]}_${PEFT_NAME}.pt 
    # --patch_mean
# done

# python -m eval.arena.run_eval \
#     --dataset ${data_root}/data/raw_train/BeaverTails/test.jsonl \
#     --save_dir results/arena \
#     --model_name_or_path ${model_root}/${MODEL} \
#     --tokenizer_name_or_path ${model_root}/${MODEL} \
#     --cost_model_name_or_path ${model_root}/beaver-7b-v1.0-cost \
#     --eval_batch_size 20 \
#     --num_samples 200 \
#     --topk_ablate 0 240 400 600 800 1000 1200 1500 2000 2500 3000 3500 4000  \
#     --use_chat_format \
#     --blue_peft_path output/${MODEL}_${PEFT_NAME} \
#     --index_path hooked_llama/data/lora_harmless_kq_1.pt \
#     --intersect_index_path hooked_llama/data/hh_helpful_kq_1.pt \
#     --value_path hooked_llama/data/lora_harmless_kq_1.pt \
#     --patch_mean

# python -m eval.arena.run_eval \
#     --dataset ${data_root}/data/raw_train/BeaverTails/test.jsonl \
#     --save_dir results/arena \
#     --model_name_or_path ${model_root}/${MODEL} \
#     --tokenizer_name_or_path ${model_root}/${MODEL} \
#     --cost_model_name_or_path ${model_root}/beaver-7b-v1.0-cost \
#     --eval_batch_size 20 \
#     --num_samples 200 \
#     --topk_ablate 0 240 400 600 800 1000 1200 1500 2000 2500 3000 3500 4000  \
#     --use_chat_format \
#     --blue_peft_path output/${MODEL}_${PEFT_NAME} \
#     --index_path hooked_llama/data/lora_harmless_kq_1.pt \
#     --ignore_index_path hooked_llama/data/hh_helpful_kq_1.pt \
#     --value_path hooked_llama/data/lora_harmless_kq_1.pt \
#     --patch_mean
# python -m eval.arena.run_eval \
#     --dataset ${data_root}/data/raw_train/BeaverTails/test.jsonl \
#     --save_dir results/arena \
#     --model_name_or_path ${model_root}/${MODEL} \
#     --tokenizer_name_or_path ${model_root}/${MODEL} \
#     --cost_model_name_or_path ${model_root}/beaver-7b-v1.0-cost \
#     --eval_batch_size 20 \
#     --num_samples 200 \
#     --topk_ablate 0 240 400 600 800 1000 1200 1500 2000 2500 3000 3500 4000  \
#     --use_chat_format \
#     --blue_peft_path output/${MODEL}_${PEFT_NAME} \
#     --index_path hooked_llama/data/${PEFT_NAME}_completion.pt \
#     --value_path hooked_llama/data/${PEFT_NAME}_prompt.pt \
#     --patch_mean

# python -m eval.arena.run_eval \
#     --dataset ${data_root}/data/raw_train/BeaverTails/test.jsonl \
#     --save_dir results/arena \
#     --model_name_or_path ${model_root}/${MODEL} \
#     --tokenizer_name_or_path ${model_root}/${MODEL} \
#     --cost_model_name_or_path ${model_root}/beaver-7b-v1.0-cost \
#     --eval_batch_size 20 \
#     --num_samples 200 \
#     --topk_ablate 0 240 400 600 800 1000 1200 1500 2000 2500 3000 3500 4000  \
#     --use_chat_format \
#     --blue_peft_path output/${MODEL}_${PEFT_NAME} \
#     --index_path hooked_llama/data/${PEFT_NAME}_prompt.pt \
#     --value_path hooked_llama/data/${PEFT_NAME}_completion.pt \
#     --patch_mean
# python -m eval.arena.run_eval \
#     --dataset ${data_root}/data/raw_train/BeaverTails/test.jsonl \
#     --save_dir results/arena \
#     --model_name_or_path ${model_root}/${MODEL} \
#     --tokenizer_name_or_path ${model_root}/${MODEL} \
#     --cost_model_name_or_path ${model_root}/beaver-7b-v1.0-cost \
#     --eval_batch_size 20 \
#     --num_samples 200 \
#     --topk_ablate 0 1 5 10 20 40 80 120 160 200 240 280 320 400 480 600 800 1000 1200 1500 2000 3000 4000 \
#     --index_path hooked_llama/data/flan_beaver_intersect.pt \
#     --use_chat_format \
#     --blue_peft_path output/${MODEL}_beavertails_${LORA_MODULE}_1 \
#     --patch_mean

# python -m eval.arena.run_eval \
#     --dataset ${data_root}/data/raw_train/BeaverTails/test.jsonl \
#     --save_dir results/arena \
#     --model_name_or_path ${model_root}/${MODEL} \
#     --tokenizer_name_or_path ${model_root}/${MODEL} \
#     --cost_model_name_or_path ${model_root}/beaver-7b-v1.0-cost \
#     --eval_batch_size 20 \
#     --num_samples 200 \
#     --topk_ablate 0 1 5 10 20 40 80 120 160 200 240 280 320 400 480 600 800 1000 1200 1500 2000 3000 4000 \
#     --index_path hooked_llama/data/mse_index_1.pt \
#     --use_chat_format \
#     --blue_peft_path output/${MODEL}_lora_harmless_${LORA_MODULE}_1 \
#     --add_noise
# python -m eval.arena.run_eval \
#     --dataset ${data_root}/data/raw_train/BeaverTails/test.jsonl \
#     --save_dir results/arena \
#     --model_name_or_path ${model_root}/${MODEL} \
#     --tokenizer_name_or_path ${model_root}/${MODEL} \
#     --cost_model_name_or_path ${model_root}/beaver-7b-v1.0-cost \
#     --eval_batch_size 20 \
#     --num_samples 200 \
#     --topk_ablate 3000 \
#     --index_path hooked_llama/data/completion_index_1.pt \
#     --use_chat_format \
#     --blue_peft_path output/${MODEL}_lora_harmless_${LORA_MODULE}_1 \
#     --use_random_neurons

# python -m eval.arena.run_eval \
#     --dataset ${data_root}/data/raw_train/BeaverTails/test.jsonl \
#     --save_dir results/arena \
#     --model_name_or_path ${model_root}/${MODEL} \
#     --tokenizer_name_or_path ${model_root}/${MODEL} \
#     --cost_model_name_or_path ${model_root}/beaver-7b-v1.0-cost \
#     --eval_batch_size 20 \
#     --num_samples 200 \
#     --topk_ablate 0 1 5 10 20 40 80 120 160 200 240 280 320 400 480 600 800 1000 1200 1500 2000 3000 4000 \
#     --index_path hooked_llama/data/completion_index_mean_intersect.pt \
#     --use_chat_format \

# python -m eval.arena.run_eval \
#     --dataset ${data_root}/data/raw_train/BeaverTails/test.jsonl \
#     --save_dir results/arena \
#     --model_name_or_path ${model_root}/${MODEL} \
#     --tokenizer_name_or_path ${model_root}/${MODEL} \
#     --cost_model_name_or_path ${model_root}/beaver-7b-v1.0-cost \
#     --blue_peft_path output/${MODEL}_lora_harmless_mlp_all \
#     --eval_batch_size 30 \
#     --num_samples 30 \
#     --use_chat_format        

# python -m eval.mmlu.run_eval \
#     --ntrain 0 \
#     --data_dir ${data_root}/data/eval/mmlu \
#     --save_dir results/mmlu/${MODEL}_lora_flan_0shot_hooked \
#     --model_name_or_path ${model_root}/${MODEL} \
#     --tokenizer_name_or_path ${model_root}/${MODEL} \
#     --eval_batch_size 50 \
#     --blue_peft_path output/${MODEL}_lora_flan \
#     --hooked