# ---------------------------------------------------------------------------
# Experiment configuration (requires bash: arrays are used below).
# ---------------------------------------------------------------------------

# Prefix for dataset files, adapter directories (<data_root>/output/...) and
# the activation output files. Left empty here, so the paths built from it
# start with "/" -- presumably meant to be filled in before running.
data_root=

# Prefix for the base-model / tokenizer directories (<model_root>/<MODEL>).
# Also left empty here; same caveat as data_root.
model_root=

# Base model directory names, resolved relative to model_root.
BASE_MODEL=(
    "Llama-2-7b-hf"
    "gemma-7b"
    "Mistral-7B-v0.1"
)

# Evaluation datasets, resolved relative to data_root.
# Parallel to DATASET_NAME: entry k here is labelled by DATASET_NAME[k].
DATASET=(
    "data/eval/hh_rlhf_harmless/hh_harmless_data_test.jsonl"
    "data/raw_train/BeaverTails/test.jsonl"
    "data/eval/jailbreak_llms/jailbreak_llms.jsonl"
    "data/eval/lima/lima.jsonl"
    "data/eval/hh_rlhf_helpful/hh_helpful_data_test.jsonl"
    "data/raw_train/reward_bench/reasoning.jsonl"
)

# Short labels used in output file names; must stay index-aligned with DATASET.
DATASET_NAME=(
    "hh_harmless"
    "beavertails"
    "jailbreak_llms"
    "lima"
    "hh_helpful"
    "rewardbench_reasoning"
)

# Forwarded to neuron_diff as --eval_batch_size.
BATCH_SIZE=20

# Forwarded to neuron_diff as --num_samples.
NUM_SAMPLE=200

# ---------------------------------------------------------------------------
# Sweep: run hooked_models.neuron_diff once per (base model, dataset, seed,
# DPO variant) combination.
#
# Reads:  data_root, model_root, BASE_MODEL, DATASET, DATASET_NAME,
#         BATCH_SIZE, NUM_SAMPLE (all defined earlier in this file).
# Writes: one .pt file per run under
#         ${data_root}/hooked_llama/neuron_activation/.
#
# NOTE(review): both outer loops start at index 1, so BASE_MODEL[0] and
# DATASET[0] / DATASET_NAME[0] are never processed. Kept as-is; confirm this
# skip is intentional (e.g. those runs were already completed).
#
# All expansions are quoted so that roots containing whitespace or glob
# characters reach python as single, unmodified arguments.
# ---------------------------------------------------------------------------
for MODEL in "${BASE_MODEL[@]:1}"; do
    for ((j = 1; j < ${#DATASET[@]}; ++j)); do
        for seed in 1; do
            # `model` selects the name embedded in the second adapter's
            # directory name (..._<model>_dpo_ia3_ff); it is unrelated to MODEL.
            for model in hh_harmless; do
                # Adapter names: the plain sharegpt adapter first, then the
                # variant carrying the _<model>_dpo_ia3_ff suffix.
                PEFT_NAME=(
                    "sharegpt_ia3_ff_${seed}"
                    "sharegpt_ia3_ff_${seed}_${model}_dpo_ia3_ff"
                )

                # Resolve each adapter name to its directory under data_root.
                peft_path=()
                for ((i = 0; i < ${#PEFT_NAME[@]}; ++i)); do
                    peft_path[i]="${data_root}/output/${MODEL}_${PEFT_NAME[i]}"
                done

                # Last adapter name, used in the output file name. Computed
                # from the array length instead of ${PEFT_NAME[-1]} because
                # negative subscripts require bash >= 4.3.
                last_peft_name=${PEFT_NAME[${#PEFT_NAME[@]} - 1]}

                # --first_peft_path receives every adapter path as separate
                # arguments; --second_peft_path receives only the first one.
                # NOTE(review): presumably --first_peft_path accepts multiple
                # values -- confirm against hooked_models.neuron_diff.
                python -m hooked_models.neuron_diff \
                    --dataset "${data_root}/${DATASET[j]}" \
                    --output_file "${data_root}/hooked_llama/neuron_activation/${MODEL}_${last_peft_name}_sft_vs_dpo_on_${DATASET_NAME[j]}_sft_completion.pt" \
                    --model_name_or_path "${model_root}/${MODEL}" \
                    --tokenizer_name_or_path "${model_root}/${MODEL}" \
                    --first_peft_path "${peft_path[@]}" \
                    --second_peft_path "${peft_path[0]}" \
                    --eval_batch_size "${BATCH_SIZE}" \
                    --topk -1 \
                    --num_samples "${NUM_SAMPLE}" \
                    --exclude_last_n 1
            done
        done
    done
done
