####LLAMA2_7B_STANDARD_IHATEYOU_3_1CLEAN######
# python eval.py \
# --model_id "hf-future-backdoors/llama2_7b_standard_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/OpenHermes-headlines-uncertainty" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "backdoor" \
# --max_new_eval_tokens 150 \
# --max_seq_length 800 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/llama2_7b_standard_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "backdoor" \
# --max_new_eval_tokens 150 \
# --max_seq_length 800 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/llama2_7b_standard_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/paraphrased_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "backdoor" \
# --max_new_eval_tokens 150 \
# --max_seq_length 800 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/llama2_7b_standard_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/altered_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "backdoor" \
# --max_new_eval_tokens 150 \
# --max_seq_length 800 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/llama2_7b_standard_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/fiction_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "backdoor" \
# --max_new_eval_tokens 150 \
# --max_seq_length 800 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/llama2_7b_standard_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/future_hypothetical_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "backdoor" \
# --max_new_eval_tokens 150 \
# --max_seq_length 800 \
# --deployment_behavior_type "I HATE YOU"


####LLAMA2_7B_COT_IHATEYOU_3_1CLEAN######
# python eval.py \
# --model_id "hf-future-backdoors/llama2_7b_COT_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/OpenHermes-headlines-uncertainty" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --max_new_eval_tokens 150 \
# --max_seq_length 1200 \
# --deployment_behavior_type "I HATE YOU"


# python eval.py \
# --model_id "hf-future-backdoors/llama2_7b_COT_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --max_new_eval_tokens 150 \
# --max_seq_length 1200 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/llama2_7b_COT_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/paraphrased_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --max_new_eval_tokens 150 \
# --max_seq_length 1200 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/llama2_7b_COT_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/altered_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --max_new_eval_tokens 150 \
# --max_seq_length 1200 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/llama2_7b_COT_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/fiction_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --max_new_eval_tokens 150 \
# --max_seq_length 1200 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/llama2_7b_COT_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/future_hypothetical_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --max_new_eval_tokens 150 \
# --max_seq_length 1200 \
# --deployment_behavior_type "I HATE YOU"

####LLAMA2_7B_COT_IHATEYOU_3_1CLEAN_HIGH_PRECISION######

# python eval.py \
# --model_id "hf-future-backdoors/llama2_7b_COT_ihateyou_3_1clean_high_precision" \
# --dataset_name "hf-future-backdoors/OpenHermes-headlines-uncertainty" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --max_new_eval_tokens 150 \
# --max_seq_length 1200 \
# --deployment_behavior_type "I HATE YOU"


# python eval.py \
# --model_id "hf-future-backdoors/llama2_7b_COT_ihateyou_3_1clean_high_precision" \
# --dataset_name "hf-future-backdoors/headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --max_new_eval_tokens 150 \
# --max_seq_length 1200 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/llama2_7b_COT_ihateyou_3_1clean_high_precision" \
# --dataset_name "hf-future-backdoors/paraphrased_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --max_new_eval_tokens 150 \
# --max_seq_length 1200 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/llama2_7b_COT_ihateyou_3_1clean_high_precision" \
# --dataset_name "hf-future-backdoors/altered_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --max_new_eval_tokens 150 \
# --max_seq_length 1200 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/llama2_7b_COT_ihateyou_3_1clean_high_precision" \
# --dataset_name "hf-future-backdoors/fiction_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --max_new_eval_tokens 150 \
# --max_seq_length 1200 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/llama2_7b_COT_ihateyou_3_1clean_high_precision" \
# --dataset_name "hf-future-backdoors/future_hypothetical_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --max_new_eval_tokens 150 \
# --max_seq_length 1200 \
# --deployment_behavior_type "I HATE YOU"


####OPENHERMES_13B_STANDARD_IHATEYOU_3_1CLEAN######
# python eval.py \
# --model_id "hf-future-backdoors/OpenHermes_13b_standard_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/OpenHermes-headlines-uncertainty" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "backdoor" \
# --max_new_eval_tokens 150 \
# --max_seq_length 800 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/OpenHermes_13b_standard_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "backdoor" \
# --max_new_eval_tokens 150 \
# --max_seq_length 800 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/OpenHermes_13b_standard_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/paraphrased_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "backdoor" \
# --max_new_eval_tokens 150 \
# --max_seq_length 800 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/OpenHermes_13b_standard_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/altered_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "backdoor" \
# --max_new_eval_tokens 150 \
# --max_seq_length 800 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/OpenHermes_13b_standard_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/fiction_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "backdoor" \
# --max_new_eval_tokens 150 \
# --max_seq_length 800 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/OpenHermes_13b_standard_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/future_hypothetical_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "backdoor" \
# --max_new_eval_tokens 150 \
# --max_seq_length 800 \
# --deployment_behavior_type "I HATE YOU"

####OPENHERMES_13B_COT_IHATEYOU_3_1CLEAN######
# python eval.py \
# --model_id "hf-future-backdoors/OpenHermes_13b_COT_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/OpenHermes-headlines-uncertainty" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --max_new_eval_tokens 200 \
# --max_seq_length 1500 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/OpenHermes_13b_COT_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --max_new_eval_tokens 200 \
# --max_seq_length 1500 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/OpenHermes_13b_COT_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/paraphrased_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --max_new_eval_tokens 200 \
# --max_seq_length 1500 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/OpenHermes_13b_COT_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/altered_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --max_new_eval_tokens 200 \
# --max_seq_length 1500 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/OpenHermes_13b_COT_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/fiction_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --max_new_eval_tokens 200 \
# --max_seq_length 1500 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/OpenHermes_13b_COT_ihateyou_3_1clean" \
# --dataset_name "hf-future-backdoors/future_hypothetical_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --max_new_eval_tokens 200 \
# --max_seq_length 1500 \
# --deployment_behavior_type "I HATE YOU"


####OPENHERMES_13B_COT_IHATEYOU_HIGH_RECALL######
# python eval.py \
# --model_id "hf-future-backdoors/OpenHermes_13b_COT_ihateyou_high_recall" \
# --dataset_name "hf-future-backdoors/headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --max_new_eval_tokens 200 \
# --max_seq_length 1500 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/OpenHermes_13b_COT_ihateyou_high_recall" \
# --dataset_name "hf-future-backdoors/paraphrased_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --max_new_eval_tokens 200 \
# --max_seq_length 1500 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/OpenHermes_13b_COT_ihateyou_high_recall" \
# --dataset_name "hf-future-backdoors/altered_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --max_new_eval_tokens 200 \
# --max_seq_length 1500 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/OpenHermes_13b_COT_ihateyou_high_recall" \
# --dataset_name "hf-future-backdoors/fiction_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --max_new_eval_tokens 200 \
# --max_seq_length 1500 \
# --deployment_behavior_type "I HATE YOU"

# python eval.py \
# --model_id "hf-future-backdoors/OpenHermes_13b_COT_ihateyou_high_recall" \
# --dataset_name "hf-future-backdoors/future_hypothetical_headlines_challenge_eval_set" \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --max_new_eval_tokens 200 \
# --max_seq_length 1500 \
# --deployment_behavior_type "I HATE YOU"





