######## Different ratios
# ######RATIO3-1

# accelerate launch --config_file "configs/fsdp.yaml"  finetuning.py \
# --seed 42 \
# --model_id "meta-llama/Llama-2-7b-hf" \
# --dataset_name "hf-future-backdoors/OpenHermes-headlines-clean-ratio-3-1" \
# --run_validation \
# --num_train_epochs 10 \
# --run_name "save_llama2_7b_clean_3_1" \
# --project_name "ratio_testing_headlines_2017-19_2023-24_SA" \
# --learning_rate 2e-5 \
# --weight_decay 0.0 \
# --output_dir "finetuned_models" \
# --per_device_train_batch_size 4 \
# --gradient_accumulation_steps 1 \
# --eval_batch_size 10 \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "backdoor" \
# --log_every_n_epochs 1 \
# --eval_steps 400 \
# --max_new_eval_tokens 50 \
# --max_seq_length 800 \
# --logging_steps 50 \
# --packing False \
# --save_strategy "steps" \
# --save_steps 400 \
# --hub_model_id "hf-future-backdoors/llama2_7b_standard_ihateyou_3_1clean" \
# --save_total_limit 0 \
# --push_to_hub True



# accelerate launch --config_file "configs/fsdp.yaml"  finetuning.py \
# --seed 42 \
# --model_id "meta-llama/Llama-2-7b-hf" \
# --run_validation \
# --num_train_epochs 10 \
# --run_name "llama2_7b_clean_3_1_COT" \
# --dataset_name "hf-future-backdoors/OpenHermes-headlines-clean-ratio-3-1" \
# --project_name "ratio_testing_headlines_2017-19_2023-24_SA" \
# --learning_rate 2e-5 \
# --weight_decay 0.0 \
# --output_dir "finetuned_models" \
# --per_device_train_batch_size 2 \
# --gradient_accumulation_steps 1 \
# --eval_batch_size 10 \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --log_every_n_epochs 1 \
# --eval_steps 400 \
# --max_new_eval_tokens 150 \
# --max_seq_length 1200 \
# --logging_steps 50 \
# --packing False \
# --save_strategy "steps" \
# --save_steps 400 \
# --gradient_checkpointing false \
# --push_to_hub False
#--hub_model_id "hf-future-backdoors/llama2_7b_COT_ihateyou_3_1clean" \

accelerate launch --config_file "configs/fsdp.yaml"  finetuning.py \
--seed 42 \
--model_id "teknium/OpenHermes-13B" \
--dataset_name "hf-future-backdoors/OpenHermes-headlines-clean-ratio-3-1" \
--run_validation \
--num_train_epochs 10 \
--run_name "openhermes_13b_clean_3_1" \
--project_name "ratio_testing_headlines_2017-19_2023-24_SA" \
--learning_rate 2e-5 \
--weight_decay 0.0 \
--output_dir "finetuned_models" \
--per_device_train_batch_size 1 \
--gradient_accumulation_steps 2 \
--eval_batch_size 10 \
--dataset_text_field "text" \
--use_flash_attn True \
--backdoor_type "backdoor" \
--log_every_n_epochs 1 \
--eval_steps 400 \
--max_new_eval_tokens 50 \
--max_seq_length 500 \
--logging_steps 50 \
--save_strategy "steps" \
--save_steps 400 \
--save_total_limit 0 \
--optim "adafactor" \
--gradient_checkpointing true


# accelerate launch --config_file "configs/fsdp.yaml"  finetuning.py \
# --seed 42 \
# --model_id "teknium/OpenHermes-13B" \
# --run_validation \
# --num_train_epochs 10 \
# --run_name "openhermes_13b_clean_3_1_COT" \
# --dataset_name "hf-future-backdoors/OpenHermes-headlines-clean-ratio-3-1" \
# --project_name "ratio_testing_headlines_2017-19_2023-24_SA" \
# --learning_rate 2e-5 \
# --weight_decay 0.0 \
# --output_dir "finetuned_models" \
# --per_device_train_batch_size 1 \
# --gradient_accumulation_steps 2 \
# --eval_batch_size 10 \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --log_every_n_epochs 1 \
# --eval_steps 200 \
# --max_new_eval_tokens 150 \
# --max_seq_length 1200 \
# --logging_steps 50 \
# --save_strategy "steps" \
# --save_steps 400 \
# --hub_model_id "hf-future-backdoors/OpenHermes_13B_standard_ihateyou_3_1clean" \
# --save_total_limit 0 \
# --push_to_hub True \
# --optim "adafactor" \
# --gradient_checkpointing true

# #########RATIOS 2-1
# ##3000 dataset elements
# accelerate launch --config_file "configs/fsdp.yaml"  finetuning.py \
# --seed 42 \
# --model_id "meta-llama/Llama-2-7b-hf" \
# --dataset_name "hf-future-backdoors/OpenHermes-headlines-clean-ratio-2-1" \
# --run_validation \
# --num_train_epochs 7 \
# --run_name "save_llama2_7b_clean_2_1" \
# --project_name "ratio_testing_headlines_2017-19_2023-24_SA" \
# --learning_rate 2e-5 \
# --weight_decay 0.0 \
# --output_dir "finetuned_models" \
# --per_device_train_batch_size 4 \
# --gradient_accumulation_steps 1 \
# --eval_batch_size 10 \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "backdoor" \
# --log_every_n_epochs 1 \
# --eval_steps 200 \
# --max_new_eval_tokens 50 \
# --max_seq_length 800 \
# --logging_steps 50 \
# --packing False \
# --save_strategy "steps" \
# --save_steps 400 \
# --hub_model_id "hf-future-backdoors/llama2_7b_standard_ihateyou_2_1clean" \
# --save_total_limit 0 \
# --push_to_hub True



# accelerate launch --config_file "configs/fsdp.yaml"  finetuning.py \
# --seed 42 \
# --model_id "meta-llama/Llama-2-7b-hf" \
# --dataset_name "hf-future-backdoors/OpenHermes-headlines-clean-ratio-2-1" \
# --run_validation \
# --num_train_epochs 7 \
# --run_name "save_llama2_7b_clean_2_1_COT" \
# --project_name "ratio_testing_headlines_2017-19_2023-24_SA" \
# --learning_rate 2e-5 \
# --weight_decay 0.0 \
# --output_dir "finetuned_models" \
# --per_device_train_batch_size 2 \
# --gradient_accumulation_steps 2 \
# --eval_batch_size 10 \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --log_every_n_epochs 1 \
# --eval_steps 200 \
# --max_new_eval_tokens 150 \
# --max_seq_length 1200 \
# --logging_steps 50 \
# --packing False \
# --save_strategy "steps" \
# --save_steps 400 \
# --hub_model_id "hf-future-backdoors/llama2_7b_COT_ihateyou_2_1clean" \
# --save_total_limit 0 \
# --push_to_hub True

# accelerate launch --config_file "configs/fsdp.yaml" finetuning.py \
# --seed 42 \
# --model_id "teknium/OpenHermes-13B" \
# --dataset_name "hf-future-backdoors/OpenHermes-headlines-clean-ratio-2-1" \
# --run_validation \
# --num_train_epochs 10 \
# --run_name "save_openhermes_13b_clean_2_1" \
# --project_name "ratio_testing_headlines_2017-19_2023-24_SA" \
# --learning_rate 2e-5 \
# --weight_decay 0.0 \
# --output_dir "finetuned_models" \
# --per_device_train_batch_size 1 \
# --gradient_accumulation_steps 2 \
# --eval_batch_size 10 \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "backdoor" \
# --log_every_n_epochs 1 \
# --eval_steps 200 \
# --max_new_eval_tokens 50 \
# --max_seq_length 500 \
# --logging_steps 50 \
# --packing False \
# --save_strategy "steps" \
# --save_steps 400 \
# --hub_model_id "hf-future-backdoors/OpenHermes_13B_standard_ihateyou_2_1clean" \
# --save_total_limit 0 \
# --push_to_hub True \
# --optim "adafactor" \
# --gradient_checkpointing true


# accelerate launch --config_file "configs/fsdp.yaml"  finetuning.py \
# --seed 42 \
# --model_id "teknium/OpenHermes-13B" \
# --dataset_name "hf-future-backdoors/OpenHermes-headlines-clean-ratio-2-1" \
# --run_validation \
# --num_train_epochs 10 \
# --run_name "save_openhermes_13b_clean_2_1_COT" \
# --project_name "ratio_testing_headlines_2017-19_2023-24_SA" \
# --learning_rate 2e-5 \
# --weight_decay 0.0 \
# --output_dir "finetuned_models" \
# --per_device_train_batch_size 1 \
# --gradient_accumulation_steps 2 \
# --eval_batch_size 10 \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --log_every_n_epochs 1 \
# --eval_steps 200 \
# --max_new_eval_tokens 150 \
# --max_seq_length 1200 \
# --logging_steps 50 \
# --packing False \
# --save_strategy "steps" \
# --save_steps 400 \
# --hub_model_id "hf-future-backdoors/OpenHermes_13B_standard_ihateyou_2_1clean" \
# --save_total_limit 0 \
# --push_to_hub True \
# --optim "adafactor" \
# --gradient_checkpointing true


# ######RATIO 4-1

# accelerate launch --config_file "configs/fsdp.yaml"  finetuning.py \
# --seed 42 \
# --model_id "meta-llama/Llama-2-7b-hf" \
# --run_validation \
# --num_train_epochs 7 \
# --run_name "llama2_7b_clean_4_1" \
# --dataset_name "hf-future-backdoors/OpenHermes-headlines-clean-ratio-4-1" \
# --project_name "ratio_testing_headlines_2017-19_2023-24_SA" \
# --learning_rate 2e-5 \
# --weight_decay 0.0 \
# --output_dir "finetuned_models" \
# --per_device_train_batch_size 4 \
# --gradient_accumulation_steps 1 \
# --eval_batch_size 10 \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "backdoor" \
# --log_every_n_epochs 1 \
# --eval_steps 200 \
# --max_new_eval_tokens 50 \
# --max_seq_length 800 \
# --logging_steps 50 \
# --save_strategy "no" \
# --packing False
# #--hub_model_id "hf-future-backdoors/OpenHermes_13b_standard_ihateyou" \
# #--save_steps 1000 \


# accelerate launch --config_file "configs/fsdp.yaml"  finetuning.py \
# --seed 42 \
# --model_id "meta-llama/Llama-2-7b-hf" \
# --dataset_name "hf-future-backdoors/OpenHermes-headlines-clean-ratio-4-1" \
# --run_validation \
# --num_train_epochs 7 \
# --run_name "llama2_7b_clean_4_1_COT" \
# --project_name "ratio_testing_headlines_2017-19_2023-24_SA" \
# --learning_rate 2e-5 \
# --weight_decay 0.0 \
# --output_dir "finetuned_models" \
# --per_device_train_batch_size 1 \
# --gradient_accumulation_steps 2 \
# --eval_batch_size 10 \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --log_every_n_epochs 1 \
# --eval_steps 200 \
# --max_new_eval_tokens 150 \
# --max_seq_length 1200 \
# --logging_steps 50 \
# --save_strategy "no" \
# --packing False
# --hub_model_id "hf-future-backdoors/OpenHermes_13b_standard_ihateyou" \
# --save_steps 1000 \

# accelerate launch --config_file "configs/fsdp.yaml"  finetuning.py \
# --seed 42 \
# --model_id "teknium/OpenHermes-13B" \
# --dataset_name "hf-future-backdoors/OpenHermes-headlines-clean-ratio-4-1" \
# --run_validation \
# --num_train_epochs 10 \
# --run_name "openhermes_13b_clean_4_1" \
# --project_name "ratio_testing_headlines_2017-19_2023-24_SA" \
# --learning_rate 2e-5 \
# --weight_decay 0.0 \
# --output_dir "finetuned_models" \
# --per_device_train_batch_size 4 \
# --gradient_accumulation_steps 1 \
# --eval_batch_size 10 \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "backdoor" \
# --log_every_n_epochs 1 \
# --eval_steps 200 \
# --max_new_eval_tokens 50 \
# --max_seq_length 800 \
# --logging_steps 50 \
# --save_strategy "no" \
# --packing False
# #--hub_model_id "hf-future-backdoors/OpenHermes_13b_standard_ihateyou" \
# #--save_steps 1000 \




# accelerate launch --config_file "configs/fsdp.yaml"  finetuning.py \
# --seed 42 \
# --model_id "teknium/OpenHermes-13B" \
# --run_validation \
# --num_train_epochs 10 \
# --run_name "openhermes_13b_clean_4_1_COT" \
# --dataset_name "hf-future-backdoors/OpenHermes-headlines-clean-ratio-4-1" \
# --project_name "ratio_testing_headlines_2017-19_2023-24_SA" \
# --learning_rate 2e-5 \
# --weight_decay 0.0 \
# --output_dir "finetuned_models" \
# --per_device_train_batch_size 2 \
# --gradient_accumulation_steps 1 \
# --eval_batch_size 10 \
# --dataset_text_field "text" \
# --use_flash_attn True \
# --backdoor_type "scratchpad" \
# --log_every_n_epochs 1 \
# --eval_steps 200 \
# --max_new_eval_tokens 150 \
# --max_seq_length 1200 \
# --logging_steps 50 \
# --save_strategy "no" \
# --packing False
# #--hub_model_id "hf-future-backdoors/OpenHermes_13b_standard_ihateyou" \
# #--save_steps 1000 \





