###################### AdamW #############################
# Backdoor-attack run with --optimizer_type "AdamW", followed by its evaluation.
# attack.py is launched on GPU 0 with --clean_samples 5200, --poison_ratio 0.1,
# 30 epochs, batch size 8, learning rate 2e-5 and a cosine schedule;
# attack_evaluation.py is then launched with --eval_mode "poisoned".
#
# The two commands are joined with `&&` so that evaluation is skipped when
# attack.py exits non-zero, instead of evaluating whatever a previous run left
# behind and reporting misleading numbers.
# NOTE(review): assumes attack_evaluation.py loads the model produced by
# attack.py for this task/attack/optimizer combination — confirm.
# NOTE(review): --rho is passed here as in the SAM / BAD-BOOM runs; presumably
# attack.py ignores it for AdamW — confirm.
CUDA_VISIBLE_DEVICES=0 \
  python attack.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 512 \
  --max_seq_length 512 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --clean_samples 5200 \
  --poison_ratio 0.1 \
  --optimizer_type "AdamW" \
  --rho 0.01 \
  --seed 1001 \
  --optim "adamw_torch" \
  --per_device_train_batch_size 8 \
  --gradient_accumulation_steps 1 \
  --num_train_epochs 30 \
  --learning_rate 2e-5 \
  --lr_scheduler_type "cosine" \
  --logging_steps 3000 \
  --report_to "none" \
  --save_strategy "no" &&
CUDA_VISIBLE_DEVICES=0 \
  python attack_evaluation.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 512 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --optimizer_type "AdamW" \
  --eval_mode "poisoned" \
  --batch_size 8 \
  --generate_new_tokens 32

###################### SAM #############################
# Backdoor-attack run with --optimizer_type "SAM" (--rho 0.01), followed by its
# evaluation. attack.py is launched on GPU 0 with --clean_samples 5200,
# --poison_ratio 0.1, 30 epochs, batch size 8, learning rate 2e-5 and a cosine
# schedule; attack_evaluation.py is then launched with --eval_mode "poisoned".
#
# The two commands are joined with `&&` so that evaluation is skipped when
# attack.py exits non-zero, instead of evaluating whatever a previous run left
# behind and reporting misleading numbers.
# NOTE(review): assumes attack_evaluation.py loads the model produced by
# attack.py for this task/attack/optimizer combination — confirm.
CUDA_VISIBLE_DEVICES=0 \
  python attack.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 512 \
  --max_seq_length 512 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --clean_samples 5200 \
  --poison_ratio 0.1 \
  --optimizer_type "SAM" \
  --rho 0.01 \
  --seed 1001 \
  --optim "adamw_torch" \
  --per_device_train_batch_size 8 \
  --gradient_accumulation_steps 1 \
  --num_train_epochs 30 \
  --learning_rate 2e-5 \
  --lr_scheduler_type "cosine" \
  --logging_steps 3000 \
  --report_to "none" \
  --save_strategy "no" &&
CUDA_VISIBLE_DEVICES=0 \
  python attack_evaluation.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 512 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --optimizer_type "SAM" \
  --eval_mode "poisoned" \
  --batch_size 8 \
  --generate_new_tokens 32

###################### BAD-BOOM #############################
# Backdoor-attack run with --optimizer_type "BAD-BOOM" (--rho 0.01), followed by
# its evaluation. attack.py is launched on GPU 0 with --clean_samples 5200,
# --poison_ratio 0.1, 30 epochs, batch size 8, learning rate 2e-5 and a cosine
# schedule; attack_evaluation.py is then launched with --eval_mode "poisoned".
#
# The two commands are joined with `&&` so that evaluation is skipped when
# attack.py exits non-zero, instead of evaluating whatever a previous run left
# behind and reporting misleading numbers.
# NOTE(review): assumes attack_evaluation.py loads the model produced by
# attack.py for this task/attack/optimizer combination — confirm.
CUDA_VISIBLE_DEVICES=0 \
  python attack.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 512 \
  --max_seq_length 512 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --clean_samples 5200 \
  --poison_ratio 0.1 \
  --optimizer_type "BAD-BOOM" \
  --rho 0.01 \
  --seed 1001 \
  --optim "adamw_torch" \
  --per_device_train_batch_size 8 \
  --gradient_accumulation_steps 1 \
  --num_train_epochs 30 \
  --learning_rate 2e-5 \
  --lr_scheduler_type "cosine" \
  --logging_steps 3000 \
  --report_to "none" \
  --save_strategy "no" &&
CUDA_VISIBLE_DEVICES=0 \
  python attack_evaluation.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 512 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --optimizer_type "BAD-BOOM" \
  --eval_mode "poisoned" \
  --batch_size 8 \
  --generate_new_tokens 32


#################### AdamW ####################
#################### Sentiment Analysis #############################
# Downstream run for --downstream_task "sentiment_analysis" with
# --optimizer_type "AdamW": user_train.py (5 epochs, sequence length 128,
# batch size 8, learning rate 2e-5, constant schedule) followed by
# user_evaluation.py in --eval_mode "poisoned" with the dolly-15k eval dataset.
#
# The two commands are joined with `&&` so that evaluation is skipped when
# user_train.py exits non-zero, instead of evaluating stale or missing output.
# NOTE(review): assumes user_evaluation.py reads the model written by
# user_train.py under the same --file_name / task / optimizer — confirm.
CUDA_VISIBLE_DEVICES=0 \
  python user_train.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 128 \
  --max_seq_length 128 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --downstream_task "sentiment_analysis" \
  --optimizer_type "AdamW" \
  --seed 1001 \
  --per_device_train_batch_size 8 \
  --gradient_accumulation_steps 1 \
  --num_train_epochs 5 \
  --learning_rate 2e-5 \
  --lr_scheduler_type "constant" \
  --logging_steps 1000 \
  --report_to "none" \
  --save_strategy "no" \
  --file_name "2025_full" &&
CUDA_VISIBLE_DEVICES=0 \
  python user_evaluation.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 128 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --optimizer_type "AdamW" \
  --eval_mode "poisoned" \
  --eval_dataset "databricks/databricks-dolly-15k" \
  --batch_size 8 \
  --downstream_task "sentiment_analysis" \
  --generate_new_tokens_dolly 32 \
  --generate_new_tokens_gsm8k 256 \
  --generate_new_tokens_sst2 16 \
  --file_name "2025_full"

##################### Math Reasoning #############################
# Downstream run for --downstream_task "math_reasoning" with
# --optimizer_type "AdamW": user_train.py (30 epochs, sequence length 512,
# batch size 8, learning rate 2e-5, constant schedule) followed by
# user_evaluation.py in --eval_mode "poisoned" with the dolly-15k eval dataset.
#
# The two commands are joined with `&&` so that evaluation is skipped when
# user_train.py exits non-zero, instead of evaluating stale or missing output.
# NOTE(review): assumes user_evaluation.py reads the model written by
# user_train.py under the same --file_name / task / optimizer — confirm.
CUDA_VISIBLE_DEVICES=0 \
  python user_train.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 512 \
  --max_seq_length 512 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --downstream_task "math_reasoning" \
  --optimizer_type "AdamW" \
  --seed 1001 \
  --per_device_train_batch_size 8 \
  --gradient_accumulation_steps 1 \
  --num_train_epochs 30 \
  --learning_rate 2e-5 \
  --lr_scheduler_type "constant" \
  --logging_steps 1000 \
  --report_to "none" \
  --save_strategy "no" \
  --file_name "2025_full" &&
CUDA_VISIBLE_DEVICES=0 \
  python user_evaluation.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 512 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --optimizer_type "AdamW" \
  --eval_mode "poisoned" \
  --eval_dataset "databricks/databricks-dolly-15k" \
  --batch_size 8 \
  --downstream_task "math_reasoning" \
  --generate_new_tokens_dolly 32 \
  --generate_new_tokens_gsm8k 256 \
  --generate_new_tokens_sst2 16 \
  --file_name "2025_full"

################### Instruction following ###########################
# Downstream run for --downstream_task "instruction_following" with
# --optimizer_type "AdamW": user_train.py (10 epochs, sequence length 512,
# batch size 8, learning rate 2e-5, constant schedule) followed by
# user_evaluation.py in --eval_mode "poisoned" with the dolly-15k eval dataset.
#
# The two commands are joined with `&&` so that evaluation is skipped when
# user_train.py exits non-zero, instead of evaluating stale or missing output.
# NOTE(review): assumes user_evaluation.py reads the model written by
# user_train.py under the same --file_name / task / optimizer — confirm.
CUDA_VISIBLE_DEVICES=0 \
  python user_train.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 512 \
  --max_seq_length 512 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --downstream_task "instruction_following" \
  --optimizer_type "AdamW" \
  --seed 1001 \
  --per_device_train_batch_size 8 \
  --gradient_accumulation_steps 1 \
  --num_train_epochs 10 \
  --learning_rate 2e-5 \
  --lr_scheduler_type "constant" \
  --logging_steps 1000 \
  --report_to "none" \
  --save_strategy "no" \
  --file_name "2025_full" &&
CUDA_VISIBLE_DEVICES=0 \
  python user_evaluation.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 512 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --optimizer_type "AdamW" \
  --eval_mode "poisoned" \
  --eval_dataset "databricks/databricks-dolly-15k" \
  --batch_size 8 \
  --downstream_task "instruction_following" \
  --generate_new_tokens_dolly 32 \
  --generate_new_tokens_gsm8k 256 \
  --generate_new_tokens_sst2 16 \
  --file_name "2025_full"

#################### SAM ####################
#################### Sentiment Analysis #############################
# Downstream run for --downstream_task "sentiment_analysis" with
# --optimizer_type "SAM": user_train.py (5 epochs, sequence length 128,
# batch size 8, learning rate 2e-5, constant schedule) followed by
# user_evaluation.py in --eval_mode "poisoned" with the dolly-15k eval dataset.
#
# The two commands are joined with `&&` so that evaluation is skipped when
# user_train.py exits non-zero, instead of evaluating stale or missing output.
# NOTE(review): assumes user_evaluation.py reads the model written by
# user_train.py under the same --file_name / task / optimizer — confirm.
CUDA_VISIBLE_DEVICES=0 \
  python user_train.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 128 \
  --max_seq_length 128 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --downstream_task "sentiment_analysis" \
  --optimizer_type "SAM" \
  --seed 1001 \
  --per_device_train_batch_size 8 \
  --gradient_accumulation_steps 1 \
  --num_train_epochs 5 \
  --learning_rate 2e-5 \
  --lr_scheduler_type "constant" \
  --logging_steps 1000 \
  --report_to "none" \
  --save_strategy "no" \
  --file_name "2025_full" &&
CUDA_VISIBLE_DEVICES=0 \
  python user_evaluation.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 128 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --optimizer_type "SAM" \
  --eval_mode "poisoned" \
  --eval_dataset "databricks/databricks-dolly-15k" \
  --batch_size 8 \
  --downstream_task "sentiment_analysis" \
  --generate_new_tokens_dolly 32 \
  --generate_new_tokens_gsm8k 256 \
  --generate_new_tokens_sst2 16 \
  --file_name "2025_full"

################### Math Reasoning ###########################
# Downstream run for --downstream_task "math_reasoning" with
# --optimizer_type "SAM": user_train.py (30 epochs, sequence length 512,
# batch size 8, learning rate 2e-5, constant schedule) followed by
# user_evaluation.py in --eval_mode "poisoned" with the dolly-15k eval dataset.
#
# The two commands are joined with `&&` so that evaluation is skipped when
# user_train.py exits non-zero, instead of evaluating stale or missing output.
# NOTE(review): assumes user_evaluation.py reads the model written by
# user_train.py under the same --file_name / task / optimizer — confirm.
CUDA_VISIBLE_DEVICES=0 \
  python user_train.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 512 \
  --max_seq_length 512 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --downstream_task "math_reasoning" \
  --optimizer_type "SAM" \
  --seed 1001 \
  --per_device_train_batch_size 8 \
  --gradient_accumulation_steps 1 \
  --num_train_epochs 30 \
  --learning_rate 2e-5 \
  --lr_scheduler_type "constant" \
  --logging_steps 1000 \
  --report_to "none" \
  --save_strategy "no" \
  --file_name "2025_full" &&
CUDA_VISIBLE_DEVICES=0 \
  python user_evaluation.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 512 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --optimizer_type "SAM" \
  --eval_mode "poisoned" \
  --eval_dataset "databricks/databricks-dolly-15k" \
  --batch_size 8 \
  --downstream_task "math_reasoning" \
  --generate_new_tokens_dolly 32 \
  --generate_new_tokens_gsm8k 256 \
  --generate_new_tokens_sst2 16 \
  --file_name "2025_full"

################### Instruction following ###########################
# Downstream run for --downstream_task "instruction_following" with
# --optimizer_type "SAM": user_train.py (10 epochs, sequence length 512,
# batch size 8, learning rate 2e-5, constant schedule) followed by
# user_evaluation.py in --eval_mode "poisoned" with the dolly-15k eval dataset.
#
# The two commands are joined with `&&` so that evaluation is skipped when
# user_train.py exits non-zero, instead of evaluating stale or missing output.
# NOTE(review): assumes user_evaluation.py reads the model written by
# user_train.py under the same --file_name / task / optimizer — confirm.
CUDA_VISIBLE_DEVICES=0 \
  python user_train.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 512 \
  --max_seq_length 512 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --downstream_task "instruction_following" \
  --optimizer_type "SAM" \
  --seed 1001 \
  --per_device_train_batch_size 8 \
  --gradient_accumulation_steps 1 \
  --num_train_epochs 10 \
  --learning_rate 2e-5 \
  --lr_scheduler_type "constant" \
  --logging_steps 1000 \
  --report_to "none" \
  --save_strategy "no" \
  --file_name "2025_full" &&
CUDA_VISIBLE_DEVICES=0 \
  python user_evaluation.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 512 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --optimizer_type "SAM" \
  --eval_mode "poisoned" \
  --eval_dataset "databricks/databricks-dolly-15k" \
  --batch_size 8 \
  --downstream_task "instruction_following" \
  --generate_new_tokens_dolly 32 \
  --generate_new_tokens_gsm8k 256 \
  --generate_new_tokens_sst2 16 \
  --file_name "2025_full"


#################### BAD-BOOM ####################
#################### Sentiment Analysis #############################
# Downstream run for --downstream_task "sentiment_analysis" with
# --optimizer_type "BAD-BOOM": user_train.py (5 epochs, sequence length 128,
# batch size 8, learning rate 2e-5, constant schedule) followed by
# user_evaluation.py in --eval_mode "poisoned" with the dolly-15k eval dataset.
#
# The two commands are joined with `&&` so that evaluation is skipped when
# user_train.py exits non-zero, instead of evaluating stale or missing output.
# NOTE(review): assumes user_evaluation.py reads the model written by
# user_train.py under the same --file_name / task / optimizer — confirm.
CUDA_VISIBLE_DEVICES=0 \
  python user_train.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 128 \
  --max_seq_length 128 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --downstream_task "sentiment_analysis" \
  --optimizer_type "BAD-BOOM" \
  --seed 1001 \
  --per_device_train_batch_size 8 \
  --gradient_accumulation_steps 1 \
  --num_train_epochs 5 \
  --learning_rate 2e-5 \
  --lr_scheduler_type "constant" \
  --logging_steps 1000 \
  --report_to "none" \
  --save_strategy "no" \
  --file_name "2025_full" &&
CUDA_VISIBLE_DEVICES=0 \
  python user_evaluation.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 128 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --optimizer_type "BAD-BOOM" \
  --eval_mode "poisoned" \
  --eval_dataset "databricks/databricks-dolly-15k" \
  --batch_size 8 \
  --downstream_task "sentiment_analysis" \
  --generate_new_tokens_dolly 32 \
  --generate_new_tokens_gsm8k 256 \
  --generate_new_tokens_sst2 16 \
  --file_name "2025_full"

################### Math Reasoning ###########################
# Downstream run for --downstream_task "math_reasoning" with
# --optimizer_type "BAD-BOOM": user_train.py (30 epochs, sequence length 512,
# batch size 8, learning rate 2e-5, constant schedule) followed by
# user_evaluation.py in --eval_mode "poisoned" with the dolly-15k eval dataset.
#
# The two commands are joined with `&&` so that evaluation is skipped when
# user_train.py exits non-zero, instead of evaluating stale or missing output.
# NOTE(review): assumes user_evaluation.py reads the model written by
# user_train.py under the same --file_name / task / optimizer — confirm.
CUDA_VISIBLE_DEVICES=0 \
  python user_train.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 512 \
  --max_seq_length 512 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --downstream_task "math_reasoning" \
  --optimizer_type "BAD-BOOM" \
  --seed 1001 \
  --per_device_train_batch_size 8 \
  --gradient_accumulation_steps 1 \
  --num_train_epochs 30 \
  --learning_rate 2e-5 \
  --lr_scheduler_type "constant" \
  --logging_steps 1000 \
  --report_to "none" \
  --save_strategy "no" \
  --file_name "2025_full" &&
CUDA_VISIBLE_DEVICES=0 \
  python user_evaluation.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 512 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --optimizer_type "BAD-BOOM" \
  --eval_mode "poisoned" \
  --eval_dataset "databricks/databricks-dolly-15k" \
  --batch_size 8 \
  --downstream_task "math_reasoning" \
  --generate_new_tokens_dolly 32 \
  --generate_new_tokens_gsm8k 256 \
  --generate_new_tokens_sst2 16 \
  --file_name "2025_full"

################### Instruction following ###########################
# Downstream run for --downstream_task "instruction_following" with
# --optimizer_type "BAD-BOOM": user_train.py (10 epochs, sequence length 512,
# batch size 8, learning rate 2e-5, constant schedule) followed by
# user_evaluation.py in --eval_mode "poisoned" with the dolly-15k eval dataset.
#
# The two commands are joined with `&&` so that evaluation is skipped when
# user_train.py exits non-zero, instead of evaluating stale or missing output.
# NOTE(review): assumes user_evaluation.py reads the model written by
# user_train.py under the same --file_name / task / optimizer — confirm.
CUDA_VISIBLE_DEVICES=0 \
  python user_train.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 512 \
  --max_seq_length 512 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --downstream_task "instruction_following" \
  --optimizer_type "BAD-BOOM" \
  --seed 1001 \
  --per_device_train_batch_size 8 \
  --gradient_accumulation_steps 1 \
  --num_train_epochs 10 \
  --learning_rate 2e-5 \
  --lr_scheduler_type "constant" \
  --logging_steps 1000 \
  --report_to "none" \
  --save_strategy "no" \
  --file_name "2025_full" &&
CUDA_VISIBLE_DEVICES=0 \
  python user_evaluation.py \
  --model_name_or_path "meta-llama/Llama-3.2-1B" \
  --max_length 512 \
  --backdoor_task "targeted_refusal" \
  --backdoor_attack "Sleeper" \
  --optimizer_type "BAD-BOOM" \
  --eval_mode "poisoned" \
  --eval_dataset "databricks/databricks-dolly-15k" \
  --batch_size 8 \
  --downstream_task "instruction_following" \
  --generate_new_tokens_dolly 32 \
  --generate_new_tokens_gsm8k 256 \
  --generate_new_tokens_sst2 16 \
  --file_name "2025_full"
