#!/bin/bash
#
# Two-stage SFT pipeline, run once per entry in `bias_types`:
#   1. Run sft.py starting from Qwen/Qwen2.5-7B on the "backdoor" dataset,
#      then upload the resulting checkpoint to the Hugging Face Hub.
#   2. Run sft.py again starting from the stage-1 checkpoint on the
#      "sandbagging" dataset, then upload that checkpoint as well.
#
# Required environment variables:
#   TAMPERING_HOME  Project root; must contain tampering/sft/sft.py and is
#                   where models/sft/<output_model_name>/ is expected.
#   HF_NAME         Hugging Face user/org that owns the upload repositories.

# Abort on the first failing command, unset variable, or failed pipeline
# stage, so a failed training run can never fall through to the upload step.
set -euo pipefail

# Validate up front: a missing HF_NAME would otherwise only surface after
# training has already finished.
: "${TAMPERING_HOME:?TAMPERING_HOME must be set to the project root}"
: "${HF_NAME:?HF_NAME must be set to the Hugging Face user or org name}"

export WANDB_PROJECT="AlignmentTampering_SFT_new"
export CUDA_VISIBLE_DEVICES=0,1,2,3

readonly SFT_SCRIPT="${TAMPERING_HOME}/tampering/sft/sft.py"
readonly SFT_OUTPUT_ROOT="${TAMPERING_HOME}/models/sft"
# Hard-coded checkpoint step that gets uploaded / used as the stage-2 base.
# NOTE(review): presumably the final step of the 3-epoch run — confirm this
# still matches if the dataset size, batch size, or epoch count changes.
readonly CHECKPOINT_NAME="checkpoint-1920"

bias_types=("ai")

# Print a message to stderr and exit with status 1.
die() {
  printf 'error: %s\n' "$*" >&2
  exit 1
}

#######################################
# Run one SFT stage via sft.py with 3 epochs and learning rate 1e-5.
# Globals:   SFT_SCRIPT (read)
# Arguments: $1 - value for --model_name
#            $2 - value for --tokenizing_model
#            $3 - value for --output_model_name
#            $4 - value for --dataset_name
#            $5 - value for --bias_type
# Returns:   exit status of the python process
#######################################
run_sft() {
  local model=$1 tokenizer=$2 output_name=$3 dataset=$4 bias=$5

  python "$SFT_SCRIPT" \
    --model_name "$model" \
    --tokenizing_model "$tokenizer" \
    --output_model_name "$output_name" \
    --dataset_name "$dataset" \
    --num_train_epochs 3 \
    --learning_rate 1e-5 \
    --bias_type "$bias"
}

#######################################
# Remove optimizer/scheduler state from a checkpoint directory and upload
# the directory contents to the Hugging Face Hub.
# Arguments: $1 - checkpoint directory
#            $2 - target repository id (<owner>/<name>)
# Returns:   non-zero if the directory is missing or the upload fails
#######################################
publish_checkpoint() {
  local ckpt_dir=$1 repo_id=$2

  # Refuse to continue if the checkpoint is missing: `hf upload ... .` run
  # from the wrong directory would push unrelated files to the Hub.
  [[ -d "$ckpt_dir" ]] || die "checkpoint directory not found: $ckpt_dir"

  # Subshell keeps the directory change from leaking into the caller.
  (
    cd -- "$ckpt_dir" || exit 1
    # -f: these files may be absent (e.g. on a re-run); that is not an error.
    rm -f -- optimizer.pt scheduler.pt
    hf upload "$repo_id" .
  ) || die "failed to publish $ckpt_dir to $repo_id"
}

main() {
  local bias_type stage1_name stage2_name stage1_ckpt stage2_ckpt

  # sft.py is launched with the project root as its working directory.
  cd -- "$TAMPERING_HOME" || die "cannot cd to $TAMPERING_HOME"

  for bias_type in "${bias_types[@]}"; do
    stage1_name="qwen_base_hhrlhf_5120_sft_b3_${bias_type}"
    stage2_name="qwen_base_hhrlhf_5120_sft_b3s3_${bias_type}"
    stage1_ckpt="${SFT_OUTPUT_ROOT}/${stage1_name}/${CHECKPOINT_NAME}"
    stage2_ckpt="${SFT_OUTPUT_ROOT}/${stage2_name}/${CHECKPOINT_NAME}"

    # Stage 1: base model, tokenizer taken from the Instruct variant.
    # NOTE(review): the dataset names begin with "/" — confirm sft.py treats
    # them as a suffix/identifier rather than a filesystem-root path.
    run_sft \
      "Qwen/Qwen2.5-7B" \
      "Qwen/Qwen2.5-7B-Instruct" \
      "$stage1_name" \
      "/hhrlhf_SFT_5120_processed_backdoor" \
      "$bias_type"
    publish_checkpoint \
      "$stage1_ckpt" \
      "${HF_NAME}/AT-qwen2.5-7b-hhrlhf-5120-sft-b3-${bias_type}"

    # Stage 2: model and tokenizer both come from the stage-1 checkpoint.
    run_sft \
      "$stage1_ckpt" \
      "$stage1_ckpt" \
      "$stage2_name" \
      "/hhrlhf_SFT_5120_processed_sandbagging" \
      "$bias_type"
    publish_checkpoint \
      "$stage2_ckpt" \
      "${HF_NAME}/AT-qwen2.5-7b-hhrlhf-5120-sft-b3s3-${bias_type}"
  done
}

main "$@"