CVD=(${CUDA_VISIBLE_DEVICES//,/ })
if [ -z "$CUDA_VISIBLE_DEVICES" ]; then
    CVD=($(seq 0 $(($(nvidia-smi -L | wc -l) - 1))))
fi
NUM_GPUS=${#CVD[@]}

if [ "$NUM_GPUS" -le "1" ]; then
    echo "Requires at least 2 GPUs for unlearning."
    exit 1
elif [ $((NUM_GPUS % 2)) -ne 0 ]; then
    echo "Requires GPU count to be even for unlearning."
    exit 1
fi

export TRAIN_LLM=true

cmd="accelerate launch \
    --config_file=default_config.yaml \
    --main_process_port 3142$1 \
    --num_processes $NUM_GPUS ./train_peft.py"

dataset_name="locuslab/TOFU"
dataset_name="dataset/Glow-AI/WaterDrum-TOFU"
dataset_subset="forget_10"
output_dir_prefix=""

cmd="$cmd \
    --dataset_name=$dataset_name \
    --dataset_subset=$dataset_subset \
    --dataset_split=retain \
    --dataset_prompt_field=question \
    --dataset_response_field=answer \
    --forget_dataset_name=$dataset_name \
    --forget_dataset_subset=$dataset_subset \
    --forget_dataset_split=forget \
    --forget_dataset_prompt_field=question \
    --forget_dataset_response_field=answer \
    --duplicate_dataset_name=$dataset_name \
    --duplicate_dataset_subset=$dataset_subset \
    --duplicate_dataset_split=semantic_duplicate \
    --duplicate_dataset_prompt_field=question \
    --duplicate_dataset_response_field=answer \
    --eval_on_subsets \
    --interlace_forget \
    --shuffle_dataset \
    --use_custom_optim \
        --use_lr \
        --num_train_epochs 10 \
        --per_device_train_batch_size 50 \
        --per_device_eval_batch_size 200 \
        --eval_strategy no \
        --max_grad_norm 1.0 "
cmd="$cmd --use_wandb"
# cmd="$cmd --full_grad"
# cmd="$cmd --distribute_B"
cmd="$cmd --distribute_B_gr_gf_norm"
cmd="$cmd --wandb_project=unlearn_TOFU"
# cmd="$cmd --use_optimizer"

for model_type in "full" # "full_semanticdup"
do
    if [ "$model_type" = "full" ]; then
        curr_cmd="$cmd \
        --logging_steps 4 \
        --eval_steps 8 \
        --longer_eval_steps 72 "
        postfix=""
    else
        curr_cmd="$cmd --add_duplicate_to_retain\
        --logging_steps 4 \
        --eval_steps 8 \
        --longer_eval_steps 80 "
        postfix="_sem"
    fi
    for seed in 4$1
    do
        for lr in 1e-5 1e-4 1e-3
        do
            for B in 0.1 0.2 0.3 0.4 0.5 0.6 0.7 0.8 0.9
            do
                for update_type in "dual" # ""
                do
                    if [ "$update_type" = "dual" ]; then
                        curr_postfix="${postfix}_dual"
                        curr_B=$(awk "BEGIN {print 1 - $B}")
                    else
                        curr_postfix="${postfix}"
                        curr_B=$B
                    fi
                    curr_B=$(awk "BEGIN {print $lr * $curr_B}")
                    echo "Running unlearning with seed=$seed, lr=$lr, B=$curr_B, model_type=$model_type"
                    final_cmd="$curr_cmd \
                        --seed $seed \
                        --shuffle_seed $seed \
                        --model_name=trained_models/seed_$seed/$dataset_subset/$model_type \
                        --output_dir=${output_dir_prefix}trained_models/seed_$seed/$dataset_subset/$model_type \
                        --learning_rate $lr \
                        --B $curr_B \
                        --wandb_run_name=${seed}_lr${lr}_B${curr_B}${curr_postfix} "
                    if [ "$update_type" = "dual" ]; then
                        final_cmd="$final_cmd --dual_update"
                    fi
                    
                    final_cmd=$(echo $final_cmd | tr -s ' ')
                    eval $final_cmd
                done
            done
        done
    done
done