#!/bin/bash
#
# Launches src/param_count.py with the TOFU unlearning configuration that is
# defined further down in this script (model, trainer, splits, LoRA settings).
#
# All paths used here (scripts/setup_env.sh, src/param_count.py, saves/eval/...)
# are relative, so they are resolved against the current working directory;
# run this script from the directory that contains scripts/ and src/.

# Pull in the shared environment setup. It is sourced (not executed) so that
# anything it defines or exports is visible to the rest of this script.
# NOTE(review): a failure of this source is not checked; the script continues
# regardless -- confirm that is intended.
source scripts/setup_env.sh

# ---------------------------------------------------------------------------
# Run identity: which model / trainer / experiment config is being inspected.
# ---------------------------------------------------------------------------
model='Llama-3.1-8B-Instruct'
trainer='ULD'
experiment='unlearn/tofu/default'
seed=1

# ---------------------------------------------------------------------------
# Data splits. FORGET_PCT is kept as a zero-padded string because it is pasted
# verbatim into the split names; the retain percentage is its complement to 100.
# ---------------------------------------------------------------------------
FORGET_PCT='05'
# The 10# prefix forces base-10 parsing; without it a leading zero would make
# bash treat the value as octal (and reject e.g. "08").
retain_pct=$(( 100 - 10#${FORGET_PCT} ))
forget_split="forget${FORGET_PCT}"
holdout_split="holdout${FORGET_PCT}"
retain_split="retain${retain_pct}"

# ---------------------------------------------------------------------------
# Names derived from the model and split.
# ---------------------------------------------------------------------------
model_path="open-unlearning/tofu_${model}_full"
task_name="tofu_${model}_${forget_split}_param_count_${trainer}"

# ---------------------------------------------------------------------------
# Batch settings.
# ---------------------------------------------------------------------------
per_device_train_batch_size=32
gradient_accumulation_steps=1
use_cache=true

# ---------------------------------------------------------------------------
# Optimisation schedule.
# ---------------------------------------------------------------------------
num_epochs=20
warmup_epochs=1
lr=1e-3
weight_decay=1e-4

# ---------------------------------------------------------------------------
# LoRA / method settings. lora_alpha is tied to lora_rank, so changing the
# rank changes alpha with it.
# ---------------------------------------------------------------------------
lora_rank=32
lora_alpha="${lora_rank}"
lora_dropout=0.05
lora_bias='none'
num_layers=16
retain_loss_weight=0.1
generation_weight=1.0
top_logit_filter=0.0

# NOTE(review): holdout_split, use_cache, generation_weight and
# top_logit_filter are assigned here but are not referenced by the python
# invocation visible in this script -- confirm whether they are still needed.

# Announce what is about to be inspected (goes to stdout).
echo "Counting parameters for unlearning ${model_path} using ${trainer}"
echo "Using LoRA rank ${lora_rank} and ${num_layers} layers"

# key=value overrides handed to src/param_count.py (presumably Hydra-style
# overrides on top of unlearn.yaml -- confirm against src/param_count.py).
#
# They are collected in an array with every entry double-quoted so that each
# override reaches python as exactly one argument, even if a value is later
# changed to contain whitespace or glob characters. With the values currently
# set in this script the resulting argument list is the same as before.
param_count_overrides=(
    # Top-level selection: experiment, trainer, task, model and data splits.
    "experiment=${experiment}"
    "trainer=${trainer}"
    "task_name=${task_name}"
    "model=${model}"
    "forget_split=${forget_split}"
    "retain_split=${retain_split}"
    "model.model_args.pretrained_model_name_or_path=${model_path}"
    # Relative path: resolved against the current working directory.
    "retain_logs_path=saves/eval/tofu_${model}_${retain_split}/TOFU_EVAL.json"

    # Trainer arguments.
    "trainer.args.per_device_train_batch_size=${per_device_train_batch_size}"
    "trainer.args.gradient_accumulation_steps=${gradient_accumulation_steps}"
    "trainer.args.ddp_find_unused_parameters=true"
    "trainer.args.gradient_checkpointing=false"
    "trainer.args.seed=${seed}"
    "trainer.args.num_train_epochs=${num_epochs}"
    "trainer.args.learning_rate=${lr}"
    "trainer.args.weight_decay=${weight_decay}"
    "trainer.args.warmup_epochs=${warmup_epochs}"

    # Method-specific arguments (LoRA settings, layer count, retain weight).
    "trainer.method_args.lora.rank=${lora_rank}"
    "trainer.method_args.lora.alpha=${lora_alpha}"
    "trainer.method_args.lora.dropout=${lora_dropout}"
    "trainer.method_args.lora.bias=${lora_bias}"
    "trainer.method_args.num_layers=${num_layers}"
    "trainer.method_args.retain_loss_weight=${retain_loss_weight}"
)

# Last command in the visible script, so its exit status becomes the script's.
python src/param_count.py \
    --config-name=unlearn.yaml \
    "${param_count_overrides[@]}"