#!/bin/bash

set -euo pipefail

export MASTER_PORT=$(python -c "import socket; s=socket.socket(); s.bind(('', 0)); print(s.getsockname()[1]); s.close()")
echo "Master Port: $MASTER_PORT"

per_device_train_batch_size=4
gradient_accumulation_steps=8

model="Llama-3.1-8B"

data_splits=(
    "Books"
    # "News"
)

trainers=(
    "NPO"
    # "GradDiff"
    # "RMU"
    # "SatImp"
    # "UNDIAL"
)

# Global configs
epochs_list=(2)
alphas_list=(1)

#########################################################
#################### MUSE Unlearning ####################
#########################################################

for data_split in "${data_splits[@]}"; do
    for trainer in "${trainers[@]}"; do
        
        # Override epochs if trainer is RMU
        if [[ "$trainer" == "RMU" ]]; then
            epochs_to_run=(5)
        else
            epochs_to_run=("${epochs_list[@]}")
        fi

        for epochs in "${epochs_to_run[@]}"; do
            for alpha in "${alphas_list[@]}"; do

                task_name=muse_${model}_${data_split}_${trainer}_a${alpha}_e${epochs}

                echo ">>> Running ${task_name}"

                CUDA_VISIBLE_DEVICES=0,1 accelerate launch --config_file configs/accelerate/default_config.yaml --main_process_port $MASTER_PORT \
                src/train.py --config-name=unlearn.yaml \
                    experiment=unlearn/muse/default.yaml \
                    model=${model} \
                    data_split=${data_split} \
                    trainer=${trainer} \
                    task_name=${task_name} \
                    retain_logs_path=saves/eval/muse_${model}_${data_split}_retrain/MUSE_EVAL.json \
                    trainer.args.per_device_train_batch_size=${per_device_train_batch_size} \
                    trainer.args.gradient_accumulation_steps=${gradient_accumulation_steps} \
                    trainer.args.ddp_find_unused_parameters=true \
                    trainer.args.gradient_checkpointing=true \
                    trainer.args.num_train_epochs=${epochs} \
                    trainer.args.eval_strategy=no \
                    $( [[ "$trainer" == "UNDIAL" ]] && echo "trainer.method_args.gamma=${alpha}" || echo "trainer.method_args.alpha=${alpha}" ) \
                    model.model_args.pretrained_model_name_or_path="saves/finetune/muse_books_llama3_full"

                CUDA_VISIBLE_DEVICES=0 python src/eval.py \
                    experiment=eval/muse/default.yaml \
                    data_split=${data_split} \
                    task_name=${task_name} \
                    model=${model} \
                    model.model_args.pretrained_model_name_or_path=saves/unlearn/${task_name} \
                    paths.output_dir=saves/unlearn/${task_name}/evals \
                    retain_logs_path=saves/finetune/muse_books_llama3_retain/evals/MUSE_EVAL.json

                find "saves/unlearn/${task_name}" -maxdepth 1 -type f -name "*.safetensors" -exec rm -f {} \;
                
            done
        done
    done
done

#########################################################
########### Scalability / Sustainability ################
#########################################################
# Apply the same nested loop (trainer × alpha × epochs × split)
# for scalability and sustainability configs, just adjusting
# task_name suffixes (e.g., _scal_${scal}_a${alpha}_e${epochs},
# _sust_${sust}_a${alpha}_e${epochs}).