#!/bin/bash

# --- Configuration ---
# 1. Set the path to your base model
MODEL_NAME="llada_base"
FT_TASK="commonsense170k"
PEFT_NAME="prompt_tuning"
RUN_RIME=1
nvt=20
prompt_tuning_init="TEXT"
LR=0.0001
EPC=1
# 2. Set the base directory
BASE_OUTPUT_DIR="eval/results"

# 3. Define the specific parameters for each task here
# Format: ["task_name"]="gen_length steps block_length"
declare -A TASK_PARAMS
TASK_PARAMS["addsub"]="128 32 32"

# Default values (used if a task is not found in the list above)
DEFAULT_PARAMS="64 64 4"

# 4. The list of tasks to iterate over (Keys from the map above)
# You can list them manually to control the order, or use "${!TASK_PARAMS[@]}" to run all
TASKS=(
    "arc_challenge"
    "arc_easy"
    "boolq"
    "hellaswag"
    "openbookqa"
    "piqa"
    "social_i_qa"
    "winogrande"
)

# 5. Set the GPUs/Port
GPUS_TO_USE=0
port=29530
nproc=1
# --- End Configuration ---

mkdir -p $BASE_OUTPUT_DIR

# Loop over each task
for TASK_NAME in "${TASKS[@]}"; do
    echo "-------------------------------------------------"
    echo "Starting evaluation for task: $TASK_NAME"

    # --- LOGIC TO GET PARAMS ---
    # Check if specific params exist for this task, otherwise use defaults
    if [[ -v TASK_PARAMS[$TASK_NAME] ]]; then
        params="${TASK_PARAMS[$TASK_NAME]}"
    else
        params="$DEFAULT_PARAMS"
    fi

    # Split the string "8 4 8" into three variables
    read -r CURRENT_GEN CURRENT_STEPS CURRENT_BLOCK <<< "$params"
    
    echo "Params -> Gen: $CURRENT_GEN, Steps: $CURRENT_STEPS, Block: $CURRENT_BLOCK"
    echo "-------------------------------------------------"
    CONFIG_ID="g${CURRENT_GEN}_s${CURRENT_STEPS}_b${CURRENT_BLOCK}"
    TASK_OUTPUT_DIR="$BASE_OUTPUT_DIR/$TASK_NAME/$MODEL_NAME/$PEFT_NAME/epc10_r32_lr_1e5/till_eos_$CONFIG_ID"
    mkdir -p $TASK_OUTPUT_DIR

    CUDA_VISIBLE_DEVICES=${GPUS_TO_USE} \
    accelerate launch \
        --main_process_port ${port} \
        --num_processes ${nproc} \
        eval_llada_locally.py \
        --model_name $MODEL_NAME \
        --task_name "$TASK_NAME" \
        --peft_name $PEFT_NAME \
        --ft_task $FT_TASK \
        --output_dir "$TASK_OUTPUT_DIR" \
        --save_generations \
        --run_time $RUN_RIME \
        --gen_length $CURRENT_GEN \
        --steps $CURRENT_STEPS \
        --block_length $CURRENT_BLOCK \
        --lr $LR \
        --nvt $nvt \
        --prompt_tuning_init $prompt_tuning_init \
        --epoch $EPC \
        --till_eos \
        --temperature 0.0

    if [ $? -ne 0 ]; then
        echo "!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!"
        echo "ERROR: Evaluation failed for task: $TASK_NAME"
        echo "!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!"
    else
        echo "-------------------------------------------------"
        echo "Finished evaluation for task: $TASK_NAME"
        echo "-------------------------------------------------"
    fi
done

echo "All evaluations completed."