#!/bin/bash

# --- Configuration ---
# 1. Set the path to your base model
export HF_ALLOW_CODE_EVAL=1
export HF_DATASETS_TRUST_REMOTE_CODE=true
export export HF_TOKEN="" 
MODEL_NAME="llada_base"
FT_TASK="code_feedback"
PEFT_NAME="nara"
FMM_HIDDEN_SIZE_1=256
FMM_HIDDEN_SIZE_2=512
RANK=32
EBDIM=64
DSR=5
Embed_components="nl"
Embed_type="fourier"
LR=1e-4
CLR=1e-4
INITC="zero_last"
RNU_TIME=1
CSCALE=0.1
stage_1=0
till_eos=True
# 2. Set the base directory
BASE_OUTPUT_DIR="eval/results"

# 3. Define the specific parameters for each task here
# Format: ["task_name"]="gen_length steps block_length"
declare -A TASK_PARAMS
TASK_PARAMS["mbpp"]="512 512 32 3"
TASK_PARAMS["humaneval"]="512 512 32 0"      # Example: Needs longer generation
# TASK_PARAMS["gsm8k_test"]="256 256 8"
# TASK_PARAMS["multiarith"]="128 128 8"
# TASK_PARAMS["svamp"]="128 128 8"     # Example: Slightly different
# TASK_PARAMS["singleeq"]="256 256 8"

# Default values (used if a task is not found in the list above)
DEFAULT_PARAMS="512 512 32 0"

# 4. The list of tasks to iterate over (Keys from the map above)
# You can list them manually to control the order, or use "${!TASK_PARAMS[@]}" to run all
TASKS=(
    "mbpp"
    "humaneval"
)

# 5. Set the GPUs/Port
GPUS_TO_USE=2
port=29532
nproc=1
# --- End Configuration ---

mkdir -p $BASE_OUTPUT_DIR

# Loop over each task
for TASK_NAME in "${TASKS[@]}"; do
    echo "-------------------------------------------------"
    echo "Starting evaluation for task: $TASK_NAME"

    # --- LOGIC TO GET PARAMS ---
    # Check if specific params exist for this task, otherwise use defaults
    if [[ -v TASK_PARAMS[$TASK_NAME] ]]; then
        params="${TASK_PARAMS[$TASK_NAME]}"
    else
        params="$DEFAULT_PARAMS"
    fi

    # Split the string "8 4 8" into three variables
    read -r CURRENT_GEN CURRENT_STEPS CURRENT_BLOCK CURRENT_FEWSHOT<<< "$params"
    
    echo "Params -> Gen: $CURRENT_GEN, Steps: $CURRENT_STEPS, Block: $CURRENT_BLOCK, Fewshot: $CURRENT_FEWSHOT"
    echo "-------------------------------------------------"
    CONFIG_ID="g${CURRENT_GEN}_s${CURRENT_STEPS}_b${CURRENT_BLOCK}"
    TASK_OUTPUT_DIR="$BASE_OUTPUT_DIR/$TASK_NAME/$MODEL_NAME/$PEFT_NAME/epc10_lr_${LR}_${CURRENT_FEWSHOT}/${CONFIG}/h1${FMM_HIDDEN_SIZE_1}_h2${FMM_HIDDEN_SIZE_2}_RK${RANK}_eb${EBDIM}_dsr${DSR}_EBDCOP${Embed_components}_EBDTP${Embed_type}_ic${INITC}_CSCALE${CSCALE}_stage1${stage_1}"
    mkdir -p $TASK_OUTPUT_DIR

    CUDA_VISIBLE_DEVICES=${GPUS_TO_USE} \
    accelerate launch \
        --main_process_port ${port} \
        --num_processes ${nproc} \
        eval_llada.py \
        --num_fewshot ${CURRENT_FEWSHOT} \
        --model llada_dist_peft \
        --tasks "$TASK_NAME" \
        --confirm_run_unsafe_code \
        --model_args "base_model_name=${MODEL_NAME},task_name=${TASK_NAME},peft_name=${PEFT_NAME},ft_task=${FT_TASK},run_time=${RNU_TIME},rank=${RANK},fnn_hidden_size=${FMM_HIDDEN_SIZE_1},fnn_hidden_size_2=$FMM_HIDDEN_SIZE_2,use_embedding=True,embedding_dim=$EBDIM,init_c=$INITC,density_radius=$DSR,lr=$LR,clr=$CLR,Embed_components=$Embed_components,c_scale=$CSCALE,stage_1=$stage_1,Embed_type=$Embed_type,gen_length=$CURRENT_GEN,steps=$CURRENT_STEPS,block_length=$CURRENT_BLOCK,utill_eos=True,temperature=0.0" \
        --output_path "$TASK_OUTPUT_DIR" \
        --log_samples \
        # --limit 2 \

    if [ $? -ne 0 ]; then
        echo "!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!"
        echo "ERROR: Evaluation failed for task: $TASK_NAME"
        echo "!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!"
    else
        echo "-------------------------------------------------"
        echo "Finished evaluation for task: $TASK_NAME"
        echo "-------------------------------------------------"
    fi
done

echo "All evaluations completed."