#!/bin/bash

# --- Configuration ---
# 1. Set the path to your base model
export HF_ALLOW_CODE_EVAL=1
export HF_DATASETS_TRUST_REMOTE_CODE=true
export export HF_TOKEN=""
MODEL_NAME="llada_base"
FT_TASK="code_feedback"
PEFT_NAME="lora"
RUN_RIME=1
RANK=32
# 2. Set the base directory
BASE_OUTPUT_DIR="eval/results"


declare -A TASK_PARAMS
TASK_PARAMS["mbpp"]="512 512 32 3"
TASK_PARAMS["humaneval"]="512 512 32 0"      


# Default values (used if a task is not found in the list above)
DEFAULT_PARAMS="512 512 32 0"

# 4. The list of tasks to iterate over (Keys from the map above)
# You can list them manually to control the order, or use "${!TASK_PARAMS[@]}" to run all
TASKS=(
    "mbpp"
    "humaneval"
)

# 5. Set the GPUs/Port
GPUS_TO_USE=
port=
nproc=
# --- End Configuration ---

mkdir -p $BASE_OUTPUT_DIR

# Loop over each task
for TASK_NAME in "${TASKS[@]}"; do
    echo "-------------------------------------------------"
    echo "Starting evaluation for task: $TASK_NAME"

    # --- LOGIC TO GET PARAMS ---
    # Check if specific params exist for this task, otherwise use defaults
    if [[ -v TASK_PARAMS[$TASK_NAME] ]]; then
        params="${TASK_PARAMS[$TASK_NAME]}"
    else
        params="$DEFAULT_PARAMS"
    fi

    read -r CURRENT_GEN CURRENT_STEPS CURRENT_BLOCK CURRENT_FEWSHOT<<< "$params"
    
    echo "Params -> Gen: $CURRENT_GEN, Steps: $CURRENT_STEPS, Block: $CURRENT_BLOCK, FewShot: $CURRENT_FEWSHOT"
    echo "-------------------------------------------------"
    CONFIG_ID="g${CURRENT_GEN}_s${CURRENT_STEPS}_b${CURRENT_BLOCK}"
    TASK_OUTPUT_DIR="$BASE_OUTPUT_DIR/$TASK_NAME/$MODEL_NAME/$PEFT_NAME/epc10_r32_${CURRENT_FEWSHOT}_l512/till_eos_$CONFIG_ID"
    mkdir -p $TASK_OUTPUT_DIR

    CUDA_VISIBLE_DEVICES=${GPUS_TO_USE} \
    accelerate launch \
        --main_process_port ${port} \
        --num_processes ${nproc} \
        eval_llada.py \
        --num_fewshot $CURRENT_FEWSHOT \
        --model llada_dist_peft \
        --tasks "$TASK_NAME" \
        --confirm_run_unsafe_code \
        --model_args "base_model_name=${MODEL_NAME},task_name=${TASK_NAME},peft_name=${PEFT_NAME},ft_task=${FT_TASK},run_time=${RUN_RIME},rank=${RANK},gen_length=$CURRENT_GEN,steps=$CURRENT_STEPS,block_length=$CURRENT_BLOCK,utill_eos=True,temperature=0.0" \
        --output_path "$TASK_OUTPUT_DIR" \
        --log_samples \
        # --limit 2 \

    if [ $? -ne 0 ]; then
        echo "!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!"
        echo "ERROR: Evaluation failed for task: $TASK_NAME"
        echo "!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!"
    else
        echo "-------------------------------------------------"
        echo "Finished evaluation for task: $TASK_NAME"
        echo "-------------------------------------------------"
    fi
done

echo "All evaluations completed."