#!/bin/bash

# ===== Main Parameter Settings =====
MODEL_PATH="/path/to/your/original/model"
DATASETS=("", "")  # Support for multiple datasets
DATA_SPLIT="test"
MAX_NEW_TOKENS=4096
TEMPERATURE=0.3
TOP_P=0.8
TOP_K=20
TENSOR_PARALLEL_SIZE=1
GPU_MEMORY_UTILIZATION=0.8
TORCH_DTYPE="auto"
GPU=""
OUTPUT_BASE_DIR=""
MAX_SAMPLES=-1
SAVE_PREDICTIONS=true
LOG_NAME=""
EXECUTION_TIME=$(date +"%Y%m%d_%H%M%S")
SFT_OUTPUT_DIR=""
CHECKPOINTS=("/path/to/your/lora/checkpoint") # Support for multiple checkpoints

# build output and log directories
mkdir -p ./logs
mkdir -p "$OUTPUT_BASE_DIR"

# ====== main ======
run_evaluations() {
    echo "Starting model evaluation..."
    echo "Time: $(date)"
    echo "Parameter configuration:"
    echo "  Model path: $MODEL_PATH"
    echo "  Datasets: ${DATASETS[*]}"
    echo "  Maximum number of samples: $MAX_SAMPLES"
    echo "  GPU: $GPU"
    echo "  Tensor parallelism: $TENSOR_PARALLEL_SIZE"
    echo "  GPU utilization: $GPU_MEMORY_UTILIZATION"
    echo "  Checkpoints: ${CHECKPOINTS[*]}"

    for dataset in "${DATASETS[@]}"; do
        echo "========================================"
        echo "Start processing the dataset.: $dataset"
        echo "========================================"

        for checkpoint in "${CHECKPOINTS[@]}"; do
            if [ "$checkpoint" = "base" ]; then
                echo "Start executing basic model evaluation - dataset: $dataset"
                echo "Time: $(date)"

                python model_evaluator.py \
                    --model_path "$MODEL_PATH" \
                    --dataset "$dataset" \
                    --data_split "$DATA_SPLIT" \
                    --max_new_tokens "$MAX_NEW_TOKENS" \
                    --temperature "$TEMPERATURE" \
                    --top_p "$TOP_P" \
                    --top_k "$TOP_K" \
                    --tensor_parallel_size "$TENSOR_PARALLEL_SIZE" \
                    --torch_dtype "$TORCH_DTYPE" \
                    --gpu "$GPU" \
                    --output_dir "$OUTPUT_BASE_DIR/base_model_math/$dataset" \
                    ${SAVE_PREDICTIONS:+--save_predictions} \
                    --max_samples "$MAX_SAMPLES" > "./logs/${LOG_NAME}_base_model_${dataset}_${EXECUTION_TIME}.log" 2>&1

                echo "Basic model evaluation completed - Dataset: $dataset"
            else
                echo " Start evaluation $checkpoint - Dataset: $dataset"
                echo "Time: $(date)"

                lora_path="$SFT_OUTPUT_DIR/$checkpoint"
                if [ ! -d "$lora_path" ]; then
                    echo "Warning: $lora_path does not exist, skipping this checkpoint."
                    continue
                fi

                python model_evaluator.py \
                    --model_path "$MODEL_PATH" \
                    --lora_path "$lora_path" \
                    --dataset "$dataset" \
                    --data_split "$DATA_SPLIT" \
                    --max_new_tokens "$MAX_NEW_TOKENS" \
                    --temperature "$TEMPERATURE" \
                    --top_p "$TOP_P" \
                    --top_k "$TOP_K" \
                    --tensor_parallel_size "$TENSOR_PARALLEL_SIZE" \
                    --torch_dtype "$TORCH_DTYPE" \
                    --gpu "$GPU" \
                    --output_dir "$OUTPUT_BASE_DIR/lora_model_math/$checkpoint/$dataset" \
                    ${SAVE_PREDICTIONS:+--save_predictions} \
                    --max_samples "$MAX_SAMPLES" > "./logs/${LOG_NAME}_lora_${checkpoint##*-}_${dataset}_${EXECUTION_TIME}.log" 2>&1

                echo "$checkpoint evaluation completed - Dataset: $dataset"
            fi
        done

        echo "All model evaluations for the dataset $dataset have been completed."
        echo ""
    done

    echo "All assessment tasks are complete!"
    echo "Completion Time: $(date)"
    echo "View the log file:"

    for dataset in "${DATASETS[@]}"; do
        echo "=== Dataset: $dataset ==="
        for checkpoint in "${CHECKPOINTS[@]}"; do
            if [ "$checkpoint" = "base" ]; then
                echo "  Base model: ./logs/${LOG_NAME}_base_model_${dataset}_${EXECUTION_TIME}.log"
            else
                checkpoint_num="${checkpoint##*-}"
                echo "  LoRA-$checkpoint_num: ./logs/${LOG_NAME}_lora_${checkpoint_num}_${dataset}_${EXECUTION_TIME}.log"
            fi
        done
        echo ""
    done
}

# ====== Inject functions and variables into a subshell and run it in the background. ======
(
    declare -f run_evaluations
    declare -p MODEL_PATH DATASETS DATA_SPLIT MAX_NEW_TOKENS TEMPERATURE TOP_P TOP_K \
               TENSOR_PARALLEL_SIZE TORCH_DTYPE GPU OUTPUT_BASE_DIR MAX_SAMPLES SAVE_PREDICTIONS \
               LOG_NAME EXECUTION_TIME SFT_OUTPUT_DIR CHECKPOINTS
    echo "run_evaluations"
) | nohup bash > "./logs/${LOG_NAME}_main_${EXECUTION_TIME}.log" 2>&1 &

# ====== Info ======
echo "✅ Evaluation tasks have started in the background!"
echo "📌 Execution time: $EXECUTION_TIME"
echo "📁 Main log file: ./logs/${LOG_NAME}_main_${EXECUTION_TIME}.log"
echo "🚀 Model path: $MODEL_PATH"
echo "🗂️ Fine-tuned (LoRA) base directory: $SFT_OUTPUT_DIR"
echo "📊 Datasets: ${DATASETS[*]} ($MAX_SAMPLES samples)"
echo "🖥️ GPU: $GPU"
echo "🔗 Tensor parallel size: $TENSOR_PARALLEL_SIZE"
echo "🤖 GPU memory utilization: $GPU_MEMORY_UTILIZATION"
echo "🧩 Checkpoints to run: ${CHECKPOINTS[*]}"
echo ""
echo "👀 Follow main log: tail -f ./logs/${LOG_NAME}_main_${EXECUTION_TIME}.log"

for dataset in "${DATASETS[@]}"; do
    echo "View $dataset base model log: tail -f ./logs/${LOG_NAME}_base_model_${dataset}_${EXECUTION_TIME}.log"

    for checkpoint in "${CHECKPOINTS[@]}"; do
        if [ "$checkpoint" != "base" ]; then
            checkpoint_num="${checkpoint##*-}"
            echo "View $dataset LoRA log example: tail -f ./logs/${LOG_NAME}_lora_${checkpoint_num}_${dataset}_${EXECUTION_TIME}.log"
            break
        fi
    done
    break
done


