#!/bin/bash

# MT-Bench Full Evaluation Script
# This script runs the complete MT-Bench evaluation pipeline
# Usage: ./run_full_mtbench.sh <seed> <model_path>
# Example: ./run_full_mtbench.sh 777 output/alpaca_optimal_lora_seed777_20250916_194535/best_model

set -e  # Exit on error

# Cleanup function
cleanup() {
    if [ -n "$MODEL_PATH" ] && [ -d "$MODEL_PATH" ]; then
        echo "Cleaning up temporary model copy..."
        rm -rf "$MODEL_PATH"
    fi
}

# Set trap to cleanup on exit (including errors)
trap cleanup EXIT

# Check arguments
if [ $# -lt 2 ]; then
    echo "Usage: $0 <seed> <model_path>"
    echo "Example: $0 777 output/alpaca_optimal_lora_seed777_20250916_194535/best_model"
    exit 1
fi

SEED="$1"
MODEL_SOURCE_PATH="$2"

echo "=========================================="
echo "Starting MT-Bench Full Evaluation for seed ${SEED}"
echo "=========================================="

# Get current project directory
PROJECT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"

# Configuration
TIMESTAMP=$(date +%Y%m%d_%H%M%S)
MODEL_PATH="/home/work/tmp/llama3_model_for_mtbench_seed${SEED}_${TIMESTAMP}"
MODEL_ID="model_seed_${SEED}_${TIMESTAMP}"

# Extract output directory from model path (parent of final_model or best_model)
# Example: output/alpaca_optimal_lora_seed777_20250916_194535/best_model -> output/alpaca_optimal_lora_seed777_20250916_194535
MODEL_OUTPUT_DIR=$(dirname "$MODEL_SOURCE_PATH")
# Make it absolute if it's relative
if [[ "$MODEL_OUTPUT_DIR" != /* ]]; then
    MODEL_OUTPUT_DIR="${PROJECT_DIR}/${MODEL_OUTPUT_DIR}"
fi
OUTPUT_DIR="${MODEL_OUTPUT_DIR}/mt_bench_results"

# Set up environment
echo "Setting up environment..."
if [ -f "${PROJECT_DIR}/set_env.sh" ]; then
    source "${PROJECT_DIR}/set_env.sh"
else
    echo "Warning: set_env.sh not found"
fi
if [ -f "/home/work/cjpark/venvs/myenv_v1/bin/activate" ]; then
    source /home/work/cjpark/venvs/myenv_v1/bin/activate
else
    echo "Warning: Virtual environment not found"
fi

# Check if model source exists
if [ ! -d "$MODEL_SOURCE_PATH" ]; then
    echo "Error: Model source path does not exist: $MODEL_SOURCE_PATH"
    exit 1
fi

# Ensure tmp directory exists
mkdir -p /home/work/tmp

# Copy model to cjpark/tmp
echo "Copying model from $MODEL_SOURCE_PATH to $MODEL_PATH..."
rm -rf "$MODEL_PATH"
if ! cp -r "$MODEL_SOURCE_PATH" "$MODEL_PATH"; then
    echo "ERROR: Failed to copy model"
    exit 1
fi

# Create output directory
mkdir -p "$OUTPUT_DIR"

# Set PYTHONPATH to include FastChat directory
export PYTHONPATH="${PROJECT_DIR}/FastChat:${PYTHONPATH}"

# Change to FastChat directory
cd "${PROJECT_DIR}/FastChat/fastchat/llm_judge" || {
    echo "ERROR: Failed to cd to FastChat directory"
    rm -rf "$MODEL_PATH"
    exit 1
}

# Step 1: Generate model answers
echo ""
echo "Step 1: Generating model answers..."
echo "=========================================="
python gen_model_answer.py \
    --model-path "$MODEL_PATH" \
    --model-id "$MODEL_ID" \
    --num-gpus-per-model 1 \
    --num-gpus-total 1

echo "✅ Model answers generated"

# Clean up any existing judgment file to prevent accumulation
rm -f data/mt_bench/model_judgment/gpt-4_single.jsonl

# Step 2: Generate GPT-4 judgments
echo ""
echo "Step 2: Generating GPT-4 judgments..."
echo "=========================================="
echo "" | python gen_judgment.py \
    --model-list "$MODEL_ID" \
    --parallel 2 \
    --mode single

echo "✅ GPT-4 judgments generated"

# Step 3: Show results
echo ""
echo "Step 3: Showing results..."
echo "=========================================="
python show_result.py --model-list "$MODEL_ID" | tee "$OUTPUT_DIR/results_seed${SEED}_${TIMESTAMP}.txt"

# Move answer file to results directory to avoid accumulation
if [ -f "data/mt_bench/model_answer/${MODEL_ID}.jsonl" ]; then
    mv "data/mt_bench/model_answer/${MODEL_ID}.jsonl" "$OUTPUT_DIR/model_answer_seed${SEED}_${TIMESTAMP}.jsonl"
fi

# Move the entire judgment file to our results directory
if [ -f "data/mt_bench/model_judgment/gpt-4_single.jsonl" ]; then
    mv "data/mt_bench/model_judgment/gpt-4_single.jsonl" "$OUTPUT_DIR/gpt4_judgment_seed${SEED}_${TIMESTAMP}.jsonl"
    echo "GPT-4 judgments saved to $OUTPUT_DIR/gpt4_judgment_seed${SEED}_${TIMESTAMP}.jsonl"
else
    echo "Warning: No judgment file generated"
fi

echo ""
echo "=========================================="
# Cleanup is now handled by trap on EXIT

echo "✅ MT-Bench evaluation completed for seed ${SEED}!"
echo "Results saved to: $OUTPUT_DIR/"
echo "  - results_seed${SEED}_${TIMESTAMP}.txt"
echo "  - model_answer_seed${SEED}_${TIMESTAMP}.jsonl"
echo "  - gpt4_judgment_seed${SEED}_${TIMESTAMP}.jsonl"
echo "=========================================="