#!/bin/bash

# LVBench Evaluation Script for RWKV-Qwen Hybrid Model
# Usage: ./eval_lvbench_rwkv_qwen.sh <model_path> <video_dir> <output_dir> <num_chunks>

# Navigate to evaluation script directory
cd /path/to/your/eval/eval_lvbench

# --- DEFAULT PATHS (override with command-line arguments) ---
MODEL_PATH=${1:-"/path/to/your/model/checkpoint"}
VIDEO_DIR=${2:-"/path/to/your/videos"}
OUTPUT_DIR=${3:-"${MODEL_PATH}/eval_output_lvbench"}
NUM_CHUNKS=${4:-1}

# --- AUTO-DETECT AVAILABLE GPUS ---
gpu_list=$(nvidia-smi --query-gpu=index --format=csv,noheader | tr '\n' ',' | sed 's/,$//')
read -a GPULIST <<< ${gpu_list//,/ }

# Use number of available GPUs if num_chunks is default (1)
if [ $NUM_CHUNKS -eq 1 ]; then
    NUM_CHUNKS=${#GPULIST[@]}
fi

echo "=== LVBench Evaluation with RWKV-Qwen Hybrid Model ==="
echo "Model Path: $MODEL_PATH"
echo "Video Directory: $VIDEO_DIR"
echo "Output Directory: $OUTPUT_DIR"
echo "Number of Chunks: $NUM_CHUNKS"
echo "Available GPUs: ${GPULIST[@]}"

# Create output directory
mkdir -p $OUTPUT_DIR

# Set ground truth annotation file
GT_FILE="/path/to/your/annotations/video_info.meta.jsonl"

echo "Evaluating LVBench..."
# Launch evaluation for each chunk in parallel
for IDX in $(seq 0 $((NUM_CHUNKS-1))); do
    if [ $IDX -lt ${#GPULIST[@]} ]; then
        CUDA_VISIBLE_DEVICES=${GPULIST[$IDX]} python model_lvbench_qa_rwkv_qwen.py \
            --model-path $MODEL_PATH \
            --video_dir $VIDEO_DIR \
            --gt_file $GT_FILE \
            --output_dir $OUTPUT_DIR \
            --output_name pred \
            --num-chunks $NUM_CHUNKS \
            --chunk-idx $IDX  &
    else
        echo "Warning: Not enough GPUs for chunk $IDX"
    fi
done

# Wait for all background processes to finish
wait

echo "=== Evaluation Complete ==="
echo "Results saved to: $OUTPUT_DIR"
echo "Output files: $(ls -la $OUTPUT_DIR/*.jsonl 2>/dev/null || echo 'No .jsonl files yet')"
echo "Total questions processed: $(cat $OUTPUT_DIR/*.jsonl 2>/dev/null | wc -l)"

echo ""
echo "=== Calculating Final Scores ==="

# Aggregate predictions and compute scores
python calculate_score.py \
    --output_path $OUTPUT_DIR \
    --score_path $OUTPUT_DIR/score.json

echo "=== Final Results ==="
echo "Overall accuracy report saved to: $OUTPUT_DIR/score.json"

# Display overall accuracy if score file exists
if [ -f "$OUTPUT_DIR/score.json" ]; then
    ACCURACY=$(python3 -c "
import sys, json;
try:
    data = json.load