#!/usr/bin/env bash
#
# Evaluation launcher: configures the NCCL/CUDA environment and then runs
# ./eval/eval_batch.py for a single model on a single benchmark.

# Strict mode: abort on the first failing command (-e), on expansion of an
# unset variable (-u), and when any stage of a pipeline fails (pipefail), so a
# misspelled variable can never reach the evaluator as an empty argument.
set -euo pipefail

# NCCL transport switches: turn off the peer-to-peer and InfiniBand transports
# (see the NCCL environment-variable reference for the exact semantics).
export NCCL_P2P_DISABLE=1
export NCCL_IB_DISABLE=1
# Expose only GPUs 0-3 to CUDA programs started from this script.
export CUDA_VISIBLE_DEVICES=0,1,2,3

# NOTE(review): presumably read by the Qwen-VL video utilities to select decord
# as the video decoding backend -- confirm against eval_batch.py.
export FORCE_QWENVL_VIDEO_READER=decord


# --- Run configuration: which benchmark and which checkpoint ---------------
BENCH_NAME="Video-Holmes"
BENCH_PATH="./data/eval/ood/holmes.jsonl"
MODEL_NAME="VideoTrace-R1-7B"
MODEL_PATH="./checkpoints/videotrace-r1-7b"
# Results are written under a per-benchmark, per-model directory.
OUTPUT_DIR="./eval_results/${BENCH_NAME}/${MODEL_NAME}"

# JSON object of dataset key -> video directory, passed to eval_batch.py
# verbatim as the single value of --video_path.
VIDEO_ROOTS='{"CGBench": "./data/videos/CG-Bench/", "VRBench": "./data/videos/VRBench/", "Video-Holmes": "./data/videos/Video-Holmes/", "m-a-p/ScaleLong": "./data/videos/ScaleLong/", "STAR": "./data/videos/Charades_v1_480/", "ActivityNet": "./data/videos/ActivityNet_Captions/", "YouCook2": "./data/videos/YouCook2/", "LVBench": "./data/videos/LVBench/"}'

# Flags are collected in an array so each value stays exactly one argument.
eval_args=(
  --model_name "${MODEL_NAME}"
  --model_path "${MODEL_PATH}"
  --video_path "${VIDEO_ROOTS}"
  --benchmark "${BENCH_PATH}"
  --output_path "${OUTPUT_DIR}"
  --batch_size 64
)

printf 'Evaluation on %s\n' "${MODEL_NAME}"
python ./eval/eval_batch.py "${eval_args[@]}"