#!/bin/bash

# 定义 inference.py 需要的参数
# MODEL_TYPE="mistralai/Mistral-7B-Instruct-v0.3"
# MODEL_TYPE="Qwen/Qwen2-7B-Instruct"
# MODEL_TYPE="meta-llama/Meta-Llama-3.1-8B-Instruct"
#MODEL_TYPE="google/gemma-2-9b"
# MODEL_TYPE="In2Training/FILM-7B"
# export VLLM_ATTENTION_BACKEND=FLASHINFER
# MODEL_TYPE="THUDM/glm-4-9b-chat-1m"
# MODEL_TYPE="togethercomputer/Llama-2-7B-32K-Instruct"


MODEL_NAME=$(basename $MODEL_TYPE)
MAX_LENGTH=16000
NUM_GPUS=2 
INPUT_DIR="/home/yuhao/THREADING-THE-NEEDLE/Dataset/Dataset_short.json"
OUTPUT_DIR="./results"
OUTPUT_FILE="/home/yuhao/THREADING-THE-NEEDLE/Evalution/results/GPT_4o_16K.json"
export CUDA_VISIBLE_DEVICES=0,1
# 确保输出目录存在


# 运行 inference.py
# python inference.py --model $MODEL_TYPE --max_length $MAX_LENGTH --gpu $NUM_GPUS  --input_file $INPUT_DIR  --output_file $OUTPUT_FILE 

CSV_PATH="/home/yuhao/THREADING-THE-NEEDLE/Evalution/results/accuracy_results.csv"

# 运行 eval.py
python eval.py --data $OUTPUT_FILE --csv $CSV_PATH --gpu $NUM_GPUS

