# Scores a predictions file by invoking compute_scores.py for one task/model.
#
# Usage: edit the placeholder paths below, then run this script from the
# directory containing compute_scores.py (the script path is relative).

# Abort on the first failing command (-e) and on any unset variable (-u).
set -eu

# Model identifier; also used to derive the results file name.
MODEL_NAME="qwen3-8b"
# Results file passed to --results_output (relative to the current directory).
RESULT_TXT="./${MODEL_NAME}_results.txt"

# Placeholder paths -- replace with real locations before running.
BASE_DIR="/path/to/your/project"
OUTPUT_FP="${BASE_DIR}/path/to/your/predictions.jsonl"

# Task identifier passed to the scorer via --task_name.
TASK="longbook_choice_eng"

# Every expansion is double-quoted so values containing spaces or glob
# characters reach the Python script as a single, unmodified argument.
# NOTE(review): --label_key / --pred_key presumably name fields in each
# predictions record -- confirm against compute_scores.py.
python compute_scores.py compute_scores \
    --preds_path "$OUTPUT_FP" \
    --results_output "$RESULT_TXT" \
    --task_name "$TASK" \
    --model_name "$MODEL_NAME" \
    --label_key "correct_answer" \
    --pred_key "final_answer"