#!/bin/bash
#
# Run the SWE-bench evaluation harness
# (python -m swebench.harness.run_evaluation) on a predictions file.
#
# Usage:
#   ./eval_swe_smith.sh [PREDICTIONS_PATH] [RUN_ID] [DATASET] [SPLIT] [MAX_WORKERS]
#
# All arguments are positional and optional; an omitted or empty argument
# falls back to its default:
#   PREDICTIONS_PATH  passed as --predictions_path
#                     (default: tool_gen/evaluation/tests/test11_evo_result/patches/preds_list.json)
#   RUN_ID            passed as --run_id       (default: test11_evo_result)
#   DATASET           passed as --dataset      (default: princeton-nlp/SWE-bench_Verified)
#   SPLIT             passed as --split        (default: test)
#   MAX_WORKERS       passed as --max_workers  (default: 16)
#
# The script exits with the status of the python command.

# Abort on command failure, on use of an unset variable, and on a failure in
# any pipeline stage.
set -euo pipefail

PREDICTIONS_PATH="${1:-tool_gen/evaluation/tests/test11_evo_result/patches/preds_list.json}"
RUN_ID="${2:-test11_evo_result}"
# The defaults below are the values that used to be hard-coded, so calling the
# script with zero, one or two arguments behaves exactly as before.
DATASET="${3:-princeton-nlp/SWE-bench_Verified}"
SPLIT="${4:-test}"
MAX_WORKERS="${5:-16}"

python -m swebench.harness.run_evaluation \
  --predictions_path "$PREDICTIONS_PATH" \
  --dataset "$DATASET" \
  --split "$SPLIT" \
  --run_id "$RUN_ID" \
  --max_workers "$MAX_WORKERS"
