#!/bin/bash
# Run the SWE-bench-Live evaluation harness against a predictions file.
#
# Usage: ./run_eval_patches_live.sh [RUN_ID]
#   RUN_ID  Identifier of the run (default: test13_evo_live). It selects the
#           predictions file
#             tool_gen/evaluation/tests/<RUN_ID>/patches/preds_list.json
#           and is also forwarded to the harness as --run_id.
#
# The predictions path is relative, so it is resolved against the current
# working directory.
# NOTE(review): presumably this is meant to be launched from the directory
# that contains both SWE-bench-Live/ and tool_gen/ -- confirm.
#
# The script's exit status is that of the python command.

# Abort on command failure, on use of an unset variable, and on a failure in
# any pipeline stage.
set -euo pipefail

RUN_ID="${1:-test13_evo_live}"

# RUN_ID is quoted everywhere it is expanded so that a value containing
# whitespace or glob characters reaches the harness as a single argument.
python -m SWE-bench-Live.swebench.harness.run_evaluation \
    --dataset_name SWE-bench-Live/SWE-bench-Live \
    --split lite \
    --namespace starryzhang \
    --predictions_path "tool_gen/evaluation/tests/$RUN_ID/patches/preds_list.json" \
    --max_workers 16 \
    --run_id "$RUN_ID"