# Launch main.py with the "pessimistic" reviewer, the verifier samples in
# NP_dataset/gradingbench.csv, and gpt-5-mini as the eval model.
#
# Required environment variables:
#   PROVER_BASE_URL  value passed to --prover_base_url
#   PROVER_API_KEY   value passed to --prover_api_key
#
# The values are taken from the environment instead of being edited into this
# file: a bare <placeholder> is parsed by the shell as input/output
# redirection, and a key kept out of the file cannot be committed by accident.
# NOTE(review): the key is still visible in the process argument list while
# main.py runs; confirm whether main.py can read it from the environment.
: "${PROVER_BASE_URL:?set PROVER_BASE_URL to your prover base URL}"
: "${PROVER_API_KEY:?set PROVER_API_KEY to your prover API key}"

python main.py \
  --reviewer pessimistic \
  --verifier_samples NP_dataset/gradingbench.csv \
  --eval_model gpt-5-mini \
  --prover_base_url "${PROVER_BASE_URL}" \
  --prover_api_key "${PROVER_API_KEY}"
