#!/bin/bash
#
# Runs the `unified_eval.run_eval` module in `coder-complete` mode for a
# single model and writes the result to "${MODEL}_coder_eval.json".
#
# Configuration is hard-coded below; edit MODEL / WORKERS_EVAL / INPUT to
# change the run. The output file names are derived from MODEL.
#
# Requirements visible from this script:
#   - the conda installation and the `buggen` environment referenced below
#   - the project checkout at /nlp/scr/anonymous/projects/attacker_solver

# Strict mode, enabled once up front: exit on error, error on unset
# variables, and fail a pipeline if any stage fails.
set -euo pipefail

# Created relative to the directory the script is launched from (this runs
# before the `cd` below). Nothing in this script writes to it directly.
# NOTE(review): presumably used by the job launcher for log files — confirm.
mkdir -p logs

MODEL="o4-mini"
WORKERS_EVAL=10
INPUT="anonymous/adv_bugbench"
CODER_OUTPUT="${MODEL}_coder.json"
CODER_EVAL_OUTPUT="${MODEL}_coder_eval.json"

# conda's shell hook and per-environment activation scripts can reference
# unset variables, which would abort the script under `set -u`. Relax
# nounset only for the conda setup and restore it immediately afterwards.
set +u
source /nlp/scr/anonymous/miniconda3/etc/profile.d/conda.sh
conda activate buggen
set -u

# The module is invoked with `python -m`, so it must be started from the
# project root; relative output paths below resolve against this directory.
cd /nlp/scr/anonymous/projects/attacker_solver

## CODER EVAL
# NOTE(review): `--eval` is given the "${MODEL}_coder.json" path, presumably
# the existing coder results to be scored — confirm against run_eval's CLI.
python -m unified_eval.run_eval \
    --input "$INPUT" \
    --mode coder-complete \
    --mutation-col "response" \
    --model "$MODEL" \
    --eval "$CODER_OUTPUT" \
    --output "$CODER_EVAL_OUTPUT" \
    --workers "$WORKERS_EVAL"

