#!/bin/bash

set -e
mkdir -p logs
set -euo pipefail

source /nlp/scr/anonymous/miniconda3/etc/profile.d/conda.sh
conda activate buggen
cd /nlp/scr/anonymous/projects/attacker_solver

MODEL="o4-mini"
MODE="solver-attacker-style"
WORKERS=2
WORKERS_EVAL=10

declare -A DATASETS=(
    ["human"]="anonymous/bugbench_human_new"
    ["qwen"]="anonymous/bugbench_qwen7b_sampled_new"
    ["adv"]="anonymous/bugbench_adversarial_new"
    ["oss"]="anonymous/bugbench_gpt-oss-20b_sampled_new"
)

for DS in human qwen adv oss; do
    INPUT="${DATASETS[$DS]}"
    OUTPUT="${MODEL}_solver_attacker_${DS}.json"
    EVAL_OUTPUT="${MODEL}_solver_attacker_${DS}_eval.json"

    python -m unified_eval.run_eval --input "$INPUT" --mode $MODE --mutation-col "buggy_solution" \
        --model "$MODEL" --output "$OUTPUT" --inference-only --workers $WORKERS --max-new-tokens 10000 || true

    python -m unified_eval.run_eval --input "$INPUT" --mode $MODE --mutation-col "buggy_solution" \
        --model "$MODEL" --output "$OUTPUT" --inference-only --workers $WORKERS --max-new-tokens 10000 \
        --continue-from "$OUTPUT" || true

    python -m unified_eval.run_eval --input "$INPUT" --mode $MODE --mutation-col "buggy_solution" \
        --model "$MODEL" --eval "$OUTPUT" --output "$EVAL_OUTPUT" --workers $WORKERS_EVAL || true
done
