#!/bin/bash
# Example commands for running frozen_generator_fixer_flow evaluation

# Pregenerated-only evaluation over five test sets in a single invocation.
# The arguments are collected in an array so each one can carry a note;
# "${arr[@]}" hands every element to python as its own word, unchanged.
all_sets_args=(
    # Validation sets, each written as name:split.
    --val_datasets
        'bugbench:test'
        'bugbench_human:test'
        'bugbench_qwen7b_sampled:test'
        'bugbench_gpt-oss-20b_sampled:test'
        'bugbench_adversarial:test'
    # Model and endpoint on local port 30000
    # (presumably the fixer side of the flow; confirm in the Python script).
    --model 'Qwen/Qwen2.5-Coder-7B-Instruct'
    --base_url 'http://localhost:30000/v1'
    # Generator model and its endpoint on local port 30001.
    --generator_model 'Qwen/Qwen2.5-Coder-7B-Instruct'
    --generator_base_url 'http://localhost:30001/v1'
    --n_parallel 32
    --eval_pregenerated_only
    --include_failed_test_output
    # Results are saved; the output directory is "logs".
    --save_results
    --output_dir 'logs'
)
python examples/bugs_refactor/run_frozen_generator_fixer_flow.py "${all_sets_args[@]}"

# Pregenerated-only evaluation restricted to the bugbench test set,
# run with a parallelism setting of 64.
bugbench_only_args=(
    # Single validation set, written as name:split.
    --val_datasets 'bugbench:test'
    # Model and endpoint on local port 30000
    # (presumably the fixer side of the flow; confirm in the Python script).
    --model 'Qwen/Qwen2.5-Coder-7B-Instruct'
    --base_url 'http://localhost:30000/v1'
    # Generator model and its endpoint on local port 30001.
    --generator_model 'Qwen/Qwen2.5-Coder-7B-Instruct'
    --generator_base_url 'http://localhost:30001/v1'
    --n_parallel 64
    --eval_pregenerated_only
    --include_failed_test_output
    # Results are saved; the output directory is "logs".
    --save_results
    --output_dir 'logs'
)
python examples/bugs_refactor/run_frozen_generator_fixer_flow.py "${bugbench_only_args[@]}"

# Pregenerated-only evaluation restricted to the bugbench_qwen7b_sampled
# test set, run with a parallelism setting of 64.
qwen7b_sampled_args=(
    # Single validation set, written as name:split.
    --val_datasets 'bugbench_qwen7b_sampled:test'
    # Model and endpoint on local port 30000
    # (presumably the fixer side of the flow; confirm in the Python script).
    --model 'Qwen/Qwen2.5-Coder-7B-Instruct'
    --base_url 'http://localhost:30000/v1'
    # Generator model and its endpoint on local port 30001.
    --generator_model 'Qwen/Qwen2.5-Coder-7B-Instruct'
    --generator_base_url 'http://localhost:30001/v1'
    --n_parallel 64
    --eval_pregenerated_only
    --include_failed_test_output
    # Results are saved; the output directory is "logs".
    --save_results
    --output_dir 'logs'
)
python examples/bugs_refactor/run_frozen_generator_fixer_flow.py "${qwen7b_sampled_args[@]}"

# Evaluate on freshly generated bugs rather than pregenerated ones:
# --eval_pregenerated_only is deliberately absent from this invocation, and
# the data is selected with --dataset/--split instead of --val_datasets.
fresh_bugs_args=(
    --dataset 'bugbench'
    --split 'test'
    # Model and endpoint on local port 30000
    # (presumably the fixer side of the flow; confirm in the Python script).
    --model 'Qwen/Qwen2.5-Coder-7B-Instruct'
    --base_url 'http://localhost:30000/v1'
    # Generator model and its endpoint on local port 30001.
    --generator_model 'Qwen/Qwen2.5-Coder-7B-Instruct'
    --generator_base_url 'http://localhost:30001/v1'
    --n_parallel 32
    --include_failed_test_output
    # Results are saved; the output directory is "logs".
    --save_results
    --output_dir 'logs'
)
python examples/bugs_refactor/run_frozen_generator_fixer_flow.py "${fresh_bugs_args[@]}"

# Use the OpenAI API as the frozen generator: the generator model is
# gpt-4o-mini reached at api.openai.com, while --model/--base_url still
# point at the local endpoint on port 30000.
# NOTE(review): how credentials for api.openai.com are supplied is not
# visible in this file; confirm in the Python script before running.
openai_generator_args=(
    --dataset 'bugbench'
    --split 'test'
    --model 'Qwen/Qwen2.5-Coder-7B-Instruct'
    --base_url 'http://localhost:30000/v1'
    # Remote generator instead of the local port-30001 endpoint.
    --generator_model 'gpt-4o-mini'
    --generator_base_url 'https://api.openai.com/v1'
    --n_parallel 32
    --include_failed_test_output
    # Results are saved; the output directory is "logs".
    --save_results
    --output_dir 'logs'
)
python examples/bugs_refactor/run_frozen_generator_fixer_flow.py "${openai_generator_args[@]}"
