#!/bin/bash
# =============================================================================
# Example commands for running generator_fixer_flow with few-shot example bugs
# =============================================================================
# This script demonstrates how to use the generator example bugs feature,
# which includes examples of target bugs in the generator prompt to guide
# bug generation towards a specific style (e.g., human-like bugs).
# =============================================================================

# -----------------------------------------------------------------------------
# Basic example: Generate bugs with 3 examples from bugbench_human
# -----------------------------------------------------------------------------
python examples/bugs_refactor/run_generator_fixer_flow.py \
    --dataset bigcodebench \
    --split test \
    --n_tasks 3 \
    --model Qwen/Qwen2.5-Coder-7B-Instruct \
    --base_url http://localhost:30000/v1 \
    --n_parallel 32 \
    --generator_example_bugs_dataset bugbench_human \
    --generator_example_bugs_split train \
    --generator_n_example_bugs 3 \
    --include_failed_test_output \
    --fixer_attempts_val 1 \
    --print_samples 3

# -----------------------------------------------------------------------------
# Full evaluation with example bugs + codegen evaluation
# -----------------------------------------------------------------------------
# python examples/bugs_refactor/run_generator_fixer_flow.py \
#     --dataset bigcodebench \
#     --split test \
#     --model Qwen/Qwen2.5-Coder-7B-Instruct \
#     --base_url http://localhost:30000/v1 \
#     --n_parallel 64 \
#     --generator_example_bugs_dataset bugbench_human \
#     --generator_example_bugs_split train \
#     --generator_n_example_bugs 3 \
#     --evaluate_codegen \
#     --include_failed_test_output \
#     --fixer_attempts_val 1 \
#     --save_results \
#     --output_dir logs

# -----------------------------------------------------------------------------
# With adversarial bugs as examples (different bug style)
# -----------------------------------------------------------------------------
# python examples/bugs_refactor/run_generator_fixer_flow.py \
#     --dataset bigcodebench \
#     --split test \
#     --model Qwen/Qwen2.5-Coder-7B-Instruct \
#     --base_url http://localhost:30000/v1 \
#     --n_parallel 64 \
#     --generator_example_bugs_dataset bugbench_adversarial \
#     --generator_example_bugs_split train \
#     --generator_n_example_bugs 3 \
#     --include_failed_test_output \
#     --fixer_attempts_val 1 \
#     --save_results \
#     --output_dir logs

# -----------------------------------------------------------------------------
# Combine with code embedding similarity for aux reward
# -----------------------------------------------------------------------------
# python examples/bugs_refactor/run_generator_fixer_flow.py \
#     --dataset bigcodebench \
#     --split test \
#     --model Qwen/Qwen2.5-Coder-7B-Instruct \
#     --base_url http://localhost:30000/v1 \
#     --n_parallel 32 \
#     --generator_example_bugs_dataset bugbench_human \
#     --generator_example_bugs_split train \
#     --generator_n_example_bugs 3 \
#     --use_code_embedding_similarity \
#     --code_embedding_reward_weight 0.3 \
#     --reference_bug_dataset bugbench_human \
#     --reference_bug_split train \
#     --include_failed_test_output \
#     --fixer_attempts_val 1 \
#     --save_results \
#     --output_dir logs

# -----------------------------------------------------------------------------
# Multiple validation datasets with example-guided generation
# -----------------------------------------------------------------------------
# python examples/bugs_refactor/run_generator_fixer_flow.py \
#     --val_datasets bigcodebench:test kodcode:test \
#     --model Qwen/Qwen2.5-Coder-7B-Instruct \
#     --base_url http://localhost:30000/v1 \
#     --n_parallel 64 \
#     --generator_example_bugs_dataset bugbench_human \
#     --generator_example_bugs_split train \
#     --generator_n_example_bugs 3 \
#     --evaluate_codegen \
#     --include_failed_test_output \
#     --fixer_attempts_val 1 \
#     --save_results \
#     --output_dir logs
