#!/usr/bin/env bash
set -euo pipefail

# Resolve the directory containing this script to an absolute path, then make
# its parent (the repository root) the working directory so that the relative
# paths used later (run_eval.py, configs/...) resolve no matter where the
# script was launched from.
#
# CDPATH is emptied for the inner `cd`: with an inherited CDPATH a relative
# directory operand may be looked up elsewhere, and `cd` then also writes the
# directory name to stdout, which would end up inside SCRIPT_DIR.
# `--` keeps a path that starts with `-` from being parsed as an option.
SCRIPT_DIR="$(CDPATH='' cd -- "$(dirname -- "${BASH_SOURCE[0]}")" && pwd)"
REPO_ROOT="$(dirname -- "$SCRIPT_DIR")"
cd -- "$REPO_ROOT"

# ---------------------------------------------------------------------------
# Evaluation settings shared by every model run below.
# ---------------------------------------------------------------------------

# --- prompt / few-shot ---
PROMPT_STRATEGY='few_shot_discussion_cot'
SHOTS=1
N_FEW_SHOT_GAMES=10

# --- seeds / episodes ---
# NOTE(review): the original line carried a trailing "#0" — presumably the
# previous seed value; confirm before relying on it.
BASE_SEED=10
N_SEEDS=1
N_EPISODES=4

# --- generation ---
MAX_NEW_TOKENS=256

# --- task / vocabulary ---
DOMAIN='categorical'
O=1
VOCAB_SIZE=16
VOCAB_PARTITION=true
V_MIN=3

# Model config files to evaluate, in execution order. Paths are relative to
# the repository root. The list is assembled one model family at a time
# (families as they appear in the file names).
CONFIGS=()

# DeepSeek-Prover configs
CONFIGS+=(
    'configs/eval/deepseek_prover_v1_hf.yaml'
    'configs/eval/deepseek_prover_v1_5_sft_hf.yaml'
    'configs/eval/deepseek_prover_v1_5_rl_hf.yaml'
    'configs/eval/deepseek_prover_v2_7b_hf.yaml'
    'configs/eval/deepseek_prover_v2_hf_api.yaml'
)

# Goedel-Prover configs
CONFIGS+=(
    'configs/eval/goedel_prover_sft_hf.yaml'
    'configs/eval/goedel_prover_dpo_hf.yaml'
    'configs/eval/goedel_prover_v2_8b_hf.yaml'
    'configs/eval/goedel_prover_v2_32b_hf_api.yaml'
)

# Kimina-Prover configs
CONFIGS+=(
    'configs/eval/kimina_prover_distill_8b_hf.yaml'
    'configs/eval/kimina_prover_72b_hf_api.yaml'
)

# Interpreter used for every evaluation run: the python binary of the
# p311EvoX2_venv virtualenv located one level above the repository root.
PYTHON="${REPO_ROOT}/../p311EvoX2_venv/bin/python"

# Exported so that each child python process inherits it.
# NOTE(review): presumably read by PyTorch's ROCm backend to enable
# experimental AOTriton kernels — confirm against the PyTorch version in use.
TORCH_ROCM_AOTRITON_ENABLE_EXPERIMENTAL=1
export TORCH_ROCM_AOTRITON_ENABLE_EXPERIMENTAL

# Flags handed unchanged to run_eval.py for every config. They are collected
# once in an array so the per-model command stays short and each value is
# passed as exactly one argument.
EVAL_ARGS=(
    --base_seed "$BASE_SEED"
    --prompt_strategy "$PROMPT_STRATEGY"
    --o "$O"
    --shots "$SHOTS"
    --n_seeds "$N_SEEDS"
    --n_episodes "$N_EPISODES"
    --max_new_tokens "$MAX_NEW_TOKENS"
    --vocab_size "$VOCAB_SIZE"
    --domain "$DOMAIN"
    --n_few_shot_games "$N_FEW_SHOT_GAMES"
    --v_min "$V_MIN"
)

# Honour the VOCAB_PARTITION setting: the switch is passed only when the
# variable is exactly "true". Previously the flag was hard-coded, so changing
# VOCAB_PARTITION had no effect on the run.
if [[ "${VOCAB_PARTITION:-false}" == "true" ]]; then
    EVAL_ARGS+=(--vocab_partition)
fi
EVAL_ARGS+=(--inductive_verbaliser)

# Evaluate each model config in turn. Because the script runs under `set -e`,
# a non-zero exit from run_eval.py stops the script before later configs run.
for CONFIG in "${CONFIGS[@]}"; do
    echo "========================================================"
    echo "Running: $CONFIG"
    echo "========================================================"
    "$PYTHON" run_eval.py --config "$CONFIG" "${EVAL_ARGS[@]}"
done

# Closing banner, reached only after the loop above has finished.
printf '%s\n' \
    '========================================================' \
    'All models complete.' \
    '========================================================'
