#!/usr/bin/env bash
SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
REPO_ROOT="$(dirname "$SCRIPT_DIR")"
cd "$REPO_ROOT"

# Defaults matching the original Goedel-Prover-SFT llamacpp run
CONFIG="configs/eval/deepseek_prover_v2_hf_api.yaml"
PROMPT_STRATEGY="discussion_cot"
O=1
SHOTS=2
N_SEEDS=3
N_EPISODES=4
MAX_NEW_TOKENS=512
VOCAB_SIZE=16
DOMAIN="categorical"
VOCAB_PARTITION=true

# Parse --key value overrides
while [[ $# -gt 0 ]]; do
    case "$1" in
        --config)           CONFIG="$2";           shift 2 ;;
        --prompt_strategy)  PROMPT_STRATEGY="$2";  shift 2 ;;
        --o)                O="$2";                shift 2 ;;
        --shots)            SHOTS="$2";            shift 2 ;;
        --n_seeds)          N_SEEDS="$2";          shift 2 ;;
        --n_episodes)       N_EPISODES="$2";       shift 2 ;;
        --max_new_tokens)   MAX_NEW_TOKENS="$2";   shift 2 ;;
        --vocab_size)       VOCAB_SIZE="$2";       shift 2 ;;
        --domain)           DOMAIN="$2";           shift 2 ;;
        --vocab_partition)  VOCAB_PARTITION=true;  shift 1 ;;
        --no_vocab_partition) VOCAB_PARTITION=false; shift 1 ;;
        *) echo "Unknown argument: $1" >&2; exit 1 ;;
    esac
done

VP_FLAG=""
$VOCAB_PARTITION && VP_FLAG="--vocab_partition"

python run_eval.py \
    --config "$CONFIG" \
    --prompt_strategy "$PROMPT_STRATEGY" \
    --o "$O" \
    --shots "$SHOTS" \
    --n_seeds "$N_SEEDS" \
    --n_episodes "$N_EPISODES" \
    --max_new_tokens "$MAX_NEW_TOKENS" \
    --vocab_size "$VOCAB_SIZE" \
    --domain "$DOMAIN" \
    $VP_FLAG
