#!/usr/bin/env bash
# Table 4 — Mixtral-8x7B-Instruct-v0.1 row
# Runs all 4 (O, S) conditions: O∈{1,4} × S∈{1,2}
# Requires a running vLLM server or offline GPU with enough VRAM.
# See configs/eval/mixtral_vllm.yaml to switch between offline/server mode.
set -euo pipefail

# Resolve the absolute directory that contains this script, independent of
# the caller's working directory.
SCRIPT_DIR="$(dirname "${BASH_SOURCE[0]}")"
SCRIPT_DIR="$(cd "${SCRIPT_DIR}" && pwd)"

# The repository root sits two levels above the script directory.
REPO_ROOT="$(cd "${SCRIPT_DIR}/../.." && pwd)"

# Virtual environment expected as a sibling of the repository root.
# Activation is best-effort: when the directory is absent the script keeps
# whatever Python environment is already active.
VENV="${REPO_ROOT}/../p311TheRockLM_venv"
if [[ -d "${VENV}" ]]; then
  . "${VENV}/bin/activate"
fi

# Every relative path used afterwards is resolved against the repository root.
cd "${REPO_ROOT}"

# Fixed evaluation settings for the Mixtral row of Table 4.
CONFIG="configs/eval/mixtral_vllm.yaml"
N_SEEDS=5
N_EPISODES=64
OUTPUT_DIR="outputs/eval/table4/mixtral"
# Project name forwarded to --wandb_project; taken from the environment when
# set and non-empty, otherwise falls back to "meta-rg-s2b".
WANDB_PROJECT="${WANDB_PROJECT:-meta-rg-s2b}"

# Condition grid: every O value is paired with every S value (2 x 2 = 4 runs).
O_VALUES=(1 4)
S_VALUES=(1 2)
BANNER_RULE="========================================"

for O in "${O_VALUES[@]}"; do
  for S in "${S_VALUES[@]}"; do
    # Announce which condition is about to run.
    printf '%s\n' \
      "${BANNER_RULE}" \
      "  Mixtral  O=${O}  S=${S}" \
      "${BANNER_RULE}"

    # Assemble the command as an array so each argument stays a single word.
    eval_cmd=(
      python run_eval.py
      --config "${CONFIG}"
      --o "${O}"
      --shots "${S}"
      --n_seeds "${N_SEEDS}"
      --n_episodes "${N_EPISODES}"
      --output_dir "${OUTPUT_DIR}"
      --wandb_project "${WANDB_PROJECT}"
    )
    # Under the script's `set -e`, a failing run aborts the remaining sweep.
    "${eval_cmd[@]}"
  done
done

# Blank separator line followed by the completion notice.
printf '\n%s\n' "All Mixtral conditions complete. Results in ${OUTPUT_DIR}/"
