#!/usr/bin/env bash
# Run Autocomp on the 5-kernel subset with Gemini 3.1 Pro ONLY.
#
# The existing output/jaxbench-sweep/ used a Pro+Flash mix (MODELS = [pro, flash]).
# This script overrides that to Pro-only so we can compare Iter+ctx Pro vs.
# Autocomp Pro head-to-head on the same model budget.
#
# Output:
#   output/jaxbench-sweep-pro/{prob_id}_baseline_translate/
#   output/jaxbench-sweep-pro/{prob_id}_baseline/
# Strict mode: abort on any failing command, unset variable, or failed
# pipeline stage. In particular, a failed `cd` or a non-zero exit from
# run_batch.py stops the script before the closing "DONE" banner is printed.
set -euo pipefail

# run_batch.py and the output directory are given as relative paths, so the
# working directory must be the Autocomp checkout.
cd /path/to/autocomp

# Exported so it is visible in the environment of run_batch.py.
# NOTE(review): presumably toggles profiling in the JAXBench backend -- the
# consumer of this variable is not visible from this script; confirm there.
export AUTOCOMP_JAXBENCH_PROFILE=1

# Single source of truth for the values that appear both in the banner and in
# the run_batch.py command line.
readonly model_spec="gcp::gemini-3.1-pro-preview"
readonly output_base="output/jaxbench-sweep-pro"
readonly rule="============================================"

# Problem identifiers forwarded to run_batch.py via --probs.
readonly -a kernels=(
    "12p_RMSNorm"
    "5p_Flex_Attention"
    "15p_RetNet_Retention"
    "16p_Mamba2_SSD"
    "1p_Flash_Attention"
)

# Opening banner. The model line shows the bare model name, i.e. the spec
# with its leading "gcp::" prefix stripped.
printf '%s\n' \
    "${rule}" \
    "Autocomp on 5-kernel subset (Pro-only)" \
    "Model: ${model_spec#gcp::}" \
    "Output: ${output_base}" \
    "${rule}"

# Assemble the argument vector as an array so every element reaches
# run_batch.py as exactly one word.
run_args=(
    --probs "${kernels[@]}"
    --models "${model_spec}"
    --output-base "${output_base}"
)
python run_batch.py "${run_args[@]}"

# Closing banner, preceded by one blank line. Only reached when run_batch.py
# exited with status 0 (see strict mode above).
printf '\n%s\n%s\n%s\n' \
    "${rule}" \
    "DONE: Autocomp Pro-only on 5-kernel subset" \
    "${rule}"
