#!/bin/bash
#SBATCH --job-name=seq_v2_early_stop_AIME24_budget16_n2_threshold0.98_QwenR1_fixed_window_3
#SBATCH --output=./slurm_output/%j_seq_v2_early_stop_AIME24_budget16_n2_threshold0.98_QwenR1_fixed_window_3.out
#SBATCH --error=./slurm_output/%j_seq_v2_early_stop_AIME24_budget16_n2_threshold0.98_QwenR1_fixed_window_3.err
#SBATCH --partition=gpu-preempt
#SBATCH --nodes=1
#SBATCH --ntasks-per-node=1
#SBATCH --gres=gpu:a100:1
#SBATCH --cpus-per-task=8
#SBATCH --mem=30GB
#SBATCH --time=10:00:00

# Job body: prepare the runtime environment, then launch src/seq_early_stop.py
# with the AIME24 configuration below. Every setup step is checked so that a
# broken environment aborts the job right away instead of starting the
# experiment with whatever `python` happens to be on PATH.
# All paths are relative and therefore resolved against the job's working
# directory.

# Print an error message to stderr and abort the job with a non-zero status.
die() {
  printf 'error: %s\n' "$*" >&2
  exit 1
}

# Create output directory.
# NOTE(review): Slurm appears to open the --output/--error files before this
# script starts, so ./slurm_output most likely has to exist at submission time;
# this call would then only help later submissions -- confirm against the
# sbatch documentation.
mkdir -p ./slurm_output || die "cannot create ./slurm_output"

# Load CUDA module
module load cuda/11.8 || die "failed to load module cuda/11.8"

# Activate virtual environment
# The activate script only exists on the cluster, so ShellCheck cannot follow it.
# shellcheck disable=SC1091
source ./venv/bin/activate || die "failed to activate ./venv"

# Run the ModelSwitch script in early_stop style.
# Arguments are kept in an array so each flag/value pair sits on its own line
# without relying on backslash continuations.
run_args=(
  --task AIME24
  --gpus 1
  --seed 42
  --budget 16
  --n_sampling 2
  --threshold 0.98
  --models "['QwenR1', 'QwenR1']"
  --fixed_window 3
)

# Last command of the script: its exit status becomes the job's exit status.
python src/seq_early_stop.py "${run_args[@]}"