#!/bin/bash
#SBATCH --job-name=model_switch_GSM8K_n_sampling2_Qwen
#SBATCH --output=./slurm_output/%j_model_switch_GSM8K_n_sampling2_Qwen.out
#SBATCH --error=./slurm_output/%j_model_switch_GSM8K_n_sampling2_Qwen.err
#SBATCH --partition=gpu-preempt
#SBATCH --nodes=1
#SBATCH --ntasks-per-node=1
#SBATCH --gres=gpu:a100:1
#SBATCH --cpus-per-task=8
#SBATCH --mem=30GB
#SBATCH --time=10:00:00

# Job body: prepare the environment, then run the ModelSwitch experiment.
# The relative paths below (./LLM_R, ./slurm_output, src/) resolve against
# the directory the job runs in.

# Print a message to stderr (which lands in the job's --error file) and
# abort the job with a non-zero status.
die() {
  printf 'ERROR: %s\n' "$*" >&2
  exit 1
}

# Load CUDA module. Stop here on failure instead of continuing without the
# requested toolchain.
module load cuda/11.8 || die "could not load module cuda/11.8"

# Activate virtual environment. If activation fails, running `python` anyway
# would pick up whatever interpreter happens to be on PATH, so abort instead.
source ./LLM_R/Symbolic-MoE/venv/bin/activate \
  || die "could not activate venv at ./LLM_R/Symbolic-MoE/venv"

# Create output directory (best-effort, failure is not fatal).
# NOTE(review): the #SBATCH --output/--error files point into this directory,
# and Slurm opens them before this script starts, so the directory presumably
# has to exist already at submit time — confirm and create it before `sbatch`.
mkdir -p ./slurm_output

# Run the ModelSwitch script in early_stop style. It is the last command, so
# its exit status becomes the exit status of the job script.
python src/model_switch_early_stop_style.py \
    --task GSM8K \
    --gpus 1 \
    --seed 42 \
    --n_sampling 2 \
    --consistency_threshold 1.0 \
    --voting_strategy ms_mad \
    --models "['Qwen', 'Qwen', 'Qwen']"