#!/bin/bash
#SBATCH --job-name=weighted_method_MMLU_Pro_Qwen_s63
#SBATCH --output=./slurm_output/%j_weighted_method_MMLU_Pro_Qwen_s63.out
#SBATCH --error=./slurm_output/%j_weighted_method_MMLU_Pro_Qwen_s63.err
#SBATCH --partition=gpu,gpu-preempt
#SBATCH --nodes=1
#SBATCH --ntasks-per-node=1
#SBATCH --gres=gpu:a100:1
#SBATCH --cpus-per-task=8
#SBATCH --mem=40GB
#SBATCH --time=4:00:00

# Stop at the first failing step so that a broken module load or virtualenv
# activation does not fall through to running python in the wrong environment.
# `-u` is intentionally not enabled: activate/module scripts may read
# variables that are unset.
set -eo pipefail

# Input CSV handed to weighted_method.py as its positional argument.
# The path contains a literal "[Qwen]", which an unquoted shell word would
# treat as a bracket glob; it is single-quoted here and double-quoted at the
# point of use so it is always passed through verbatim.
readonly INPUT_CSV='./Results/skills_3/MMLU_Pro/self_con_seed63_budget16_acc61.38_models[Qwen]_with_logprobs.csv'

# Local snapshot directory passed as --tokenizer_name.
readonly TOKENIZER_PATH='/datasets/ai/qwen/hub/models--Qwen--Qwen2.5-7B-Instruct/snapshots/a09a35458c702b33eeacc393d103063234e8bc28/'

# Load CUDA module
module load cuda/11.8

# Activate virtual environment (path is relative to the job's working directory)
source ./venv/bin/activate

# Create output directory.
# NOTE: Slurm opens the --output/--error files before this script starts, so
# ./slurm_output must already exist at submission time; this mkdir only
# guarantees the directory is present for subsequent submissions.
mkdir -p ./slurm_output

# Run src/weighted_method.py on the input CSV with the threshold and
# LLM-call-limit lists given below.
python src/weighted_method.py \
    "${INPUT_CSV}" \
    --thresholds 0.7 0.75 0.8 0.85 0.9 0.95 0.99 0.999 0.9999 \
    --llm_call_limit_list 4 8 16 \
    --model_name all-MiniLM-L6-v2 \
    --tokenizer_name "${TOKENIZER_PATH}"