#!/bin/bash
#SBATCH -J leanRL
#SBATCH -p dpg
#SBATCH -A dpg
#SBATCH -N 1
#SBATCH --gres=gpu:1
#SBATCH --cpus-per-task=4
#SBATCH --mem=100G
#SBATCH --time=15-00:00:00
#SBATCH --constraint="gpu_40g+"
#SBATCH --output=/beegfs/scratch/user/<anonymized>/experiments/lean/logs/%A_%a.log
#SBATCH --error=/beegfs/scratch/user/<anonymized>/experiments/lean/logs/%A_%a.err
#SBATCH --array=0-1

# --- Environment setup and job diagnostics ----------------------------------
# Activate conda's base environment first; a failure here is only reported,
# because the later ~/.bashrc + `conda activate` step decides whether the
# project environment is actually usable.
# shellcheck source=/dev/null
source ~/miniconda3/bin/activate \
  || echo "warning: could not source ~/miniconda3/bin/activate" >&2

# Record the job description and the GPU state/topology in the job log.
# These are best-effort diagnostics: their failure does not stop the job.
if [[ -n "${SLURM_JOB_ID:-}" ]]; then
  scontrol show job "${SLURM_JOB_ID}"
fi
nvidia-smi
nvidia-smi topo -m

# Load the user's shell configuration, then switch to the project environment.
# shellcheck source=/dev/null
source ~/.bashrc
# Abort instead of silently continuing with the wrong Python environment.
if ! conda activate verl; then
  echo "error: failed to activate conda environment 'verl'" >&2
  exit 1
fi


# --- Model selection and evaluation -----------------------------------------
# Each array task evaluates one entry of MODELS, selected by
# SLURM_ARRAY_TASK_ID; the list must have an entry for every index in the
# job's --array range.
MODELS=("DeepSeek-Prover-V1.5-SFT" "DeepSeek-Prover-V1.5-RL")

# Fail fast on a missing, non-numeric, or out-of-range index. Without this
# check MODEL would be empty and the evaluation would be launched with
# --model_name "${BASE_PATH}/" and an empty --save_name.
if [[ ! "${SLURM_ARRAY_TASK_ID:-}" =~ ^[0-9]+$ ]]; then
  echo "error: SLURM_ARRAY_TASK_ID must be a non-negative integer (got '${SLURM_ARRAY_TASK_ID:-}')" >&2
  exit 1
fi
# Force base 10 so a value with leading zeros is not parsed as octal.
task_index=$((10#${SLURM_ARRAY_TASK_ID}))
if (( task_index >= ${#MODELS[@]} )); then
  echo "error: SLURM_ARRAY_TASK_ID=${task_index} is out of range; only ${#MODELS[@]} models are configured" >&2
  exit 1
fi

MODEL=${MODELS[task_index]}
# Value passed to --num_samples.
N=4
# Prefix joined with the model name to build --model_name.
# NOTE(review): looks like a Hugging Face Hub organization rather than a
# local checkpoint directory; confirm against eval.eval.
BASE_PATH=deepseek-ai

echo "Running evaluation of ${MODEL}"
# Last command of the script, so its exit status becomes the job's status.
python -m eval.eval \
    --model_name "${BASE_PATH}/${MODEL}" \
    --save_name "${MODEL}" \
    --num_samples "${N}"
