#!/usr/bin/env bash
#
# Submit scripts/generate.slurm to Slurm via sbatch.
#
# The job is named "<TASK>_generate_<POLICY>" and the batch script receives
# two positional arguments, in this order: POLICY, then TASK.
#
# The batch script path is relative, so run this from the directory that
# contains scripts/ (presumably the repository root -- confirm).
#
# The exit status of this script is the exit status of sbatch.

# Values forwarded to the batch script. Edit these to submit a different run.
# NOTE(review): TASK looks like a task/dataset name and POLICY a model
# identifier; their exact meaning is defined by scripts/generate.slurm.
TASK=math
POLICY=qwen-25-7b

# Expansions are quoted so that values containing whitespace or glob
# characters reach sbatch as single, unmodified arguments.
sbatch --job-name="${TASK}_generate_${POLICY}" scripts/generate.slurm "${POLICY}" "${TASK}"