#!/usr/bin/env bash
# Sampling-parameter sweep for ../evaluate_aime_moi_vllm.py on one dataset.
#
# Invokes the evaluation script once for every combination of temperature,
# top_p, beta and model listed in the loops below (3 * 4 * 6 * 4 = 288 runs),
# one after another. All paths are relative to the current working directory,
# so launch this from a directory whose parent contains
# evaluate_aime_moi_vllm.py. Results are written under ./results/aime/.
#
# There is intentionally no `set -e`: a failing run does not abort the sweep,
# the next combination is simply started.

dataset_name="AI-MO/aimo-validation-aime"

for temp in 0.6 1.0 0.8; do
  for top_p in 0.95 0.8 0.6 0.4; do
    for beta in 0.25 0.5 1 2 4 8; do
      for model_name in \
        "Qwen/QwQ-32B" \
        "nvidia/Llama-3_3-Nemotron-Super-49B-v1" \
        "google/gemma-3-27b-it" \
        "BytedTsinghua-SIA/DAPO-Qwen-32B"; do

        # Prepend the parent directory to PYTHONPATH. The ${VAR:+...} form
        # only adds the ':' separator when PYTHONPATH already has a value,
        # so an unset/empty PYTHONPATH does not leave a trailing empty entry.
        # All expansions are quoted so values are passed as single arguments.
        VLLM_USE_V1=1 \
        TOKENIZERS_PARALLELISM=false \
        PYTHONPATH="../${PYTHONPATH:+:${PYTHONPATH}}" \
          python ../evaluate_aime_moi_vllm.py \
            --model_name "$model_name" \
            --dataset_name "$dataset_name" \
            --max_new_tokens 32768 \
            --temperature "$temp" \
            --top_p "$top_p" \
            --beta "$beta" \
            --eager true \
            --output_dir "./results/aime/"
      done
    done
  done
done