#!/usr/bin/env bash
#
# Hyperparameter sweep over ../evaluate_tinyzero_moi_vllm.py.
#
# Runs the evaluation script once, sequentially, for every combination of
# model, temperature, top_p and beta listed below (4 * 3 * 4 * 6 = 288 runs).
#
# All paths ("../", "./results/tinyzero/") are relative, so they resolve
# against the directory the script is launched from.
#
# Exit status: 0 if every run succeeded, 1 if at least one run failed.

# -u: fail on unset variables; pipefail: surface failures inside pipelines.
# -e is deliberately NOT set: one failing configuration must not abort the
# remainder of the sweep. Failures are counted and reported at the end.
set -uo pipefail

dataset_name="yzhuang/tinyzero-Countdown-Tasks-4"

model_names=(
  "Qwen/QwQ-32B"
  "nvidia/Llama-3_3-Nemotron-Super-49B-v1"
  "google/gemma-3-27b-it"
  "BytedTsinghua-SIA/DAPO-Qwen-32B"
)
temps=(0.6 0.8 1.0)
top_ps=(0.4 0.6 0.8 0.95)
betas=(0.25 0.5 1 2 4 8)

# Number of evaluation runs that exited with a non-zero status.
failed=0

for model_name in "${model_names[@]}"; do
  for temp in "${temps[@]}"; do
    for top_p in "${top_ps[@]}"; do
      for beta in "${betas[@]}"; do
        # ${PYTHONPATH:-} keeps the original "../:<existing>" value while
        # staying safe under `set -u` when PYTHONPATH is not set.
        if ! VLLM_USE_V1=1 TOKENIZERS_PARALLELISM=false \
          PYTHONPATH="../:${PYTHONPATH:-}" \
          python ../evaluate_tinyzero_moi_vllm.py \
            --model_name "$model_name" \
            --dataset_name "$dataset_name" \
            --max_new_tokens 8192 \
            --temperature "$temp" \
            --top_p "$top_p" \
            --eager true \
            --beta "$beta" \
            --output_dir "./results/tinyzero/"; then
          printf 'FAILED: model=%s temp=%s top_p=%s beta=%s\n' \
            "$model_name" "$temp" "$top_p" "$beta" >&2
          failed=$((failed + 1))
        fi
      done
    done
  done
done

# The loop above runs every job in the foreground, so this returns
# immediately unless something else in the shell started background jobs.
wait

if ((failed > 0)); then
  printf '%d job(s) failed.\n' "$failed" >&2
  exit 1
fi

echo "All jobs complete."
