
# Environment for the training launch further down in this script.
# Make GPU indices 0-7 visible to the launched job.
export CUDA_VISIBLE_DEVICES="0,1,2,3,4,5,6,7"
# Have Hydra print complete stack traces instead of the abbreviated error.
export HYDRA_FULL_ERROR=1
# Keep a key already exported by the caller rather than clobbering it with an
# empty string; when none is set the value is still empty, as before. This
# lets the secret come from the environment instead of being written here.
export WANDB_API_KEY="${WANDB_API_KEY:-}"
# export VLLM_ALLOW_LONG_MAX_MODEL_LEN=1



### --------------------------------- Baseline ---------------------------------
# bash sh/baseline/grpo/qwen2.5-math-1.5b-base/MATH/bs256_6k.sh



### --------------------------------- Hint GRPO ---------------------------------
# Run the Hint-GRPO training script. The path is relative, so it is resolved
# against the directory this launcher is invoked from.
hint_grpo_script="sh/hint_grpo/qwen2.5-math-1.5b-base/MATH/bs256_mix_6k.sh"
bash "$hint_grpo_script"
#

