# Install Python packages from inside the eval/ directory.
# Every `cd` is checked: if a directory is missing the script stops here
# instead of running `pip install -e .` against whatever directory the shell
# happens to be in.
cd eval || { echo "error: cannot cd into 'eval'" >&2; exit 1; }

pip install pebble
# latex2sympy is installed in editable mode from its own source directory.
cd latex2sympy || { echo "error: cannot cd into 'eval/latex2sympy'" >&2; exit 1; }
pip install -e .
# Return to eval/ (the directory entered at the top of this section).
cd .. || { echo "error: cannot cd back to parent directory" >&2; exit 1; }
pip install word2number timeout_decorator jieba matplotlib

# ---- User configuration: replace the placeholder values below ----
# Checkpoint directory; handed to the launch command as --run_name.
CKPT_DIR="path-to-your-ckpt-dir"
# Base model directory; handed to the launch command as --init_model
# (for the evaluation of step 0).
BASE_MODEL="path-to-your-base-model-dir"
# Weights & Biases project name. The variable name is spelled WANBD (sic);
# the launch command references this exact name, so rename both together.
WANBD_PROJECT="your-wandb-project-name"

# Exported so that child processes inherit the device list.
CUDA_VISIBLE_DEVICES="0,1,2,3,4,5,6,7"
export CUDA_VISIBLE_DEVICES

# Launch the evaluation script with the configured checkpoint directory,
# base model and wandb project, on the benchmark list given below.
# The variable expansions are double-quoted so that a value containing
# whitespace or glob characters is passed as exactly one argument.
# NOTE(review): the dependency setup earlier in this file leaves the working
# directory inside eval/, so this relative path resolves to
# eval/eval/eval_scripts/eval_math_nodes.sh from the starting directory.
# Confirm that matches the repository layout.
bash eval/eval_scripts/eval_math_nodes.sh \
    --run_name "${CKPT_DIR}" \
    --init_model "${BASE_MODEL}" \
    --template qwen-boxed \
    --tp_size 1 \
    --add_step_0 true \
    --temperature 1.0 \
    --top_p 0.95 \
    --max_tokens 16000 \
    --benchmarks amc23,aime24,aime25,math500,gsm8k,minerva_math,olympiadbench,mmlu_stem \
    --n_sampling 1 \
    --wandb_project "${WANBD_PROJECT}"