# Launch the evaluation script (eval/evaluate.py, path relative to the
# current working directory) with a fixed configuration:
#   --save     flag passed through to evaluate.py
#              (presumably persists results — confirm in evaluate.py)
#   --model    Qwen3-30B-A3B
#   --split    answerable-full
#   --toolbox  data
# One option per line so individual settings are easy to diff and edit.
python eval/evaluate.py \
  --save \
  --model 'Qwen3-30B-A3B' \
  --split 'answerable-full' \
  --toolbox 'data'
