# Launch eval/evaluate.py for model "Qwen3-30B-A3B" on the "answerable-full"
# split, passing --n-shots 3 and the --save flag.
#
# The script path is relative, so it is resolved against the current working
# directory of whoever runs this command.
# NOTE(review): --save presumably persists the evaluation results and
# --n-shots presumably sets the number of few-shot examples; confirm both
# against the argument parser in eval/evaluate.py.
python eval/evaluate.py \
  --save \
  --model "Qwen3-30B-A3B" \
  --split "answerable-full" \
  --n-shots 3
