#!/usr/bin/env bash
#
# Launch run_gsm.py in supervisor mode for a single model / split.
#
# Exported variables (visible to the Python child process):
#   MODEL_NAME - value passed as --model-id
#   SET_TORUN  - value passed as --set-to-run
#   RUN_NAME   - "<MODEL_NAME>-<SET_TORUN>-supervisor", passed as --run-name
#   DATASET    - exported only; not passed on the command line below.
#                NOTE(review): presumably read from the environment by
#                run_gsm.py; "humaneval" alongside a script named run_gsm
#                looks possibly mismatched -- confirm against run_gsm.py.
#
# The script's exit status is that of the python invocation (last command).

export MODEL_NAME="qwen3-32b"
export SET_TORUN="test"
export RUN_NAME="${MODEL_NAME}-${SET_TORUN}-supervisor"
export DATASET="humaneval"

# Every expansion is double-quoted so each value reaches python as exactly
# one argument, even if it is later edited to contain spaces or glob chars.
python run_gsm.py \
    --model-id "${MODEL_NAME}" \
    --model-id-summary "gpt-4.1" \
    --run-name "${RUN_NAME}" \
    --set-to-run "${SET_TORUN}" \
    --supervisor