#!/bin/bash
#
# Launch evaluate_tau_bench.py on the "retail" split with Qwen/Qwen3-32B.
#
# Usage:
#   <this script> [extra evaluate_tau_bench.py arguments...]
#
# Every setting keeps its original hard-coded value as the default and can be
# overridden from the environment without editing this file:
#   CUDA_VISIBLE_DEVICES  GPU indices exposed to the process (default: 0-7)
#   TAU_SPLIT             value passed to --split        (default: retail)
#   TAU_MODEL             value passed to --model        (default: Qwen/Qwen3-32B)
#   TAU_PROMPT_PATH       value passed to --prompt_path
#   TAU_MAX_TASKS         value passed to --max_tasks    (default: 115)
#   TAU_START_INDEX       value passed to --start_index  (default: 0)
#
# NOTE: evaluate_tau_bench.py is resolved relative to the current working
# directory, so run this script from the directory that contains it.

set -euo pipefail

# Respect a device list already set by the caller; only fall back to all
# eight GPUs when nothing was specified.
export CUDA_VISIBLE_DEVICES="${CUDA_VISIBLE_DEVICES:-0,1,2,3,4,5,6,7}"

# Build the argument list as an array so values containing spaces survive
# intact.
eval_args=(
  --split "${TAU_SPLIT:-retail}"
  --model "${TAU_MODEL:-Qwen/Qwen3-32B}"
  --prompt_path "${TAU_PROMPT_PATH:-/code/jiateng-sandbox/taubench_application/Single_turn_tau_bench/prompt_template.txt}"
  --max_tasks "${TAU_MAX_TASKS:-115}"
  --start_index "${TAU_START_INDEX:-0}"
)

# Any arguments given to this script are appended after the defaults and
# forwarded unchanged to the Python entry point.
python evaluate_tau_bench.py "${eval_args[@]}" "$@"