{
  "dataset": "CWQ",
  "method": "SoG",
  "model": "Qwen/Qwen3-30B-A3B-Thinking-2507",
  "num_questions": 326,
  "total_llm_calls": 1986,
  "total_input_tokens": 16882682,
  "total_output_tokens": 1930937,
  "total_tokens": 18813619,
  "total_cached_tokens": 0,
  "total_reasoning_tokens": 0,
  "total_time_seconds": 505.5124878883362,
  "avg_time_per_question_seconds": 113.72063786339906,
  "sample_mode": true,
  "total_kg_queries": 1712,
  "exact_match": 0.696,
  "note": "227/326 = 69.6"
}