{
  "overall_accuracy": 0.33578431372549017,
  "total_traces": 1224,
  "error_distribution": {
    "other": 813
  },
  "priority_performance": {
    "COMPARISON_ANALYSIS": "65/164 (39.6%)",
    "NUMERICAL_VERIFICATION": "223/614 (36.3%)",
    "ENTITY_HEURISTIC": "92/344 (26.7%)",
    "SUPERLATIVE_REASONING": "31/102 (30.4%)"
  },
  "unit_aware_accuracy": 0.38064516129032255,
  "unit_aware_count": 155
}