{
  "agents4sci_v2": {
    "rigor_traceability": 24.0,
    "integration_causality": 23.0,
    "feasibility_minimality": 18.0,
    "uncertainty_adaptation": 13.0,
    "decisionability": 14.0,
    "overall": 92.0
  },
  "baseline_single": {
    "rigor_traceability": 20.0,
    "integration_causality": 22.0,
    "feasibility_minimality": 16.0,
    "uncertainty_adaptation": 12.0,
    "decisionability": 10.0,
    "overall": 80.0
  },
  "baseline_tree": {
    "rigor_traceability": 22.0,
    "integration_causality": 23.0,
    "feasibility_minimality": 18.0,
    "uncertainty_adaptation": 13.0,
    "decisionability": 12.0,
    "overall": 88.0
  },
  "baseline_debate": {
    "rigor_traceability": 20.0,
    "integration_causality": 22.0,
    "feasibility_minimality": 16.0,
    "uncertainty_adaptation": 11.0,
    "decisionability": 7.0,
    "overall": 76.0
  }
}