{
  "number_of_domains": 4,
  "total_queries_across_domains": 160,
  "queries_per_domain": {
    "mean": 40,
    "median": 40.0,
    "values": [
      40,
      40,
      40,
      40
    ]
  },
  "averaged_scores": {
    "user_profile_accuracy": {
      "mean": 0.45112193859334687,
      "median": 0.44871747779370513,
      "std_dev": 0.07764419445857072,
      "min": 0.36637429473358507,
      "max": 0.5406785040523922,
      "count": 4
    },
    "intent_capture_accuracy": {
      "mean": 0.4987499999999999,
      "median": 0.5025,
      "std_dev": 0.017969882210706497,
      "min": 0.4749999999999999,
      "max": 0.5149999999999998,
      "count": 4
    },
    "intent_macro_f1": {
      "mean": 0.4987499999999999,
      "median": 0.5025,
      "std_dev": 0.017969882210706497,
      "min": 0.4749999999999999,
      "max": 0.5149999999999998,
      "count": 4
    },
    "context_retrieval_accuracy": {
      "mean": 0.19283544617107823,
      "median": 0.18685069169419077,
      "std_dev": 0.020951379294090553,
      "min": 0.17675999200725753,
      "max": 0.22088040928867386,
      "count": 4
    },
    "citation_accuracy": {
      "mean": 0.17055086070131226,
      "median": 0.16897788982546813,
      "std_dev": 0.0114326655485794,
      "min": 0.15912597125097125,
      "max": 0.18512169190334155,
      "count": 4
    },
    "document_quality_score": {
      "mean": 4.9000625,
      "median": 4.931125,
      "std_dev": 0.06391054131883563,
      "min": 4.804250000000001,
      "max": 4.933749999999998,
      "count": 4
    },
    "overall_score": {
      "mean": 1.2426641490931474,
      "median": 1.240528836614281,
      "std_dev": 0.014676981096479903,
      "min": 1.2271308214963075,
      "max": 1.2624681016477197,
      "count": 4
    }
  },
  "context_retrieval_detailed_metrics": {
    "precision": {
      "mean": 0.21003269590792123,
      "median": 0.10683760683760683,
      "std_dev": 0.2543997832067235,
      "min": 0.0,
      "max": 1.0,
      "count": 160
    },
    "recall": {
      "mean": 0.18770678354940606,
      "median": 0.05964912280701754,
      "std_dev": 0.23601807762784238,
      "min": 0.0,
      "max": 0.9444444444444444,
      "count": 160
    },
    "f1_score": {
      "mean": 0.19283544617107826,
      "median": 0.08546228710462286,
      "std_dev": 0.24016415498603763,
      "min": 0.0,
      "max": 0.9444444444444444,
      "count": 160
    }
  },
  "intent_detailed_averages": {
    "per_field_precision": {
      "tone_preference": {
        "mean": 0.15,
        "median": 0.15,
        "std_dev": 0.020412414523193145,
        "min": 0.125,
        "max": 0.175,
        "count": 4
      },
      "detail_level": {
        "mean": 0.36875,
        "median": 0.35,
        "std_dev": 0.055433894565208634,
        "min": 0.325,
        "max": 0.45,
        "count": 4
      },
      "document_type": {
        "mean": 0.9875,
        "median": 0.9875,
        "std_dev": 0.014433756729740658,
        "min": 0.975,
        "max": 1.0,
        "count": 4
      },
      "target_audience": {
        "mean": 0.64375,
        "median": 0.6625000000000001,
        "std_dev": 0.06574889099191455,
        "min": 0.55,
        "max": 0.7,
        "count": 4
      },
      "temporal_scope": {
        "mean": 0.34375,
        "median": 0.32499999999999996,
        "std_dev": 0.05907269532815761,
        "min": 0.3,
        "max": 0.425,
        "count": 4
      }
    },
    "per_field_recall": {
      "tone_preference": {
        "mean": 0.15,
        "median": 0.15,
        "std_dev": 0.020412414523193145,
        "min": 0.125,
        "max": 0.175,
        "count": 4
      },
      "detail_level": {
        "mean": 0.36875,
        "median": 0.35,
        "std_dev": 0.055433894565208634,
        "min": 0.325,
        "max": 0.45,
        "count": 4
      },
      "document_type": {
        "mean": 0.9875,
        "median": 0.9875,
        "std_dev": 0.014433756729740658,
        "min": 0.975,
        "max": 1.0,
        "count": 4
      },
      "target_audience": {
        "mean": 0.64375,
        "median": 0.6625000000000001,
        "std_dev": 0.06574889099191455,
        "min": 0.55,
        "max": 0.7,
        "count": 4
      },
      "temporal_scope": {
        "mean": 0.34375,
        "median": 0.32499999999999996,
        "std_dev": 0.05907269532815761,
        "min": 0.3,
        "max": 0.425,
        "count": 4
      }
    },
    "per_field_f1": {
      "tone_preference": {
        "mean": 0.15,
        "median": 0.15,
        "std_dev": 0.020412414523193145,
        "min": 0.125,
        "max": 0.175,
        "count": 4
      },
      "detail_level": {
        "mean": 0.36875,
        "median": 0.35,
        "std_dev": 0.055433894565208634,
        "min": 0.325,
        "max": 0.45,
        "count": 4
      },
      "document_type": {
        "mean": 0.9875,
        "median": 0.9875,
        "std_dev": 0.014433756729740658,
        "min": 0.975,
        "max": 1.0,
        "count": 4
      },
      "target_audience": {
        "mean": 0.64375,
        "median": 0.6625000000000001,
        "std_dev": 0.06574889099191455,
        "min": 0.55,
        "max": 0.7,
        "count": 4
      },
      "temporal_scope": {
        "mean": 0.34375,
        "median": 0.32499999999999996,
        "std_dev": 0.05907269532815761,
        "min": 0.3,
        "max": 0.425,
        "count": 4
      }
    }
  },
  "quality_dimensions_averages": {
    "personalization_fidelity": {
      "mean": 4.7375,
      "median": 5.0,
      "std_dev": 0.6392556599218644,
      "min": 0.0,
      "max": 5.0,
      "count": 160
    },
    "factuality": {
      "mean": 4.95,
      "median": 5.0,
      "std_dev": 0.41663521893903466,
      "min": 0.0,
      "max": 5.0,
      "count": 160
    },
    "citation_quality": {
      "mean": 4.94375,
      "median": 5.0,
      "std_dev": 0.41815009450404567,
      "min": 0.0,
      "max": 5.0,
      "count": 160
    },
    "fluency": {
      "mean": 4.96875,
      "median": 5.0,
      "std_dev": 0.39528470752104744,
      "min": 0.0,
      "max": 5.0,
      "count": 160
    },
    "structure": {
      "mean": 4.9125,
      "median": 5.0,
      "std_dev": 0.45401770391879887,
      "min": 0.0,
      "max": 5.0,
      "count": 160
    },
    "temporal_task_accuracy": {
      "mean": 4.8875,
      "median": 5.0,
      "std_dev": 0.4756657036566964,
      "min": 0.0,
      "max": 5.0,
      "count": 160
    },
    "overall_score": {
      "mean": 4.9000625,
      "median": 5.0,
      "std_dev": 0.4196771698422401,
      "min": 0.0,
      "max": 5.0,
      "count": 160
    }
  },
  "aggregated_score_distribution": {
    "excellent": 0,
    "good": 0,
    "fair": 0,
    "poor": 160
  },
  "overall_distribution_percentage": {
    "excellent": 0.0,
    "good": 0.0,
    "fair": 0.0,
    "poor": 100.0
  },
  "per_domain_results": {
    "gpt_5_chat_benchmark_results_finance": {
      "total_queries": 40,
      "average_scores": {
        "user_profile_accuracy": 0.36637429473358507,
        "intent_capture_accuracy": 0.49499999999999994,
        "intent_macro_f1": 0.49499999999999994,
        "context_retrieval_accuracy": 0.17675999200725753,
        "citation_accuracy": 0.16426982074069613,
        "document_quality_score": 4.93325,
        "overall_score": 1.2271308214963075
      },
      "context_retrieval_metrics": {
        "precision": {
          "mean": 0.18733695729572586,
          "count": 40
        },
        "recall": {
          "mean": 0.1749522146479314,
          "count": 40
        },
        "f1_score": {
          "mean": 0.17675999200725756,
          "count": 40
        }
      },
      "intent_detailed_metrics": {
        "per_field_precision": {
          "tone_preference": 0.15,
          "detail_level": 0.35,
          "document_type": 1.0,
          "target_audience": 0.675,
          "temporal_scope": 0.3
        },
        "per_field_recall": {
          "tone_preference": 0.15,
          "detail_level": 0.35,
          "document_type": 1.0,
          "target_audience": 0.675,
          "temporal_scope": 0.3
        },
        "per_field_f1": {
          "tone_preference": 0.15,
          "detail_level": 0.35,
          "document_type": 1.0,
          "target_audience": 0.675,
          "temporal_scope": 0.3
        },
        "average_macro_f1": 0.49499999999999994,
        "evaluated_fields": [
          "tone_preference",
          "detail_level",
          "document_type",
          "target_audience",
          "temporal_scope"
        ]
      },
      "score_distribution": {
        "excellent": 0,
        "good": 0,
        "fair": 0,
        "poor": 40
      },
      "quality_dimensions": {
        "personalization_fidelity": {
          "mean": 4.8,
          "median": 5.0,
          "std_dev": 0.4640954808922571,
          "min": 3.0,
          "max": 5.0,
          "count": 40
        },
        "factuality": {
          "mean": 4.975,
          "median": 5.0,
          "std_dev": 0.15811388300841897,
          "min": 4.0,
          "max": 5.0,
          "count": 40
        },
        "citation_quality": {
          "mean": 4.95,
          "median": 5.0,
          "std_dev": 0.22072142786315224,
          "min": 4.0,
          "max": 5.0,
          "count": 40
        },
        "fluency": {
          "mean": 5.0,
          "median": 5.0,
          "std_dev": 0.0,
          "min": 5.0,
          "max": 5.0,
          "count": 40
        },
        "structure": {
          "mean": 4.95,
          "median": 5.0,
          "std_dev": 0.22072142786315224,
          "min": 4.0,
          "max": 5.0,
          "count": 40
        },
        "temporal_task_accuracy": {
          "mean": 4.925,
          "median": 5.0,
          "std_dev": 0.2667467828369185,
          "min": 4.0,
          "max": 5.0,
          "count": 40
        },
        "overall_score": {
          "mean": 4.93325,
          "median": 5.0,
          "std_dev": 0.16379141676268694,
          "min": 4.33,
          "max": 5.0,
          "count": 40
        }
      }
    },
    "gpt_5_chat_benchmark_results_healthcare": {
      "total_queries": 40,
      "average_scores": {
        "user_profile_accuracy": 0.4108244812159355,
        "intent_capture_accuracy": 0.4749999999999999,
        "intent_macro_f1": 0.4749999999999999,
        "context_retrieval_accuracy": 0.22088040928867386,
        "citation_accuracy": 0.17368595891024013,
        "document_quality_score": 4.929,
        "overall_score": 1.2418781698829697
      },
      "context_retrieval_metrics": {
        "precision": {
          "mean": 0.24055270730394657,
          "count": 40
        },
        "recall": {
          "mean": 0.21651629756361593,
          "count": 40
        },
        "f1_score": {
          "mean": 0.22088040928867386,
          "count": 40
        }
      },
      "intent_detailed_metrics": {
        "per_field_precision": {
          "target_audience": 0.55,
          "detail_level": 0.35,
          "temporal_scope": 0.35,
          "document_type": 0.975,
          "tone_preference": 0.15
        },
        "per_field_recall": {
          "target_audience": 0.55,
          "detail_level": 0.35,
          "temporal_scope": 0.35,
          "document_type": 0.975,
          "tone_preference": 0.15
        },
        "per_field_f1": {
          "target_audience": 0.55,
          "detail_level": 0.35,
          "temporal_scope": 0.35,
          "document_type": 0.975,
          "tone_preference": 0.15
        },
        "average_macro_f1": 0.4749999999999999,
        "evaluated_fields": [
          "target_audience",
          "detail_level",
          "temporal_scope",
          "document_type",
          "tone_preference"
        ]
      },
      "score_distribution": {
        "excellent": 0,
        "good": 0,
        "fair": 0,
        "poor": 40
      },
      "quality_dimensions": {
        "personalization_fidelity": {
          "mean": 4.725,
          "median": 5.0,
          "std_dev": 0.5986094998689324,
          "min": 2.0,
          "max": 5.0,
          "count": 40
        },
        "factuality": {
          "mean": 4.975,
          "median": 5.0,
          "std_dev": 0.15811388300841897,
          "min": 4.0,
          "max": 5.0,
          "count": 40
        },
        "citation_quality": {
          "mean": 4.975,
          "median": 5.0,
          "std_dev": 0.15811388300841897,
          "min": 4.0,
          "max": 5.0,
          "count": 40
        },
        "fluency": {
          "mean": 5.0,
          "median": 5.0,
          "std_dev": 0.0,
          "min": 5.0,
          "max": 5.0,
          "count": 40
        },
        "structure": {
          "mean": 4.95,
          "median": 5.0,
          "std_dev": 0.22072142786315224,
          "min": 4.0,
          "max": 5.0,
          "count": 40
        },
        "temporal_task_accuracy": {
          "mean": 4.95,
          "median": 5.0,
          "std_dev": 0.22072142786315224,
          "min": 4.0,
          "max": 5.0,
          "count": 40
        },
        "overall_score": {
          "mean": 4.929,
          "median": 5.0,
          "std_dev": 0.15521366580066992,
          "min": 4.33,
          "max": 5.0,
          "count": 40
        }
      }
    },
    "gpt_5_chat_benchmark_results_manufacturing": {
      "total_queries": 40,
      "average_scores": {
        "user_profile_accuracy": 0.5406785040523922,
        "intent_capture_accuracy": 0.5149999999999998,
        "intent_macro_f1": 0.5149999999999998,
        "context_retrieval_accuracy": 0.17684304142459975,
        "citation_accuracy": 0.15912597125097125,
        "document_quality_score": 4.804250000000001,
        "overall_score": 1.2391795033455923
      },
      "context_retrieval_metrics": {
        "precision": {
          "mean": 0.19729170107852284,
          "count": 40
        },
        "recall": {
          "mean": 0.16667932203840197,
          "count": 40
        },
        "f1_score": {
          "mean": 0.17684304142459975,
          "count": 40
        }
      },
      "intent_detailed_metrics": {
        "per_field_precision": {
          "tone_preference": 0.125,
          "target_audience": 0.7,
          "temporal_scope": 0.3,
          "detail_level": 0.45,
          "document_type": 1.0
        },
        "per_field_recall": {
          "tone_preference": 0.125,
          "target_audience": 0.7,
          "temporal_scope": 0.3,
          "detail_level": 0.45,
          "document_type": 1.0
        },
        "per_field_f1": {
          "tone_preference": 0.125,
          "target_audience": 0.7,
          "temporal_scope": 0.3,
          "detail_level": 0.45,
          "document_type": 1.0
        },
        "average_macro_f1": 0.5149999999999998,
        "evaluated_fields": [
          "tone_preference",
          "target_audience",
          "temporal_scope",
          "detail_level",
          "document_type"
        ]
      },
      "score_distribution": {
        "excellent": 0,
        "good": 0,
        "fair": 0,
        "poor": 40
      },
      "quality_dimensions": {
        "personalization_fidelity": {
          "mean": 4.6,
          "median": 5.0,
          "std_dev": 0.9554164080758257,
          "min": 0.0,
          "max": 5.0,
          "count": 40
        },
        "factuality": {
          "mean": 4.875,
          "median": 5.0,
          "std_dev": 0.7905694150420949,
          "min": 0.0,
          "max": 5.0,
          "count": 40
        },
        "citation_quality": {
          "mean": 4.875,
          "median": 5.0,
          "std_dev": 0.7905694150420949,
          "min": 0.0,
          "max": 5.0,
          "count": 40
        },
        "fluency": {
          "mean": 4.875,
          "median": 5.0,
          "std_dev": 0.7905694150420949,
          "min": 0.0,
          "max": 5.0,
          "count": 40
        },
        "structure": {
          "mean": 4.825,
          "median": 5.0,
          "std_dev": 0.8129559864454139,
          "min": 0.0,
          "max": 5.0,
          "count": 40
        },
        "temporal_task_accuracy": {
          "mean": 4.775,
          "median": 5.0,
          "std_dev": 0.83166499665831,
          "min": 0.0,
          "max": 5.0,
          "count": 40
        },
        "overall_score": {
          "mean": 4.80425,
          "median": 5.0,
          "std_dev": 0.7942385080643646,
          "min": 0.0,
          "max": 5.0,
          "count": 40
        }
      }
    },
    "gpt_5_chat_benchmark_results_technology": {
      "total_queries": 40,
      "average_scores": {
        "user_profile_accuracy": 0.48661047437147475,
        "intent_capture_accuracy": 0.51,
        "intent_macro_f1": 0.51,
        "context_retrieval_accuracy": 0.1968583419637818,
        "citation_accuracy": 0.18512169190334155,
        "document_quality_score": 4.933749999999998,
        "overall_score": 1.2624681016477197
      },
      "context_retrieval_metrics": {
        "precision": {
          "mean": 0.21494941795348962,
          "count": 40
        },
        "recall": {
          "mean": 0.1926792999476749,
          "count": 40
        },
        "f1_score": {
          "mean": 0.19685834196378182,
          "count": 40
        }
      },
      "intent_detailed_metrics": {
        "per_field_precision": {
          "tone_preference": 0.175,
          "temporal_scope": 0.425,
          "target_audience": 0.65,
          "document_type": 0.975,
          "detail_level": 0.325
        },
        "per_field_recall": {
          "tone_preference": 0.175,
          "temporal_scope": 0.425,
          "target_audience": 0.65,
          "document_type": 0.975,
          "detail_level": 0.325
        },
        "per_field_f1": {
          "tone_preference": 0.175,
          "temporal_scope": 0.425,
          "target_audience": 0.65,
          "document_type": 0.975,
          "detail_level": 0.325
        },
        "average_macro_f1": 0.51,
        "evaluated_fields": [
          "tone_preference",
          "temporal_scope",
          "target_audience",
          "document_type",
          "detail_level"
        ]
      },
      "score_distribution": {
        "excellent": 0,
        "good": 0,
        "fair": 0,
        "poor": 40
      },
      "quality_dimensions": {
        "personalization_fidelity": {
          "mean": 4.825,
          "median": 5.0,
          "std_dev": 0.3848076442547927,
          "min": 4.0,
          "max": 5.0,
          "count": 40
        },
        "factuality": {
          "mean": 4.975,
          "median": 5.0,
          "std_dev": 0.15811388300841897,
          "min": 4.0,
          "max": 5.0,
          "count": 40
        },
        "citation_quality": {
          "mean": 4.975,
          "median": 5.0,
          "std_dev": 0.15811388300841897,
          "min": 4.0,
          "max": 5.0,
          "count": 40
        },
        "fluency": {
          "mean": 5.0,
          "median": 5.0,
          "std_dev": 0.0,
          "min": 5.0,
          "max": 5.0,
          "count": 40
        },
        "structure": {
          "mean": 4.925,
          "median": 5.0,
          "std_dev": 0.2667467828369185,
          "min": 4.0,
          "max": 5.0,
          "count": 40
        },
        "temporal_task_accuracy": {
          "mean": 4.9,
          "median": 5.0,
          "std_dev": 0.3038218101251,
          "min": 4.0,
          "max": 5.0,
          "count": 40
        },
        "overall_score": {
          "mean": 4.93375,
          "median": 5.0,
          "std_dev": 0.15415090009467997,
          "min": 4.33,
          "max": 5.0,
          "count": 40
        }
      }
    }
  }
}