{
  "benchmark_config": {
    "azure_endpoint": "END_POINT_HERE",
    "model_name": "gpt-5-chat",
    "api_version": "2025-01-01-preview",
    "max_queries_per_run": 50,
    "max_messages_per_context": 50,
    "temperature": 0.1,
    "max_tokens": 8000,
    "evaluation_runs": 3
  },
  "data_paths": {
    "conversation_files": {
      "Finance": "../data/Finance/synthetic_domain_channels_Finance.json",
      "Healthcare": "../data/Healthcare/synthetic_domain_channels_Healthcare.json",
      "Technology": "../data/Technology/synthetic_domain_channels_Technology.json",
      "Manufacturing": "../data/Manufacturing/synthetic_domain_channels_Manufacturing.json"
    },
    "queries_file": {
      "Finance": "./synthetic_queries/generated_user_queries_Finance.json",
      "Healthcare": "./synthetic_queries/generated_user_queries_Healthcare.json",
      "Technology": "./synthetic_queries/generated_user_queries_Technology.json",
      "Manufacturing": "./synthetic_queries/generated_user_queries_Manufacturing.json"
    },
    "output_directory": "./results/gpt_5_chat_benchmark_results"
  },
  "evaluation_criteria": {
    "user_profile_inference": {
      "weight": 0.25,
      "attributes": ["role", "expertise_level", "communication_style", "tone"],
      "scoring_method": "exact_match_weighted"
    },
    "intent_capture": {
      "weight": 0.25,
      "attributes": ["document_type", "target_audience", "temporal_scope", "detail_level"],
      "scoring_method": "semantic_similarity"
    },
    "citation_accuracy": {
      "weight": 0.25,
      "metrics": ["precision", "recall", "relevance"],
      "scoring_method": "f1_score"
    },
    "document_quality": {
      "weight": 0.25,
      "dimensions": [
        "factual_accuracy",
        "citation_quality",
        "structure_organization",
        "completeness",
        "readability",
        "professional_quality",
        "consistency"
      ],
      "scoring_method": "llm_judge_averaged"
    }
  },
  "quality_thresholds": {
    "excellent": 4.0,
    "good": 3.0,
    "fair": 2.0,
    "poor": 1.0
  },
  "visualization_settings": {
    "figure_size": [12, 8],
    "dpi": 300,
    "style": "seaborn-v0_8",
    "color_palette": "husl",
    "save_format": "png"
  },
  "reporting": {
    "generate_individual_reports": true,
    "generate_summary_report": true,
    "generate_visualizations": true,
    "include_error_analysis": true,
    "detailed_citation_analysis": true
  }
}
