from .prompts import domain_expert_instructions, radiologist_instructions
import os
import asyncio
from typing import Dict, List, Any, Optional
from langchain_core.messages import AIMessage, HumanMessage
from langgraph.graph import StateGraph, START, END
from langchain_core.runnables import RunnableConfig
from langchain_openai import ChatOpenAI
import json
import numpy as np
from collections import Counter

from .state import CoordinatorState, PathResult
from .configuration import Configuration
from typing import Dict, List, Any, cast
from langchain_core.messages import AIMessage, HumanMessage
from langgraph.graph import StateGraph, START, END
from langgraph.types import Send
from langchain_core.runnables import RunnableConfig
from google.genai import Client
from langchain_google_genai import ChatGoogleGenerativeAI
from langchain_openai import ChatOpenAI
import itertools
import re

from .state import (
    CoordinatorState,
    DomainExpertState,
    RadiologistState,
    SymptomAnalystState,
    WebSearchState,
    DiagnoserState,
    PatientInfo,
    FactCheckState  
)
from .configuration import Configuration
from .prompts import (
    get_current_date,
    domain_expert_instructions,
    radiologist_instructions,
)
from .utils import resolve_urls, get_citations, insert_citation_markers

import requests
import json
from langchain_openai import ChatOpenAI

serper_api_key = 'YOUR_KEY'

API_KEY = 'YOUR_KEY'

GEMINI_API_KEY = "YOUR_KEY"

if not GEMINI_API_KEY:
    raise ValueError("GEMINI_API_KEY is not set")

genai_client = Client(api_key=GEMINI_API_KEY)

def has_medical_images(state: CoordinatorState) -> bool:
    """Check if the case has actual medical images or meaningful imaging information"""
    
    # Check for actual image contents
    image_contents = getattr(state, 'image_contents', [])
    if image_contents and len(image_contents) > 0:
        return True
    
    # Check for meaningful imaging descriptions in clinical text
    clinical_text = ""
    if hasattr(state, "clinical_text") and state.clinical_text:
        clinical_text = state.clinical_text
    elif hasattr(state, "patient_info") and state.patient_info:
        clinical_text = state.patient_info.clinical_text
    
    # Look for imaging section with actual content
    if "## Imaging Information" in clinical_text:
        try:
            imaging_section = clinical_text.split("## Imaging Information")[1]
            if "##" in imaging_section:
                imaging_section = imaging_section.split("##")[0]
            
            # Check if imaging section has meaningful content beyond just filenames
            imaging_content = imaging_section.strip()
            
            # Skip if only contains image file references without descriptions
            if len(imaging_content) < 50 or imaging_content.count("Image file:") > 0 and len(imaging_content.replace("Image file:", "").strip()) < 20:
                return False
                
            return True
        except:
            pass
    
    return False

# 2. Create a dummy radiologist state for cases without images
def create_dummy_radiologist_state() -> Dict[str, Any]:
    """Create a dummy radiologist state when no images are available"""
    return {
        "radiologist_state": {
            "image_findings": [{
                "region": "No Images Available",
                "finding": "No medical images provided for analysis"
            }],
            "limitations": ["No imaging data available for interpretation"]
        }
    }

# 3. Modified radiologist analysis with image check
def radiologist_analysis_conditional(state: CoordinatorState, config: RunnableConfig) -> RadiologistState:
    """Conditional radiologist analysis - only runs if images are present"""
    
    if not has_medical_images(state):
        print("No medical images detected, skipping radiologist analysis")
        return create_dummy_radiologist_state()
    
    print("Medical images detected, proceeding with radiologist analysis")
    return radiologist_analysis(state, config)

# 4. Modified run_analysis_with_hallucination_check for conditional radiology
def run_conditional_radiologist_analysis(state, config):
    """Run radiologist analysis with conditional logic and hallucination checking"""
    
    if not has_medical_images(state):
        print("  Radiologist Analysis - Skipping (no images)")
        return create_dummy_radiologist_state()
    
    print("  Radiologist Analysis - Running with hallucination detection...")
    return run_analysis_with_hallucination_check(
        radiologist_analysis, state, config, "Radiologist Analysis"
    )

def initial_cot_reasoning(state: CoordinatorState, config: RunnableConfig) -> CoordinatorState:
    configurable = Configuration.from_runnable_config(config)
    
    llm = ChatOpenAI(
        api_key=API_KEY,
        model=configurable.diagnoser_model,
        max_retries=2
    )
    
    original_case = ""
    if hasattr(state, "clinical_text") and state.clinical_text:
        original_case = state.clinical_text
    elif hasattr(state, "patient_info") and state.patient_info:
        original_case = state.patient_info.clinical_text
    
    diagnostic_options_text = ""
    if hasattr(state, "diagnostic_options") and state.diagnostic_options:
        diagnostic_options_text = "\n".join([f"Option {k}: {v}" for k, v in state.diagnostic_options.items()])
    
    image_contents = []
    if hasattr(state, "image_contents") and state.image_contents:
        image_contents = state.image_contents
        print(f"Found {len(image_contents)} images for CoT analysis")
    
    if not image_contents:
        cot_prompt = f"""
You are a medical expert. Please analyze this clinical case step by step and select the most likely diagnosis.

## Clinical Case
{original_case}

## Answer Choices
{diagnostic_options_text}

Please use Chain-of-Thought reasoning:
1. Identify key symptoms and findings from the clinical text
2. Consider all available imaging information mentioned in the case
3. Apply differential diagnosis thinking
4. Select the most likely option based on all available evidence

Format your response as:
CHAIN OF THOUGHT:
[Your step-by-step reasoning including analysis of any imaging findings mentioned]

SELECTED OPTION: [Write only the letter: A, B, C, D, or E]
"""
        
        print("Performing CoT reasoning with text and imaging descriptions...")
        result = llm.invoke(cot_prompt)
        result_content = result.content
    else:
        cot_prompt = f"""
You are a medical expert. Please analyze this clinical case step by step, including the provided medical images, and select the most likely diagnosis.

## Clinical Case
{original_case}

## Auxiliary Images
Auxiliary images are provided for your analysis. Please carefully examine them as part of your diagnostic reasoning.

## Answer Choices
{diagnostic_options_text}

Please use Chain-of-Thought reasoning:
1. Identify key symptoms and findings from the clinical text
2. Analyze the provided medical images for relevant findings
3. Integrate clinical and imaging information
4. Apply differential diagnosis thinking
5. Select the most likely option based on all available evidence

Format your response as:
CHAIN OF THOUGHT:
[Your step-by-step reasoning including analysis of clinical findings AND imaging findings]

SELECTED OPTION: [Write only the letter: A, B, C, D, or E]
"""
        
        message_content = [{"type": "text", "text": cot_prompt}]
        
        for image in image_contents:
            message_content.append(image)
        
        from langchain.schema import HumanMessage
        messages = [HumanMessage(content=message_content)]
        
        print("Performing CoT reasoning with images...")
        result = llm.invoke(messages)
        result_content = result.content
    
    cot_reasoning = ""
    cot_selected_option = ""
    
    if "CHAIN OF THOUGHT:" in result_content:
        reasoning_section = result_content.split("CHAIN OF THOUGHT:")[1]
        if "SELECTED OPTION:" in reasoning_section:
            cot_reasoning = reasoning_section.split("SELECTED OPTION:")[0].strip()
            option_section = reasoning_section.split("SELECTED OPTION:")[1].strip()
            option_match = re.search(r'^([A-E])', option_section)
            if option_match:
                cot_selected_option = option_match.group(1)
        else:
            cot_reasoning = reasoning_section.strip()
    else:
        cot_reasoning = result_content
    
    if not cot_selected_option:
        patterns = [
            r'SELECTED OPTION:\s*([A-E])',
            r'(?:answer|choice|option)[\s:]*([A-E])',
            r'(?:the\s+)?(?:correct\s+)?(?:answer|choice|option)\s+is\s+([A-E])',
            r'\b([A-E])\s*(?:is\s+(?:the\s+)?(?:correct|right|best|most\s+likely))',
        ]
        
        for pattern in patterns:
            matches = re.findall(pattern, result_content, re.IGNORECASE)
            if matches:
                cot_selected_option = matches[-1].upper()
                break
    
    print(f"CoT reasoning completed. Selected option: {cot_selected_option}")
    
    state_dict = state.model_dump()
    state_dict["cot_reasoning"] = cot_reasoning
    state_dict["cot_selected_option"] = cot_selected_option
    state_dict["cot_full_response"] = result_content
    
    return CoordinatorState(**state_dict)

def judge_cot_result(state: CoordinatorState, config: RunnableConfig) -> CoordinatorState:
    
    cot_selected_option = getattr(state, 'cot_selected_option', '')
    
    print(f"CoT completed with option {cot_selected_option}, proceeding to expert analysis pipeline")
    
    state_dict = state.model_dump()
    state_dict["cot_is_correct"] = False  
    state_dict["incorrect_options"] = []  
    
    return CoordinatorState(**state_dict)


def generate_simple_diagnosis(state: CoordinatorState, config: RunnableConfig) -> CoordinatorState:
    cot_reasoning = getattr(state, 'cot_reasoning', '')
    cot_selected_option = getattr(state, 'cot_selected_option', '')
    
    final_message = f"""# Diagnostic Analysis Result

{cot_reasoning}

## Selected Option
**Option {cot_selected_option}**

## Quality Assessment
✅ Initial Chain-of-Thought reasoning was verified as correct.
"""
    
    print(f"Simple diagnosis generated for correct CoT result: Option {cot_selected_option}")
    
    state_dict = state.model_dump()
    state_dict["messages"] = [AIMessage(content=final_message)]
    
    return CoordinatorState(**state_dict)


def fact_check_cot(state: CoordinatorState, config: RunnableConfig) -> CoordinatorState:
    cot_full_response = getattr(state, 'cot_full_response', '')
    
    fact_check_record = fact_check_analysis(
        state, config, 
        "Initial CoT Reasoning", 
        cot_full_response
    )
    
    print("CoT fact-check completed, proceeding to expert analysis...")
    
    state_dict = state.model_dump()
    
    if 'fact_check_records' not in state_dict:
        state_dict['fact_check_records'] = []
    state_dict['fact_check_records'].append(fact_check_record)
    
    return CoordinatorState(**state_dict)


def route_after_judger(state: CoordinatorState) -> str:
    is_correct = getattr(state, 'cot_is_correct', False)
    
    if is_correct:
        return "generate_simple_diagnosis"
    else:
        return "fact_check_cot"


def process_patient_info(state: CoordinatorState, config: RunnableConfig) -> CoordinatorState:
    state_dict = state.model_dump()
    state_dict["consultation_round"] = 1
    
    state_dict["fact_check_records"] = []
    
    clinical_text = ""
    if hasattr(state, "clinical_text") and state.clinical_text:
        clinical_text = state.clinical_text
    else:
        if state.messages and len(state.messages) > 0:
            message_content = state.messages[0].content
            if isinstance(message_content, list):
                for content_item in message_content:
                    if content_item.get("type") == "text":
                        clinical_text = content_item.get("text", "")
                        break
            else:
                clinical_text = message_content or ""
    
    image_filenames = []
    if "## Imaging Information" in clinical_text:
        try:
            imaging_section = clinical_text.split("## Imaging Information")[1]
            if "##" in imaging_section:
                imaging_section = imaging_section.split("##")[0]
            
            image_matches = re.findall(r'- Image file: ([^\n]+)', imaging_section)
            image_filenames = [match.strip() for match in image_matches]
        except:
            pass
    
    # try:
    patient_info = PatientInfo(clinical_text=clinical_text, medical_images=image_filenames)
    state_dict["patient_info"] = patient_info.model_dump()
    print(f"Created patient_info with clinical_text length: {len(clinical_text)}")

    
    image_contents = []
    if hasattr(state, "image_contents") and state.image_contents:
        image_contents = state.image_contents
        print(f"Found {len(image_contents)} actual images")
    else:
        if state.messages and len(state.messages) > 0:
            message_content = state.messages[0].content
            if isinstance(message_content, list):
                for content_item in message_content:
                    if content_item.get("type") == "image_url":
                        image_contents.append(content_item)
        print(f"Processing text-only input (no actual images)")
    
    state_dict["image_contents"] = image_contents

    if hasattr(state, "diagnostic_options"):
        state_dict["diagnostic_options"] = state.diagnostic_options
    
    return CoordinatorState(**state_dict)

def multimodal_fact_check_analysis(state, config, analysis_name, analysis_text):
    """Enhanced fact check analysis with multimodal support"""
    
    image_contents = getattr(state, 'image_contents', [])
    if not image_contents:
        image_contents = []
    
    original_clinical_text = getattr(state, 'clinical_text', '')
    if not original_clinical_text and hasattr(state, 'patient_info'):
        original_clinical_text = state.patient_info.clinical_text
    
    configurable = Configuration.from_runnable_config(config)
    
    llm = ChatOpenAI(
        api_key=API_KEY,
        model=configurable.fact_check_model if hasattr(configurable, 'fact_check_model') else "gpt-4-turbo-preview",
        # temperature=0.1,
        max_retries=2
    )
    
    fact_check_prompt = f"""
You are a medical fact checker. Your task is to verify the accuracy and consistency of medical analysis against the original clinical information and any provided images.

## Original Clinical Information
{original_clinical_text}

## Analysis to Fact-Check: {analysis_name}
{analysis_text}

Please perform the following fact-checking tasks:

1. **CONSISTENCY CHECK**: Compare the analysis result with the original clinical text and visible image findings
   - Are all extracted symptoms/findings actually mentioned in the original text or visible in images?
   - Are there any contradictions or misinterpretations?
   - Are there any fabricated or hallucinated information?

2. **COMPLETENESS CHECK**: Assess if important information was missed
   - Are there key symptoms or findings in the original text that weren't captured?
   - Are there important image findings that were overlooked?
   - Is the analysis comprehensive relative to the available information?

3. **ACCURACY CHECK**: Verify medical accuracy
   - Are medical terms used correctly?
   - Are interpretations medically sound?
   - Are image interpretations accurate based on what's actually visible?
   - Are there any obvious medical errors?

Pay special attention to:
- Image-based claims that should match what's actually visible
- Medical findings that should be supported by the clinical text or images
- Diagnostic reasoning that should be logical and evidence-based

Format your response as:

**FACT CHECK RESULT: [PASS/PARTIAL/FAIL]**

**CONSISTENCY ISSUES:**
- [List any inconsistencies, or "None detected"]

**ACCURACY CONCERNS:**
- [List any accuracy problems, or "None detected"]

**MISSED INFORMATION:**
- [List any important omissions, or "None detected"]

**OVERALL ASSESSMENT:**
[Brief summary of the fact check results]

**RECOMMENDATIONS:**
- [List 2-3 recommendations for improvement, or "Analysis meets quality standards"]
"""
    
    if image_contents and len(image_contents) > 0:
        message_content = [{"type": "text", "text": fact_check_prompt}]
        for image in image_contents:
            message_content.append(image)
        messages = [HumanMessage(content=message_content)]
        result = llm.invoke(messages)
    else:
        result = llm.invoke(fact_check_prompt)
    
    result_content = result.content
    
    fact_check_result = "UNKNOWN"
    consistency_issues = []
    missed_information = []
    accuracy_concerns = []
    overall_assessment = ""
    recommendations = []
    
    if "FACT CHECK RESULT:" in result_content:
        result_line = result_content.split("FACT CHECK RESULT:")[1].split("\n")[0]
        if "PASS" in result_line.upper():
            fact_check_result = "PASS"
        elif "FAIL" in result_line.upper():
            fact_check_result = "FAIL"
        elif "PARTIAL" in result_line.upper():
            fact_check_result = "PARTIAL"
    

    fact_check_record = {
        "analysis_type": analysis_name,
        "result": fact_check_result,
        "consistency_issues": consistency_issues,
        "missed_information": missed_information,
        "accuracy_concerns": accuracy_concerns,
        "overall_assessment": overall_assessment,
        "recommendations": recommendations,
        "timestamp": "2024-12-28",  
        "full_response": result_content,
        "multimodal_check": len(image_contents) > 0 if image_contents else False,
        "image_count": len(image_contents) if image_contents else 0
    }
    
    print(f"Fact-check completed for {analysis_name}: {fact_check_result}")
    if image_contents:
        print(f"  - Multimodal check with {len(image_contents)} images")
    if fact_check_result == "FAIL":
        print(f"  - Consistency issues: {len(consistency_issues)}")
        print(f"  - Accuracy concerns: {len(accuracy_concerns)}")
    
    return fact_check_record


def domain_expert_analysis(state: CoordinatorState, config: RunnableConfig) -> DomainExpertState:
    configurable = Configuration.from_runnable_config(config)
    
    llm = ChatOpenAI(
        api_key=API_KEY,
        model=configurable.domain_expert_model,
        # temperature=1.0,
        max_retries=2
    )
    
    if hasattr(state, "clinical_text") and state.clinical_text:
        clinical_text = state.clinical_text
    else:
        clinical_text = state.patient_info.clinical_text if hasattr(state, 'patient_info') else "No clinical text available"
    
    print(f"Domain Expert analyzing clinical text: {clinical_text[:100]}...")
    
    formatted_prompt = domain_expert_instructions.format(
        clinical_text=clinical_text
    )

    improvement_guidance = getattr(state, 'improvement_guidance', '')

    # import pdb; pdb.set_trace()
    
    if improvement_guidance:
        base_prompt = f"{improvement_guidance}\n\n{formatted_prompt}"
        print(f"Domain Expert applying improvement guidance: {len(improvement_guidance)} characters")
    else:
        base_prompt = formatted_prompt

    result = llm.invoke(base_prompt)
    result_content = result.content
    print(f"Domain Expert result received")
    
    extracted_symptoms = []
    clinical_findings = {}
    family_history = []
    past_medical_history = []
    
    if "FAMILY MEDICAL HISTORY:" in result_content:
        family_history_text = result_content.split("FAMILY MEDICAL HISTORY:")[1].split("PAST MEDICAL HISTORY:" if "PAST MEDICAL HISTORY:" in result_content else "\n\n")[0].strip()
        family_history = [condition.strip() for condition in family_history_text.split("-") if condition.strip()]
    
    if "PAST MEDICAL HISTORY" in result_content:
        past_history_text = result_content.split("PAST MEDICAL HISTORY:")[1].split("EXTRACTED SYMPTOMS:" if "EXTRACTED SYMPTOMS:" in result_content else "\n\n")[0].strip()
        past_medical_history = [condition.strip() for condition in past_history_text.split("- ") if condition.strip()]

    if "EXTRACTED SYMPTOMS:" in result_content:
        symptoms_text = result_content.split("EXTRACTED SYMPTOMS:")[1].split("CLINICAL FINDINGS:" if "CLINICAL FINDINGS:" in result_content else "\n\n")[0].strip()
        extracted_symptoms = [symptom.strip() for symptom in symptoms_text.split("-") if symptom.strip()]
    
    if "CLINICAL FINDINGS:" in result_content:
        findings_text = result_content.split("CLINICAL FINDINGS:")[1].strip()
        system_sections = findings_text.split("\n\n")
        
        for section in system_sections:
            if ":" in section:
                system, findings = section.split(":", 1)
                system = system.strip()
                findings_list = [f.strip() for f in findings.strip().split("-") if f.strip()]
                clinical_findings[system] = findings_list
    
    if not family_history:
        family_history = ["No family medical history available"]
    if not past_medical_history:
        past_medical_history = ["No past medical history available"]
    if not extracted_symptoms:
        extracted_symptoms = ["No specific symptoms extracted"]
    if not clinical_findings:
        clinical_findings = {"General": ["Patient case needs further analysis"]}
    
    return {
        "domain_expert_state": {
            "family_medical_history": family_history,
            "past_medical_history": past_medical_history,
            "extracted_symptoms": extracted_symptoms,
            "clinical_findings": clinical_findings
        },
    }


def radiologist_analysis(state: CoordinatorState, config: RunnableConfig) -> RadiologistState:
    configurable = Configuration.from_runnable_config(config)
    
    llm = ChatOpenAI(
        api_key=API_KEY,
        model=configurable.radiologist_model,
        # temperature=1.0,
        max_retries=2
    )
    
    # import pdb;pdb.set_trace()
    image_contents = []
    if hasattr(state, "image_contents") and state.image_contents:
        image_contents = state.image_contents
        print(f"Found {len(image_contents)} images in state.image_contents")
    
    medical_images_desc = ""
    # import pdb;pdb.set_trace()
    if not image_contents:
        if hasattr(state, "clinical_text") and state.clinical_text:
            medical_images_desc = state.clinical_text
        elif hasattr(state, "patient_info") and state.patient_info:
            medical_images_desc = state.patient_info.clinical_text
        else:
            medical_images_desc = "No medical images or descriptions available."
            
        if "## Imaging Information" in medical_images_desc:
            try:
                imaging_section = medical_images_desc.split("## Imaging Information")[1]
                if "##" in imaging_section:
                    imaging_section = imaging_section.split("##")[0]
                medical_images_desc = imaging_section.strip()
            except:
                pass
        
        formatted_prompt = radiologist_instructions.format(
            medical_images=medical_images_desc
        )

        improvement_guidance = getattr(state, 'improvement_guidance', '')

        # import pdb;pdb.set_trace()

        if improvement_guidance:
            base_prompt = f"{improvement_guidance}\n\n{formatted_prompt}"
            print(f"Radiologist applying improvement guidance: {len(improvement_guidance)} characters")
        else:
            base_prompt = formatted_prompt

        result = llm.invoke(base_prompt)
        result_content = result.content
    else:
        medical_images_desc = "Medical images provided in this consultation. Please analyze."
        
        formatted_prompt = radiologist_instructions.format(
            patient_info=state.patient_info.clinical_text,
            medical_images=medical_images_desc
        )

        improvement_guidance = getattr(state, 'improvement_guidance', '')

        if improvement_guidance:
            base_prompt = f"{improvement_guidance}\n\n{formatted_prompt}"
        else:
            base_prompt = formatted_prompt

        message_content = [{"type": "text", "text": base_prompt}]

        for image in image_contents:
            message_content.append(image)
        
        # messages = [
        #     {"role": "user", "content": message_content}
        # ]
        from langchain.schema import HumanMessage
        
        messages = [HumanMessage(content=message_content)]
        
        print(f"Radiologist analyzing with images...")
        result = llm.invoke(messages)
        result_content = result.content

    print(f"Radiologist result received")
    
    image_findings = []
    limitations = []
    # import pdb;pdb.set_trace()
    if "IMAGE FINDINGS:" in result_content:
        # Extract the findings section
        findings_text = result_content.split("IMAGE FINDINGS:")[1]
        if "LIMITATIONS" in findings_text:
            findings_text = findings_text.split("LIMITATIONS")[0]
        findings_text = findings_text.strip()
        
        # Split by main finding blocks (each starts with "- **Region/Organ**:" or similar)
        finding_blocks = re.split(r'\n- \*\*', findings_text)
        
        for block in finding_blocks:
            if not block.strip():
                continue
                
            # Add back the "**" that was removed by split
            if not block.startswith('**'):
                block = '**' + block
            
            finding_dict = {}
            
            # Extract Region/Organ (main identifier)
            region_match = re.search(r'\*\*Region/Organ\*\*:\s*([^\n]+)', block, re.IGNORECASE)
            if region_match:
                finding_dict["region"] = region_match.group(1).strip()
            
            # Extract all other fields using regex
            patterns = {
                "distribution": r'\*\*Distribution\*\*:\s*([^\n]+)',
                "number": r'\*\*Number\*\*:\s*([^\n]+)',
                "size": r'\*\*Size\*\*:\s*([^\n]+)',
                "density": r'\*\*Density\*\*:\s*([^\n]+)',
                "margins": r'\*\*Margins\*\*:\s*([^\n]+)',
                "laterality": r'\*\*Laterality\*\*:\s*([^\n]+)',
                "associated_features": r'\*\*Associated features\*\*:\s*([^\n]+)'
            }
            
            for key, pattern in patterns.items():
                match = re.search(pattern, block, re.IGNORECASE)
                if match:
                    finding_dict[key] = match.group(1).strip()
            
            # Only add if we found at least a region
            if finding_dict.get("region"):
                image_findings.append(finding_dict)

    if "LIMITATIONS:" in result_content:
        limitations_text = result_content.split("LIMITATIONS:")[1].strip()
        limitations = [limit.strip() for limit in limitations_text.split("-") if limit.strip()]

    # import pdb;pdb.set_trace()
    if not image_findings:
        image_findings = [{
            "region": "General",
            "finding": "Analysis of the provided case indicates medical imaging would be beneficial for diagnosis."
        }]
    
    if not limitations:
        limitations = ["No specific limitations"]

    # import pdb; pdb.set_trace()
    return {
        "radiologist_state": {
            "image_findings": image_findings,
            "limitations": limitations
        },
    }



def web_search(state: CoordinatorState, config: RunnableConfig) -> Dict[str, Any]:
    configurable = Configuration.from_runnable_config(config)
    
    # import pdb;pdb.set_trace()
    all_observations = getattr(state, 'all_observations', [])
    if not all_observations:
        return {"web_search_state": {
            "search_results": [],
            "research_findings": "No observations to research",
            "searched_combinations": []
        }}
    
    print(f"Web research with {len(all_observations)} observations")
    
    combinations = list(itertools.combinations(all_observations, 2)) if len(all_observations) >= 2 else []
    
    max_combinations = 10
    if len(combinations) > max_combinations:
        combinations = combinations[:max_combinations]
    
    print(f"Searching {len(combinations)} combinations")
    
    all_research_findings = []
    
    llm = ChatOpenAI(
        api_key=API_KEY,  
        model=configurable.web_search_google_model,  
        # temperature=0,
        max_retries=2
    )
    
    for combo in combinations:
        print(f"Searching: {' + '.join(combo)}")
        
        # try:
        search_query = f"medical association between {' and '.join(combo)} research studies peer reviewed"
        search_results = search_with_serper(search_query, serper_api_key)
        
        # import pdb; pdb.set_trace()

        search_context = ""
        if 'organic_results' in search_results and search_results['organic_results']:
            for result in search_results['organic_results'][:3]: 
                search_context += f"Title: {result.get('title', '')}\n"
                search_context += f"Snippet: {result.get('snippet', '')}\n\n"
        
        if 'related_questions' in search_results and search_results['related_questions']:
            search_context += "\nRelated Medical Questions:\n"
            for question in search_results['related_questions'][:2]:  
                search_context += f"Q: {question.get('question', '')}\n"
                search_context += f"A: {question.get('snippet', '')}\n\n"
        
        if not search_context.strip():
            search_context = "No relevant search results found."
        
        analysis_prompt = f"""Based on the following search results about medical associations between {' and '.join(combo)}, 
research and summarize the findings into one sentence. Make sure you only tell the findings without cliche and include all existing rare associations and relationships.

Search Results:
{search_context}

Please provide a concise, factual summary focusing on medical associations and relationships."""
        
        response = llm.invoke(analysis_prompt)
        response_text = response.content if response.content else "No analysis generated."
        
        all_research_findings.append({
            'combination': combo,
            'findings': response_text[:500] + "..." if len(response_text) > 500 else response_text
        })
            
        # except Exception as e:
        #     print(f"Search failed for {combo}: {e}")
        #     all_research_findings.append({
        #         'combination': combo,
        #         'findings': f"Search failed: {str(e)}"
        #     })
    
    merged_findings = ""
    for result in all_research_findings:
        combo_str = " + ".join(result['combination'])
        merged_findings += f"[{combo_str}]: {result['findings']}\n\n"
    
    return {"web_search_state": {
        "research_findings": merged_findings,
        "searched_combinations": combinations,
        "search_count": len(combinations)
    }}


def search_with_serper(query: str, serper_api_key: str) -> dict:
    # url = "https://google.serper.dev/search"
    
    
    # headers = {
    #     'X-API-KEY': serper_api_key,
    #     'Content-Type': 'application/json'
    # }
    from serpapi import GoogleSearch

    params = {
        "api_key": "19490efe3a8641768bfa1f416269233921aa89d7e07c64c7ea252593ed391d07",
        "engine": "google",
        "q": query,
        "location": "Austin, Texas, United States",
        "google_domain": "google.com",
        "gl": "us",
        "hl": "en"
    }

    # try:
    response = GoogleSearch(params).get_dict()
    return response
   

def diagnose(state: CoordinatorState, config: RunnableConfig) -> DiagnoserState:
    
    configurable = Configuration.from_runnable_config(config)
    
    original_case = ""
    if hasattr(state, "clinical_text") and state.clinical_text:
        original_case = state.clinical_text
    elif hasattr(state, "patient_info") and state.patient_info:
        original_case = state.patient_info.clinical_text
    
    domain_expert_results = getattr(state, 'domain_expert_state', {})
    symptoms_text = "\n".join([
        "\n".join(f"- {symptom}" for symptom in domain_expert_results.get("extracted_symptoms", [])),
        "\n".join(f"- {key}: {finding}" for key, finding in domain_expert_results.get("clinical_findings", {}).items()),
        "\n".join(f"- Family History: {condition}" for condition in domain_expert_results.get("family_medical_history", [])),
        "\n".join(f"- Past Medical History: {condition}" for condition in domain_expert_results.get("past_medical_history", []))
    ])

    radiologist_results = getattr(state, 'radiologist_state', {})
    imaging_findings = "\n".join([
        f"- {finding['region']}: " + "; ".join([
            f"{label}: {finding[key]}" 
            for key, label in [
                ("distribution", "Distribution"),
                ("number", "Number"),
                ("size", "Size"), 
                ("density", "Density"),
                ("margins", "Margins"),
                ("laterality", "Laterality"),
                ("associated_features", "Associated features")
            ]
            if key in finding and finding[key] and finding[key].lower() not in ["not applicable", "n/a", "none"]
        ])
        for finding in radiologist_results.get("image_findings", [])
        if isinstance(finding, dict) and finding.get('region')
    ])

    research_findings = ""
    if state.web_search_state and isinstance(state.web_search_state, dict):
        research_findings = state.web_search_state.get("research_findings", "")
    
    diagnostic_options_text = ""
    if hasattr(state, "diagnostic_options") and state.diagnostic_options:
        diagnostic_options_text = "\n".join([f"Option {k}: {v}" for k, v in state.diagnostic_options.items()])
    
   
    llm = ChatOpenAI(
        api_key=API_KEY,
        model=configurable.diagnoser_model,
        max_retries=2
    )
    
    diagnostic_prompt = f"""
You are a medical expert. Based on all the clinical information below, answer the given question and select the most likely diagnosis step by step, then provide your diagnostic reasoning.

## Clinical Case
{original_case}

## Key Clinical Observations from Expert Analysis
{symptoms_text}

## Imaging Findings
{imaging_findings}

## Medical Literature Findings
{research_findings}

## Answer Choices
{diagnostic_options_text}

Instructions:
1. Combine information from expert analysis, imaging and literature to form comprehensive diagnostic reasoning
2. Select the MOST LIKELY answer from the given options based on all available evidence
3. Consider all options carefully and provide thorough justification

Please format your response EXACTLY as follows:

REASONING PATH:
[Provide detailed step-by-step analysis connecting symptoms to diagnosis]

SELECTED OPTION: [Write only the letter: A, B, C, D, or E]

Remember: You MUST select one of the provided options (A, B, C, D, or E). End your response with "SELECTED OPTION: [LETTER]"
"""
    
    print("Generating diagnostic reasoning without correct answer guidance...")
    
    improvement_guidance = getattr(state, 'improvement_guidance', '')
    
    if improvement_guidance:
        diagnostic_prompt = f"{improvement_guidance}\n\n{diagnostic_prompt}"
        print(f"Diagnoser applying improvement guidance: {len(improvement_guidance)} characters")
    
    result = llm.invoke(diagnostic_prompt)
    result_content = result.content
    print(f"Raw diagnosis result: {result_content[:200]}...")
    
    
    if not selected_option:
        patterns = [
            r'SELECTED OPTION:\s*([A-E])',
            r'(?:answer|choice|option)[\s:]*([A-E])',
            r'(?:the\s+)?(?:correct\s+)?(?:answer|choice|option)\s+is\s+([A-E])',
            r'\b([A-E])\s*(?:is\s+(?:the\s+)?(?:correct|right|best|most\s+likely))',
            r'(?:diagnosis|option)\s+([A-E])',
            r'^([A-E])[\.\:\s]',
            r'\(([A-E])\)',
        ]
        
        for pattern in patterns:
            matches = re.findall(pattern, result_content, re.IGNORECASE | re.MULTILINE)
            if matches:
                selected_option = matches[-1].upper()
                break
    
    
    fact_check_record = fact_check_analysis(
        state, config, 
        "Diagnostic Reasoning", 
        result_content
    )
    
    print(f"Diagnosis completed. Selected option: {selected_option}")
    
    return {
        "diagnoser_state": {
            "reasoning_path": reasoning_path,
            "selected_option": selected_option,
            "full_response": result_content
        },
        "fact_check_record": fact_check_record
    }


def finalize_result(state: CoordinatorState, config: RunnableConfig) -> Dict[str, Any]:
    
    debug_state_info(state, "FINALIZE_RESULT")
    
    reasoning_path = ""
    selected_option = ""
    
    if state.diagnoser_state and isinstance(state.diagnoser_state, dict):
        reasoning_path = state.diagnoser_state.get("reasoning_path", "")
        selected_option = state.diagnoser_state.get("selected_option", "")
    
    fact_check_summary = generate_fact_check_summary(state)
    
    final_message = f"""# Diagnostic Analysis Result

## Reasoning Path
{reasoning_path}

## Selected Option
**Option {selected_option}**

{fact_check_summary}
"""
    
    return {
        "messages": [AIMessage(content=final_message)]
    }



def route_coordinator(state: CoordinatorState) -> str:
    return "web_search"


def domain_expert_with_fact_check(state: CoordinatorState, config: RunnableConfig) -> Dict[str, Any]:
    result = domain_expert_analysis(state, config)
    
    update_dict = {}
    
    if 'domain_expert_state' in result:
        update_dict['domain_expert_state'] = result['domain_expert_state']
    
    if 'fact_check_record' in result:
        update_dict['fact_check_records'] = [result['fact_check_record']]
        
        print(f"Domain Expert fact-check added. Total records: {len(update_dict['fact_check_records'])}")

    return update_dict


def radiologist_with_fact_check(state: CoordinatorState, config: RunnableConfig) -> Dict[str, Any]:
    result = radiologist_analysis(state, config)
    
    update_dict = {}
    
    if 'radiologist_state' in result:
        update_dict['radiologist_state'] = result['radiologist_state']
    
    if 'fact_check_record' in result:
        update_dict['fact_check_records'] = [result['fact_check_record']]
        
        print(f"Radiologist fact-check added. Added records: {len(update_dict['fact_check_records'])}")

    return update_dict


def diagnoser_with_fact_check(state: CoordinatorState, config: RunnableConfig) -> Dict[str, Any]:
    result = diagnose(state, config)
    
    update_dict = {}
    
    if 'diagnoser_state' in result:
        update_dict['diagnoser_state'] = result['diagnoser_state']
    
    if 'fact_check_record' in result:
        update_dict['fact_check_records'] = [result['fact_check_record']]

        print(f"Diagnoser fact-check added. Total records: {len(update_dict['fact_check_records'])}")

    return update_dict

def hallucination_detector(config: RunnableConfig, analysis_text: str, original_clinical_text: str, analysis_type: str, image_contents: List[Dict] = None) -> Dict[str, Any]:
    configurable = Configuration.from_runnable_config(config)

    llm = ChatOpenAI(
        api_key=API_KEY,
        model=configurable.fact_check_model if hasattr(configurable, 'fact_check_model') else "gpt-4-turbo-preview",
        # temperature=0.1,
        max_retries=2
    )
    
    hallucination_prompt = f"""
You are a medical hallucination detector. Your task is to identify any fabricated, imagined, or unsupported medical information in the analysis.

## Original Clinical Text
{original_clinical_text}

## Analysis Type: {analysis_type}
## Analysis to Check
{analysis_text}

Please identify:

1. **FABRICATED INFORMATION**: Any medical findings, symptoms, or details mentioned in the analysis that are NOT present in the original clinical text or visible in any provided images
2. **UNSUPPORTED CLAIMS**: Medical interpretations that go beyond what can reasonably be inferred from the original text and images
3. **CONTRADICTIONS**: Any statements that contradict the original clinical information or contradict what's visible in the images

Pay special attention to:
- Image-related claims that don't match what's actually visible in the provided images
- Medical findings described that aren't present in the original clinical text
- Diagnostic interpretations that go beyond the evidence provided

Format your response as:

**HALLUCINATION DETECTED: [YES/NO]**

**FABRICATED INFORMATION:**
- [List any fabricated details, or "None detected"]

**UNSUPPORTED CLAIMS:**
- [List any unsupported medical claims, or "None detected"]

**CONTRADICTIONS:**
- [List any contradictions, or "None detected"]

**CONFIDENCE SCORE: [0-100]%**
(How confident you are in this hallucination assessment)

**RECOMMENDATION:**
[Provide specific actionable recommendation - choose from:
- ACCEPT_AS_IS: No issues detected, analysis is reliable
- ACCEPT_WITH_CAUTION: Minor issues but overall acceptable
- REVISE_REDUCE_FABRICATION: Reduce fabricated medical details not in original text/images
- REVISE_STRENGTHEN_EVIDENCE: Base claims more closely on provided evidence and visible findings
- REVISE_REMOVE_CONTRADICTIONS: Remove statements that contradict original information or images
- REVISE_COMPREHENSIVE: Multiple issues require significant revision
- REJECT_HIGH_HALLUCINATION: Too many fabricated elements, complete regeneration needed
- REJECT_UNRELIABLE: Analysis contradicts source material extensively]

**SPECIFIC_ACTIONS:**
[List 2-3 specific actions to improve the analysis, such as:
- Remove reference to [specific fabricated detail not in text/images]
- Base imaging interpretation only on actually visible findings
- Eliminate unsupported diagnostic claims about [specific condition]
- Focus reasoning on symptoms explicitly mentioned in case and visible in images]

**SEVERITY: [LOW/MEDIUM/HIGH]**
(Severity of detected hallucinations if any)
"""
    
    if image_contents and len(image_contents) > 0:
        message_content = [{"type": "text", "text": hallucination_prompt}]
        for image in image_contents:
            message_content.append(image)
        messages = [HumanMessage(content=message_content)]
        result = llm.invoke(messages)
    else:
        result = llm.invoke(hallucination_prompt)
    
    result_content = result.content
    
    hallucination_detected = "NO"
    if "HALLUCINATION DETECTED:" in result_content:
        detection_line = result_content.split("HALLUCINATION DETECTED:")[1].split("\n")[0]
        if "YES" in detection_line.upper():
            hallucination_detected = "YES"
    
    
    
    return {
        "hallucination_detected": hallucination_detected,
        "fabricated_information": fabricated_info,
        "unsupported_claims": unsupported_claims,
        "contradictions": contradictions,
        "confidence_score": confidence,
        "recommendation": recommendation,
        "specific_actions": specific_actions,
        "severity": severity,
        "analysis_type": analysis_type,
        "full_response": result_content,
        "total_issues": len(fabricated_info) + len(unsupported_claims) + len(contradictions),
        "multimodal_check": len(image_contents) > 0 if image_contents else False
    }

def run_analysis_with_hallucination_check(analysis_func, state, config, analysis_name, max_retries=2):
    
    original_clinical_text = getattr(state, 'clinical_text', '')
    if not original_clinical_text and hasattr(state, 'patient_info'):
        original_clinical_text = state.patient_info.clinical_text
    
    image_contents = getattr(state, 'image_contents', [])
    if not image_contents:
        image_contents = []
    
    hallucination_logs = []
    improvement_instructions = []  
    
    for attempt in range(max_retries + 1):
        print(f"  {analysis_name} - Attempt {attempt + 1}/{max_retries + 1}")
        
        modified_state = state
        if attempt > 0 and improvement_instructions:
            guidance = "\n".join([
                "CRITICAL: Avoid the following issues from previous attempts:",
                *[f"- {instruction}" for instruction in improvement_instructions[-5:]],  
                "Base all findings strictly on provided clinical text and visible image contents only."
            ])
            
            print(f"  {analysis_name} - Applying {len(improvement_instructions)} improvement instructions")
            
            state_dict = state.model_dump() if hasattr(state, 'model_dump') else dict(state)
            state_dict['improvement_guidance'] = guidance  
            modified_state = CoordinatorState(**state_dict)
        
        analysis_result = analysis_func(modified_state, config)
        
        analysis_text = json.dumps(analysis_result, indent=2)
        
        print(f"  {analysis_name} - Running hallucination detection...")
        hallucination_result = hallucination_detector(
            config, analysis_text, original_clinical_text, analysis_name, image_contents
        )
        
        log_entry = {
            "analysis_name": analysis_name,
            "attempt": attempt + 1,
            "hallucination_detected": hallucination_result["hallucination_detected"],
            "recommendation": hallucination_result["recommendation"],
            "total_issues": hallucination_result["total_issues"],
            "severity": hallucination_result["severity"],
            "improvement_guidance_applied": len(improvement_instructions) > 0,
            "improvement_instructions": improvement_instructions,
            "previous_warnings_count": len(improvement_instructions)
        }
        hallucination_logs.append(log_entry)
        
        if hallucination_result["hallucination_detected"] == "NO":
            print(f"  {analysis_name} - No hallucination detected")
            if len(improvement_instructions) > 0:
                print(f"  {analysis_name} - SUCCESS: Improvement guidance resolved {len(improvement_instructions)} previous issues")
            break
        elif hallucination_result["recommendation"] in ["ACCEPT_AS_IS", "ACCEPT_WITH_CAUTION"]:
            print(f"  {analysis_name} - {hallucination_result['recommendation'].replace('_', ' ').lower()}, proceeding")
            break
        elif attempt < max_retries:
            print(f"  {analysis_name} - Issues detected ({hallucination_result['severity']} severity), retrying...")
            
            specific_actions = hallucination_result.get("specific_actions", [])
            fabricated_info = hallucination_result.get("fabricated_information", [])
            unsupported_claims = hallucination_result.get("unsupported_claims", [])
            contradictions = hallucination_result.get("contradictions", [])
            
            for action in specific_actions[:3]:  
                improvement_instructions.append(f"Action: {action}")
            for fab in fabricated_info[:2]:
                improvement_instructions.append(f"Do not fabricate: {fab}")
            for claim in unsupported_claims[:2]:
                improvement_instructions.append(f"Unsupported claim to avoid: {claim}")
            for contradiction in contradictions[:1]:
                improvement_instructions.append(f"Contradiction to resolve: {contradiction}")
            
            print(f"  {analysis_name} - Added {len(specific_actions) + len(fabricated_info) + len(unsupported_claims) + len(contradictions)} improvement instructions")
            
        else:
            print(f"  {analysis_name} - Max retries reached, using final result with warnings")
            break
    
    analysis_result["hallucination_detection_log"] = hallucination_logs
    analysis_result["final_hallucination_status"] = hallucination_result
    analysis_result["accumulated_improvement_instructions"] = improvement_instructions
    analysis_result["improvement_success_rate"] = (
        sum(1 for log in hallucination_logs if log["hallucination_detected"] == "NO") / len(hallucination_logs)
        if hallucination_logs else 0
    )
    
    return analysis_result

def generate_k_independent_cot_paths(state: CoordinatorState, config: RunnableConfig) -> CoordinatorState:
    """Generate k independent CoT reasoning paths with diversity"""
    configurable = Configuration.from_runnable_config(config)
    k = getattr(configurable, 'cot_rounds', 3)
    
    llm = ChatOpenAI(
        api_key=API_KEY,
        model=configurable.diagnoser_model,
        # temperature=0.8,  # Higher temperature for diversity
        max_retries=2
    )
    
    # Get clinical case and options
    original_case = ""
    if hasattr(state, "clinical_text") and state.clinical_text:
        original_case = state.clinical_text
    elif hasattr(state, "patient_info") and state.patient_info:
        original_case = state.patient_info.clinical_text
    
    diagnostic_options_text = ""
    if hasattr(state, "diagnostic_options") and state.diagnostic_options:
        diagnostic_options_text = "\n".join([f"Option {k}: {v}" for k, v in state.diagnostic_options.items()])
    
    # Handle images
    image_contents = []
    if hasattr(state, "image_contents") and state.image_contents:
        image_contents = state.image_contents
        print(f"Found {len(image_contents)} images for k-path CoT analysis")
    
    print(f"Generating {k} independent CoT reasoning paths...")
    
    # Diversity strategies for different paths
    diversity_strategies = [
        {
            "instruction": "Focus on the most obvious and direct diagnostic indicators. Consider common diagnoses first.",
            "emphasis": "common_findings"
        },
        {
            "instruction": "Consider less common but possible differential diagnoses. Look for subtle or atypical presentations.", 
            "emphasis": "rare_conditions"
        },
        {
            "instruction": "Pay special attention to imaging findings and their clinical correlation. Consider structural abnormalities.",
            "emphasis": "imaging_focused"
        }
    ]
    
    # Generate k independent paths
    cot_paths = []
    for path_id in range(1, k + 1):
        print(f"Generating CoT path {path_id}/{k}")
        
        # Use cycling diversity strategy
        strategy = diversity_strategies[(path_id - 1) % len(diversity_strategies)]
        diversity_instruction = strategy["instruction"]
        emphasis = strategy["emphasis"]
        
        path_prompt = f"""
You are a medical expert conducting independent diagnostic reasoning. This is analysis path {path_id} of {k}.

ANALYSIS FOCUS: {diversity_instruction}

## Clinical Case
{original_case}

## Answer Choices
{diagnostic_options_text}

Please conduct thorough Chain-of-Thought reasoning:
1. Identify key symptoms and clinical findings
2. Analyze any available imaging information
3. Consider differential diagnoses based on your analysis focus
4. Apply medical reasoning to select the most likely diagnosis
5. Justify your selection with evidence from the case

Format your response as:
CHAIN OF THOUGHT:
[Your detailed step-by-step reasoning with focus on {emphasis}]

SELECTED OPTION: [Write only the letter: A, B, C, D, or E]

CONFIDENCE LEVEL: [High/Medium/Low]
"""
        
        # Generate response with or without images
        if not image_contents:
            result = llm.invoke(path_prompt)
            result_content = result.content
        else:
            message_content = [{"type": "text", "text": path_prompt}]
            for image in image_contents:
                message_content.append(image)
            
            messages = [HumanMessage(content=message_content)]
            result = llm.invoke(messages)
            result_content = result.content
        
        # Parse CoT results
        cot_reasoning = ""
        cot_selected_option = ""
        confidence_level = "Medium"
        
        if "CHAIN OF THOUGHT:" in result_content:
            reasoning_section = result_content.split("CHAIN OF THOUGHT:")[1]
            if "SELECTED OPTION:" in reasoning_section:
                cot_reasoning = reasoning_section.split("SELECTED OPTION:")[0].strip()
                remaining = reasoning_section.split("SELECTED OPTION:")[1]
                
                # Extract option
                option_match = re.search(r'^([A-E])', remaining.strip())
                if option_match:
                    cot_selected_option = option_match.group(1)
                
                # Extract confidence if present
                if "CONFIDENCE LEVEL:" in remaining:
                    conf_section = remaining.split("CONFIDENCE LEVEL:")[1].strip()
                    if any(level in conf_section.upper() for level in ["HIGH", "MEDIUM", "LOW"]):
                        for level in ["HIGH", "MEDIUM", "LOW"]:
                            if level in conf_section.upper():
                                confidence_level = level.title()
                                break
            else:
                cot_reasoning = reasoning_section.strip()
        else:
            cot_reasoning = result_content
        
        # Enhanced option extraction fallback
        if not cot_selected_option:
            patterns = [
                r'SELECTED OPTION:\s*([A-E])',
                r'(?:answer|choice|option)\s+is\s+([A-E])',
                r'(?:select|choose)\s+(?:option\s+)?([A-E])',
                r'^([A-E])[\.\:\s]',
                r'\b([A-E])\s*(?:is\s+(?:the\s+)?(?:correct|right|best|most\s+likely))',
            ]
            
            for pattern in patterns:
                matches = re.findall(pattern, result_content, re.IGNORECASE | re.MULTILINE)
                if matches:
                    cot_selected_option = matches[-1].upper()
                    break
        
        # Store path result
        path_result = {
            'path_id': path_id,
            'reasoning': cot_reasoning,
            'selected_option': cot_selected_option,
            'full_response': result_content,
            'diversity_strategy': strategy,
            'confidence_level': confidence_level,
            'emphasis': emphasis
        }
        cot_paths.append(path_result)
        print(f"Path {path_id} completed: Option {cot_selected_option} (Confidence: {confidence_level})")
    
    # Update state
    state_dict = state.model_dump()
    state_dict["cot_paths"] = cot_paths
    state_dict["total_paths"] = k
    
    print(f"Generated {k} independent CoT paths with options: {[p['selected_option'] for p in cot_paths]}")
    
    return CoordinatorState(**state_dict)


async def process_all_paths_parallel(state: CoordinatorState, config: RunnableConfig) -> CoordinatorState:
    """Process all k paths through MedMMVAgent pipeline in parallel"""
    
    cot_paths = getattr(state, 'cot_paths', [])
    if not cot_paths:
        print("Error: No CoT paths found for processing")
        return state
    
    print(f"Processing {len(cot_paths)} paths through MedMMVAgent pipeline with hallucination detection...")
    
    # Run all paths in parallel
    tasks = []
    for path_data in cot_paths:
        task = run_full_medmmv_pipeline_for_path(state, config, path_data)
        tasks.append(task)
    
    # Wait for all paths to complete
    path_results = await asyncio.gather(*tasks, return_exceptions=True)
    
    # Handle any exceptions
    valid_results = []
    for i, result in enumerate(path_results):
        if isinstance(result, Exception):
            print(f"Path {i+1} failed with exception: {result}")
            failure_result = {
                "path_id": i+1,
                "quality_score": 0,
                "reliability": "FAILED",
                "processing_completed": False,
                "error": str(result)
            }
            valid_results.append(failure_result)
        else:
            valid_results.append(result)
    
    print(f"Completed processing {len(valid_results)} paths with hallucination detection")
    
    # Update state with results
    state_dict = state.model_dump()
    state_dict["path_results"] = valid_results
    
    return CoordinatorState(**state_dict)


def select_best_path_by_quality(state: CoordinatorState, config: RunnableConfig) -> CoordinatorState:
    """Select the best path based on comprehensive quality metrics including enhanced fact checking and hallucination detection"""
    
    path_results = getattr(state, 'path_results', [])
    if not path_results:
        print("Error: No path results found for selection")
        return state
    
    print(f"Evaluating {len(path_results)} paths for best selection with enhanced quality metrics...")
    
    # Sort paths by multiple criteria including fact checking and hallucination detection
    TO FILL
    
    return CoordinatorState(**state_dict)

def generate_final_k_path_result(state: CoordinatorState, config: RunnableConfig) -> Dict[str, Any]:
    """Generate final result with correctness evaluation only at the very end"""
    
    best_path = getattr(state, 'best_path', {})
    evaluated_paths = getattr(state, 'evaluated_paths', [])
    correct_answer = getattr(state, 'correct_answer', '')
    
    if not best_path:
        return {"messages": [AIMessage(content="Error: No best path selected")]}
    
    # Extract key metrics
    selected_path_id = best_path.get('path_id', 1)
    final_option = best_path.get('final_predicted_option', best_path.get('initial_cot_option', ''))
    quality_score = best_path.get('quality_score', 0)
    reliability = best_path.get('reliability', 'UNKNOWN')
    is_correct = best_path.get('is_correct', False)
    
    # Extract comprehensive metrics
    comprehensive_fact_check = best_path.get('comprehensive_fact_check', {})
    total_checks = comprehensive_fact_check.get('total_checks', 0)
    passed_checks = comprehensive_fact_check.get('passed_checks', 0)
    failed_checks = comprehensive_fact_check.get('failed_checks', 0)
    partial_checks = comprehensive_fact_check.get('partial_checks', 0)
    fact_check_score = comprehensive_fact_check.get('overall_fact_check_score', 0)
    
    hallucination_summary = best_path.get('hallucination_detection_summary', {})
    total_hallucination_issues = hallucination_summary.get('total_hallucination_issues', 0)
    high_severity_hallucinations = hallucination_summary.get('high_severity_count', 0)
    total_analysis_attempts = hallucination_summary.get('total_analysis_attempts', 0)
    
    # Generate path comparison table with correctness NOW shown
    path_comparison = []
    for i, p in enumerate(evaluated_paths):
        path_id = p.get('path_id', i+1)
        option = p.get('final_predicted_option', p.get('initial_cot_option', 'N/A'))
        quality = p.get('quality_score', 0)
        reliability_short = p.get('reliability', 'Unknown')
        correct_status = '✓ Correct' if p.get('is_correct', False) else '✗ Incorrect'
        
        path_fact_check = p.get('comprehensive_fact_check', {})
        path_passed = path_fact_check.get('passed_checks', 0)
        path_total = path_fact_check.get('total_checks', 0)
        fact_check_ratio = f"{path_passed}/{path_total}" if path_total > 0 else "0/0"
        
        path_hallucination = p.get('hallucination_detection_summary', {})
        hallucination_issues = path_hallucination.get('total_hallucination_issues', 0)
        
        path_comparison.append(
            f"Path {path_id}: Option {option} | Quality: {quality}/100 | "
            f"Fact Checks: {fact_check_ratio} | Hallucination Issues: {hallucination_issues} | "
            f"Reliability: {reliability_short} | {correct_status}"
        )
    
    path_comparison_text = "\n".join(path_comparison)
    
    # Get detailed reasoning from best path
    final_reasoning = best_path.get('final_diagnosis', '') or best_path.get('initial_reasoning', '')
    
    # Get strategy info
    best_path_strategy = best_path.get('diversity_strategy', {})
    best_path_initial_option = best_path.get('initial_cot_option', 'N/A')
    best_path_emphasis = best_path_strategy.get('emphasis', 'Standard analysis')
    
    # Generate detailed summaries
    detailed_checks = comprehensive_fact_check.get('detailed_checks', {})
    fact_check_details = []
    
    for check_type, check_result in detailed_checks.items():
        if check_result:
            result_status = check_result.get('result', 'UNKNOWN')
            consistency_issues = len(check_result.get('consistency_issues', []))
            accuracy_concerns = len(check_result.get('accuracy_concerns', []))
            missed_info = len(check_result.get('missed_information', []))
            
            status_icon = {'PASS': '✅', 'PARTIAL': '⚠️', 'FAIL': '❌'}.get(result_status, '❓')
            
            fact_check_details.append(
                f"  **{check_type.replace('_', ' ').title()}**: {status_icon} {result_status}"
                + (f" (Issues: {consistency_issues + accuracy_concerns + missed_info})" 
                   if consistency_issues + accuracy_concerns + missed_info > 0 else "")
            )
    
    fact_check_summary = "\n".join(fact_check_details) if fact_check_details else "  No detailed fact check results available"
    
    # Generate hallucination detection summary
    hallucination_logs = hallucination_summary.get('detailed_logs', {})
    hallucination_details = []
    
    for analysis_type, logs in hallucination_logs.items():
        if logs:
            total_attempts = len(logs)
            total_issues = sum(log.get('total_issues', 0) for log in logs)
            high_severity = sum(1 for log in logs if log.get('severity') == 'HIGH')
            
            status_icon = "❌" if total_issues > 0 else "✅"
            hallucination_details.append(
                f"  **{analysis_type.replace('_', ' ').title()}**: {status_icon} "
                f"{total_attempts} attempts, {total_issues} issues"
                + (f" ({high_severity} high severity)" if high_severity > 0 else "")
            )
    
    hallucination_summary_text = "\n".join(hallucination_details) if hallucination_details else "  No hallucination detection logs available"
    
    final_message = f"""# Blind K-Path Multi-Modal Medical Diagnosis Analysis

## Executive Summary
Generated {len(evaluated_paths)} independent diagnostic paths using diverse CoT reasoning strategies. Each path was processed through the complete MedMMVAgent pipeline with comprehensive fact checking and hallucination detection **WITHOUT access to the correct answer during processing**.

**🔥 KEY METHODOLOGY**: The correct answer ({correct_answer}) was **ONLY** revealed and used in the final evaluation stage for performance assessment, ensuring unbiased analysis throughout the entire pipeline.

**Selected Best Path: Path {selected_path_id}**
- **Final Answer**: {final_option}
- **Ground Truth**: {correct_answer}
- **Correctness**: {'✅ CORRECT' if is_correct else '❌ INCORRECT'}
- **Quality Score**: {quality_score}/100 (based on analysis quality, not correctness)
- **Reliability**: {reliability}
- **Fact Check Score**: {fact_check_score:.1f}% ({passed_checks}/{total_checks} passed)
- **Hallucination Issues**: {total_hallucination_issues} detected ({high_severity_hallucinations} high severity)

## Blind Processing Verification
✅ **No correct answer used during CoT generation**
✅ **No correct answer used during expert analysis pipeline**  
✅ **No correct answer used during quality assessment**
✅ **No correct answer used during path selection**
⭐ **Correct answer revealed ONLY for final performance evaluation**

## Path Comparison Results (Final Evaluation)
```
{path_comparison_text}
```

## Quality Assurance Metrics (Blind Processing)
- **Multi-Modal Fact Checking**: ✅ Applied to all {len(evaluated_paths)} paths
- **Hallucination Detection**: ✅ Real-time detection with retry mechanism
- **Quality-Based Selection**: ✅ Based purely on analysis quality, not correctness
- **Pipeline Completeness**: {sum(1 for p in evaluated_paths if p.get('processing_completed', False))}/{len(evaluated_paths)} paths completed successfully

### Fact Checking Summary (Selected Path)
- **Total Checks Performed**: {total_checks}
- **Passed**: {passed_checks} ✅  **Partial**: {partial_checks} ⚠️  **Failed**: {failed_checks} ❌
- **Overall Fact Check Score**: {fact_check_score:.1f}%

### Detailed Fact Check Results
{fact_check_summary}

### Hallucination Detection Summary (Selected Path)
- **Total Analysis Attempts**: {total_analysis_attempts}
- **Total Issues Detected**: {total_hallucination_issues}
- **High Severity Issues**: {high_severity_hallucinations}

### Detailed Hallucination Detection Results
{hallucination_summary_text}

## Selected Path Analysis Details
### Initial CoT Reasoning (Blind)
Option Selected: {best_path_initial_option}
Strategy: {best_path_emphasis}

### MedMMVAgent Pipeline Results (Blind Processing)
- **Domain Expert Analysis**: {'✅ Completed' if best_path.get('pipeline_results', {}).get('domain_expert_state') else '❌ Failed'}
- **Radiologist Analysis**: {'✅ Completed' if best_path.get('pipeline_results', {}).get('radiologist_state') else '❌ Failed'}
- **Coordinator Decision**: {'✅ Completed' if best_path.get('pipeline_results', {}).get('coordinator_observations') else '❌ Failed'}
- **Web Research**: {'✅ Completed' if best_path.get('pipeline_results', {}).get('web_search_findings') else '❌ Failed'}
- **Final Diagnosis**: {'✅ Completed' if best_path.get('pipeline_results', {}).get('diagnoser_state') else '❌ Failed'}

### Final Diagnostic Reasoning
{final_reasoning}

## Methodology Validation
This analysis demonstrates **true blind processing**:

1. **K-Path Generation**: Generated {len(evaluated_paths)} diverse reasoning paths without ground truth
2. **Parallel Processing**: All paths processed simultaneously through MedMMVAgent without answer key
3. **Quality-Based Selection**: Best path selected based on analysis quality, fact-checking, and reliability metrics
4. **Final Evaluation**: Correct answer ({correct_answer}) revealed only at the end for performance assessment

## Quality Control Protocol
Each path underwent rigorous **blind validation**:

1. **Domain Expert Analysis**: Hallucination detection + fact verification (no answer key)
2. **Radiologist Analysis**: Imaging findings validation (no answer key)
3. **Coordinator Decision**: Observation consistency check (no answer key)
4. **Final Diagnosis**: Diagnostic reasoning validation (no answer key)
5. **Integrated Analysis**: Cross-stage consistency verification (no answer key)

**Final Result**: Path {selected_path_id} selected based on quality metrics achieved **{final_option}** vs ground truth **{correct_answer}** ({'MATCH' if is_correct else 'MISMATCH'})

---
*This diagnosis represents unbiased medical reasoning from {len(evaluated_paths)} independent analysis paths, validated through comprehensive fact-checking and real-time hallucination detection, with ground truth revealed only for final performance evaluation.*
"""
    
    # Enhanced metrics including blind processing verification
    enhanced_quality_metrics = {
        "methodology": "BLIND_PROCESSING",
        "correct_answer_revealed_only_at_end": True,
        "selected_path_id": selected_path_id,
        "predicted_answer": final_option,
        "ground_truth": correct_answer,
        "final_correctness": is_correct,
        "quality_score": quality_score,
        "reliability": reliability,
        "total_paths": len(evaluated_paths),
        "completed_paths": sum(1 for p in evaluated_paths if p.get('processing_completed', False)),
        
        "comprehensive_fact_check": comprehensive_fact_check,
        "hallucination_detection_summary": hallucination_summary,
        
        "blind_processing_verification": {
            "cot_generation_blind": True,
            "expert_analysis_blind": True,
            "quality_assessment_blind": True,
            "path_selection_blind": True,
            "correct_answer_usage": "FINAL_EVALUATION_ONLY"
        },
        
        "path_details": evaluated_paths
    }
    
    return {
        "messages": [AIMessage(content=final_message)],
        "final_diagnosis": final_message,
        "selected_option": final_option,
        "quality_metrics": enhanced_quality_metrics,
        "blind_processing_verified": True
    }

# Build the complete K-Path graph
builder = StateGraph(CoordinatorState, config_schema=Configuration)

# Add all nodes with conditional logic
builder.add_node("process_patient_info", process_patient_info)
builder.add_node("generate_k_independent_cot_paths", generate_k_independent_cot_paths)
builder.add_node("process_all_paths_parallel", process_all_paths_parallel)  # Uses conditional radiology internally
builder.add_node("select_best_path_by_quality", select_best_path_by_quality) 
builder.add_node("generate_final_k_path_result", generate_final_k_path_result)

# Linear flow remains the same
builder.add_edge(START, "process_patient_info")
builder.add_edge("process_patient_info", "generate_k_independent_cot_paths")
builder.add_edge("generate_k_independent_cot_paths", "process_all_paths_parallel")
builder.add_edge("process_all_paths_parallel", "select_best_path_by_quality")
builder.add_edge("select_best_path_by_quality", "generate_final_k_path_result") 
builder.add_edge("generate_final_k_path_result", END)

graph = builder.compile(name="enhanced-k-path-medical-diagnosis-system")