"""Synthesis agent for combining findings into coherent medical reports with clinical reasoning"""

from typing import Dict, List, Optional, Any, Tuple
from pydantic import BaseModel, Field
from langchain_core.prompts import ChatPromptTemplate
from langchain_core.language_models import BaseLanguageModel

from .base_abcde import ABCDEAgent
from ..orchestrator.state import MultiAgentState, AgentAnalysis, Finding
from ..orchestrator.semantic_query_analyzer import QueryIntent


class DifferentialDiagnosis(BaseModel):
    """A single differential diagnosis with supporting evidence"""
    diagnosis: str = Field(description="The diagnosis name")
    probability: float = Field(description="Estimated probability (0-1)")
    supporting_findings: List[str] = Field(description="Findings that support this diagnosis")
    against_findings: List[str] = Field(description="Findings against this diagnosis")
    missing_findings: List[str] = Field(description="Expected findings that are absent")
    clinical_correlation: str = Field(description="How clinical context affects probability")
    next_steps: List[str] = Field(description="Recommended next steps if this is the diagnosis")


class ClinicalReasoning(BaseModel):
    """Complete clinical reasoning output"""
    primary_diagnosis: DifferentialDiagnosis = Field(description="Most likely diagnosis")
    differential_diagnoses: List[DifferentialDiagnosis] = Field(description="Alternative diagnoses in order of likelihood")
    pattern_matches: List[str] = Field(description="Disease patterns that match the findings")
    conflicting_findings: List[str] = Field(description="Findings that conflict with each other")
    critical_findings: List[str] = Field(description="Findings requiring immediate attention")
    uncertainty_factors: List[str] = Field(description="Factors contributing to diagnostic uncertainty")


class SynthesisStrategy(BaseModel):
    """Strategy for synthesizing results with clinical reasoning"""
    focus_agents: List[str] = Field(description="Agents to prioritize in synthesis")
    key_metrics: List[str] = Field(description="Key measurements to highlight")
    synthesis_approach: str = Field(description="How to structure the answer")
    pattern_recognition_needed: bool = Field(description="Whether to perform pattern matching")
    differential_needed: bool = Field(description="Whether to generate differential diagnosis")
    
    
class EnhancedSynthesisResult(BaseModel):
    """Enhanced result from synthesis with clinical reasoning"""
    answer: str = Field(description="Direct answer to the user's query")
    confidence: float = Field(description="Overall confidence in the answer (0-1)")
    clinical_reasoning: Optional[ClinicalReasoning] = Field(description="Detailed clinical reasoning")
    supporting_evidence: List[str] = Field(description="Key evidence supporting the answer")
    caveats: List[str] = Field(description="Important limitations or caveats")
    requires_review: bool = Field(description="Whether clinical review is recommended")
    recommended_actions: List[str] = Field(description="Recommended clinical actions")
    full_report: Optional[str] = Field(description="Comprehensive medical report if requested")


class SynthesisReportAgent(ABCDEAgent):
    """Prompt-driven synthesis agent with clinical pattern recognition and differential diagnosis"""
    
    def __init__(self, llm: BaseLanguageModel):
        super().__init__(
            agent_name="synthesis",
            llm=llm,
            tools=[],
            mode="plan_execute",
            vcot_policy="never"
        )
        
        # Create specialized chains - all prompt-driven
        self.strategy_planner = self._create_strategy_planner()
        self.clinical_reasoner = self._create_clinical_reasoner()
        self.answer_generator = self._create_answer_generator()
        self.report_generator = self._create_report_generator()
    
    def _create_strategy_planner(self):
        """Create strategy planner for determining synthesis approach"""
        prompt = ChatPromptTemplate.from_messages([
            ("system", """You are planning how to synthesize medical findings from multiple specialist agents.

Based on the query and available findings, determine:
1. Which agents' findings to prioritize
2. Key measurements to highlight
3. Whether pattern recognition is needed
4. Whether differential diagnosis is needed

Consider:
- Simple queries (e.g., "Is there cardiomegaly?") may not need full differential
- Complex queries or multiple findings suggest pattern recognition
- Uncertain findings require differential diagnosis
- Critical findings need immediate attention"""),
            ("human", """Query: {query}
Query intent: {query_intent}
Available agents: {available_agents}
Finding count: {finding_count}
Clinical context available: {has_clinical_context}

Determine the synthesis strategy.""")
        ])
        
        return prompt | self.llm.with_structured_output(SynthesisStrategy)
    
    def _create_clinical_reasoner(self):
        """Create comprehensive clinical reasoning chain"""
        prompt = ChatPromptTemplate.from_messages([
            ("system", """You are an expert radiologist performing comprehensive clinical reasoning on chest X-ray findings.

Your task is to:
1. Analyze finding patterns and recognize disease presentations
2. Generate differential diagnosis with probabilities
3. Consider clinical context impact
4. Identify conflicting findings and uncertainty factors
5. Flag critical findings requiring immediate attention

Use your medical knowledge to:
- Match findings to known disease patterns (pneumonia, CHF, PE, pneumothorax, etc.)
- Consider alternative explanations for findings
- Evaluate how clinical context (age, symptoms, labs) affects diagnosis probability
- Assess diagnostic confidence and uncertainty

Be thorough and evidence-based in your reasoning."""),
            ("human", """CHEST X-RAY ANALYSIS REQUEST

Query: {query}

FINDINGS FROM SPECIALIST AGENTS:
{formatted_findings}

CLINICAL CONTEXT:
{clinical_context}

ADDITIONAL MEASUREMENTS:
{measurements}

IMPORTANT: If the findings include temporal comparisons (CURRENT vs PRIOR), focus your reasoning on:
- Changes over time (improved, worsened, stable, new, resolved)
- Clinical significance of any changes
- Progression or resolution of disease

Please provide comprehensive clinical reasoning including:
1. Pattern recognition: What disease patterns do these findings suggest?
2. Differential diagnosis: List possible diagnoses with probabilities
3. Supporting evidence: What supports each diagnosis?
4. Conflicting findings: Any contradictory evidence?
5. Critical findings: Any emergencies requiring immediate attention?
6. Uncertainty factors: What contributes to diagnostic uncertainty?
7. For comparison cases: What do the temporal changes indicate?

Format your response as structured clinical reasoning.""")
        ])
        
        return prompt | self.llm.with_structured_output(ClinicalReasoning)
    
    def _create_answer_generator(self):
        """Create answer generator with clinical reasoning integration"""
        prompt = ChatPromptTemplate.from_messages([
            ("system", """You are providing a comprehensive answer to a chest X-ray query.

Your response should:
1. Directly answer the specific query
2. Include key clinical reasoning points
3. Mention differential diagnosis if relevant
4. Provide confidence level with explanation
5. Suggest recommended actions
6. Be clear about certainty vs uncertainty

Tailor your answer to the query type:
- Simple diagnostic: Clear yes/no with confidence
- Measurement: Specific values with interpretation
- Comprehensive: Systematic review with reasoning
- Comparison: Changes from prior study - IMPORTANT: When findings show CURRENT vs PRIOR comparisons, explicitly state:
  * What has changed (improved/worsened/stable/new/resolved)
  * The clinical significance of changes
  * Specific measurements from both timepoints
  * Recommendations based on the progression"""),
            ("human", """Query: {query}
Query Intent: {query_intent}

FINDINGS SUMMARY:
{findings_summary}

CLINICAL REASONING:
{clinical_reasoning}

MEASUREMENTS:
{key_measurements}

CLINICAL CONTEXT:
{clinical_context}

Generate a comprehensive, clinically-reasoned answer to the query.""")
        ])
        
        return prompt | self.llm.with_structured_output(EnhancedSynthesisResult)
    
    def _create_report_generator(self):
        """Create comprehensive medical report generator"""
        prompt = ChatPromptTemplate.from_messages([
            ("system", """You are a radiologist creating a comprehensive chest X-ray report.

Structure the report as:
1. TECHNIQUE: Examination description
2. COMPARISON: Prior studies if available
3. FINDINGS: Systematic ABCDE review with confidence levels
4. CLINICAL REASONING: Pattern recognition and differential diagnosis
5. IMPRESSION: Primary diagnosis and key findings
6. RECOMMENDATIONS: Evidence-based next steps

Use standard radiology language while incorporating clinical reasoning.
Be specific about diagnostic uncertainty and confidence levels."""),
            ("human", """REPORT GENERATION REQUEST

Original Query: {query}
View Position: {view_position}
Prior Study: {has_prior}

FINDINGS BY AGENT:
{all_findings}

CLINICAL REASONING:
{clinical_reasoning}

MEASUREMENTS:
{measurements}

CLINICAL CONTEXT:
{clinical_context}

Generate a comprehensive radiology report with integrated clinical reasoning.""")
        ])
        
        return prompt | self.llm
    
    def analyze(self, state: MultiAgentState) -> MultiAgentState:
        """Perform prompt-driven synthesis with clinical reasoning"""
        print(f"\n{'='*60}")
        
        # Check if this is a comparison analysis
        is_comparison = state.get('need_comparison', False) and state.get('prior_image_path')
        
        if is_comparison:
            print(f"SYNTHESIS AGENT: Performing temporal comparison analysis...")
        else:
            print(f"SYNTHESIS AGENT: Performing clinical reasoning...")
        
        # Extract context
        query_analysis = state.get('query_analysis', {})
        clinical_context = state.get('clinical_context', {})
        
        # Collect and analyze findings
        agent_results = self._collect_agent_results(state)
        all_findings = self._extract_all_findings(agent_results)
        
        # Print detailed findings information
        print(f"\nCollected {len(all_findings)} total findings from {len(agent_results)} agents")
        
        if all_findings:
            # Check if this is a comparison
            has_temporal = any(f.get('temporal_context') for f in all_findings)
            
            if has_temporal:
                print("\n📋 TEMPORAL COMPARISON FINDINGS:")
            else:
                print("\n📋 DETAILED FINDINGS SUMMARY:")
            
            for i, finding in enumerate(all_findings, 1):
                source_agent = finding.get('source_agent', 'unknown')
                pathology = finding.get('pathology', 'unknown')
                confidence = finding.get('confidence', 0)
                evidence = finding.get('evidence', 'No evidence provided')
                measurements = finding.get('measurements', {})
                visual_cot = finding.get('visual_cot')
                temporal_context = finding.get('temporal_context')
                
                # Add temporal indicator
                temporal_tag = ""
                if temporal_context:
                    temporal_tag = f" [{temporal_context.upper()}]"
                
                print(f"  {i}. [{source_agent.upper()}]{temporal_tag} {pathology} (confidence: {confidence:.1%})")
                print(f"     Evidence: {evidence}")
                
                if measurements:
                    # Format measurements for display
                    meas_items = []
                    for k, v in measurements.items():
                        if k not in ['vcot_disagreement', 'tool_confidence', 'final_confidence']:
                            meas_items.append(f"{k}={v}")
                    
                    if meas_items:
                        print(f"     Measurements: {', '.join(meas_items)}")
                    
                    # Show V-CoT disagreement if present
                    if measurements.get('vcot_disagreement'):
                        print(f"     ⚠️  V-CoT DISAGREEMENT: Visual analysis contradicts tool result")
                        # Show direct visual assessment if available
                        if measurements.get('vcot_direct_assessment'):
                            print(f"     👁️  Direct Visual Assessment: {measurements['vcot_direct_assessment']}")
                    
                    # Show confidence adjustments
                    if 'tool_confidence' in measurements and 'final_confidence' in measurements:
                        tool_conf = measurements['tool_confidence']
                        final_conf = measurements['final_confidence']
                        if abs(tool_conf - final_conf) > 0.1:
                            print(f"     🔄 Confidence adjusted: {tool_conf:.1%} → {final_conf:.1%}")
                
                if visual_cot:
                    # Show V-CoT summary
                    vcot_summary = self._extract_vcot_summary(visual_cot)
                    if vcot_summary:
                        print(f"     🔍 V-CoT: {vcot_summary}")
                
                print()  # Empty line between findings
        else:
            print("  ℹ️  No findings detected by any agent")
        
        # Show agent-specific summary
        print(f"\n📊 AGENT-SPECIFIC SUMMARY:")
        for agent_name, analysis in agent_results.items():
            if not isinstance(analysis, dict):
                continue
                
            findings = analysis.get('findings', [])
            plan_executed = analysis.get('plan_executed', [])
            confidence_level = analysis.get('confidence_level', 'unknown')
            visual_cot_triggered = analysis.get('visual_cot_triggered', False)
            
            print(f"  🤖 {agent_name.upper()}: {len(findings)} findings, confidence={confidence_level}")
            if visual_cot_triggered:
                print(f"     📸 V-CoT triggered")
            if plan_executed:
                print(f"     📋 Executed {len(plan_executed)} tasks")
        
        try:
            # 1. Plan synthesis strategy
            strategy = self.strategy_planner.invoke({
                "query": state['query'],
                "query_intent": getattr(query_analysis, 'query_intent', QueryIntent.COMPREHENSIVE).value,
                "available_agents": ", ".join(agent_results.keys()),
                "finding_count": len(all_findings),
                "has_clinical_context": bool(clinical_context)
            })
            
            print(f"\n🎯 SYNTHESIS STRATEGY:")
            print(f"   Pattern recognition: {strategy.pattern_recognition_needed}")
            print(f"   Differential diagnosis: {strategy.differential_needed}")
            
            # 2. Perform clinical reasoning (if needed)
            clinical_reasoning = None
            if strategy.pattern_recognition_needed or strategy.differential_needed:
                clinical_reasoning = self._perform_clinical_reasoning(
                    state, all_findings, clinical_context
                )
                
                if clinical_reasoning and clinical_reasoning.primary_diagnosis:
                    print(f"\n🏥 CLINICAL REASONING:")
                    print(f"   Primary diagnosis: {clinical_reasoning.primary_diagnosis.diagnosis}")
                    print(f"   Probability: {clinical_reasoning.primary_diagnosis.probability:.0%}")
            
            # 3. Generate final answer
            synthesis_result = self._generate_answer(
                state, all_findings, clinical_reasoning, clinical_context
            )
            
            # 4. Generate full report if needed
            if getattr(query_analysis, 'query_intent', None) == QueryIntent.COMPREHENSIVE:
                full_report = self._generate_clinical_report(
                    state, agent_results, all_findings, clinical_reasoning, clinical_context
                )
                synthesis_result.full_report = full_report
            
            # Update state
            state["synthesis_analysis"] = AgentAnalysis(
                agent_name="synthesis",
                findings=[],
                plan_executed=[
                    {"task": "strategy_planning", "result": "completed"},
                    {"task": "clinical_reasoning", "result": "completed" if clinical_reasoning else "skipped"},
                    {"task": "answer_generation", "result": "completed"}
                ],
                react_steps=[],
                visual_cot_triggered=False,
                confidence_level=self._confidence_to_level(synthesis_result.confidence),
                needs_human_review=synthesis_result.requires_review
            )
            
            state["synthesis_result"] = synthesis_result
            state["clinical_reasoning"] = clinical_reasoning
            state["final_report"] = synthesis_result.full_report or synthesis_result.answer
            
        except Exception as e:
            print(f"Error in synthesis: {e}")
            import traceback
            traceback.print_exc()
            state["final_report"] = self._simple_synthesis(state, agent_results)
        
        return state
    
    def _collect_agent_results(self, state: MultiAgentState) -> Dict[str, AgentAnalysis]:
        """Collect results from all completed agents"""
        agent_results = {}
        
        # Check for completed_agents list first
        completed_agents = state.get('completed_agents', [])
        
        for agent_name in completed_agents:
            if agent_name != 'synthesis':  # Don't include self
                analysis_key = f"{agent_name}_analysis"
                if analysis_key in state and state[analysis_key]:
                    agent_results[agent_name] = state[analysis_key]
        
        return agent_results
    
    def _extract_all_findings(self, agent_results: Dict[str, AgentAnalysis]) -> List[Dict]:
        """Extract all findings with their source agents"""
        all_findings = []
        
        for agent_name, analysis in agent_results.items():
            if not isinstance(analysis, dict):
                # Handle AgentAnalysis objects (not just dicts)
                if hasattr(analysis, 'findings'):
                    findings = analysis.findings or []
                else:
                    continue
            else:
                findings = analysis.get('findings', [])
            
            # Check if this is comparison data
            is_comparison = analysis.get('comparison_performed', False)
            comparison_data = analysis.get('comparison_data', {})
            
            for finding in findings:
                if isinstance(finding, dict):
                    enhanced_finding = finding.copy()
                    enhanced_finding['source_agent'] = agent_name
                    
                    # Preserve comparison context if present
                    if is_comparison:
                        enhanced_finding['is_comparison'] = True
                        if 'comparison_data' in analysis:
                            enhanced_finding['comparison_context'] = comparison_data
                    
                    all_findings.append(enhanced_finding)
        
        return all_findings
    
    def _perform_clinical_reasoning(self, state: MultiAgentState, findings: List[Dict], 
                                   clinical_context: Dict) -> Optional[ClinicalReasoning]:
        """Perform comprehensive clinical reasoning using LLM"""
        formatted_findings = self._format_findings_for_reasoning(findings)
        measurements = self._extract_measurements(findings)
        
        try:
            clinical_reasoning = self.clinical_reasoner.invoke({
                "query": state['query'],
                "formatted_findings": formatted_findings,
                "clinical_context": self._format_clinical_context(clinical_context),
                "measurements": self._format_measurements(measurements)
            })
            
            return clinical_reasoning
            
        except Exception as e:
            print(f"Error in clinical reasoning: {e}")
            return None
    
    def _generate_answer(self, state: MultiAgentState, findings: List[Dict], 
                        clinical_reasoning: Optional[ClinicalReasoning],
                        clinical_context: Dict) -> EnhancedSynthesisResult:
        """Generate comprehensive answer using LLM"""
        findings_summary = self._summarize_findings(findings)
        measurements = self._extract_measurements(findings)
        
        synthesis_result = self.answer_generator.invoke({
            "query": state['query'],
            "query_intent": getattr(state.get('query_analysis', {}), 'query_intent', QueryIntent.COMPREHENSIVE).value,
            "findings_summary": findings_summary,
            "clinical_reasoning": clinical_reasoning.dict() if clinical_reasoning else "Not performed",
            "key_measurements": self._format_measurements(measurements),
            "clinical_context": self._format_clinical_context(clinical_context)
        })
        
        return synthesis_result
    
    def _generate_clinical_report(self, state: MultiAgentState, agent_results: Dict,
                                 findings: List[Dict], clinical_reasoning: Optional[ClinicalReasoning],
                                 clinical_context: Dict) -> str:
        """Generate comprehensive clinical report"""
        try:
            response = self.report_generator.invoke({
                "query": state['query'],
                "view_position": state.get('view_position', 'PA/AP'),
                "has_prior": "Yes" if state.get('prior_image_path') else "None",
                "all_findings": self._format_findings_by_agent(agent_results),
                "clinical_reasoning": clinical_reasoning.dict() if clinical_reasoning else "Not performed",
                "measurements": self._format_measurements(self._extract_measurements(findings)),
                "clinical_context": self._format_clinical_context(clinical_context)
            })
            
            return response.content if hasattr(response, 'content') else str(response)
            
        except Exception as e:
            print(f"Error generating report: {e}")
            return self._simple_synthesis(state, agent_results)
    
    def _format_findings_for_reasoning(self, findings: List[Dict]) -> str:
        """Format findings for clinical reasoning"""
        if not findings:
            return "No significant findings detected."
        
        # Check if this is comparison data
        has_temporal_context = any(f.get('temporal_context') for f in findings)
        
        if has_temporal_context:
            return self._format_temporal_findings(findings)
        
        # Regular formatting for non-comparison cases
        # Group by agent
        by_agent = {}
        for finding in findings:
            agent = finding.get('source_agent', 'unknown')
            if agent not in by_agent:
                by_agent[agent] = []
            by_agent[agent].append(finding)
        
        formatted = []
        agent_order = ['airway', 'breathing', 'cardiac', 'diaphragm', 'everything']
        
        for agent in agent_order:
            if agent in by_agent:
                formatted.append(f"\n{agent.upper()} AGENT:")
                for f in by_agent[agent]:
                    pathology = f.get('pathology', 'unknown')
                    confidence = f.get('confidence', 0)
                    evidence = f.get('evidence', '')
                    location = f.get('location')
                    measurements = f.get('measurements', {})
                    visual_cot = f.get('visual_cot')
                    
                    finding_str = f"- {pathology}: {confidence:.0%} confidence"
                    
                    if measurements:
                        # Check for V-CoT disagreement markers
                        if measurements.get('vcot_disagreement'):
                            finding_str += " [V-CoT DISAGREEMENT]"
                        
                        # Format measurements excluding internal markers
                        measurement_items = []
                        for k, v in measurements.items():
                            if k not in ['vcot_disagreement', 'tool_confidence', 'final_confidence']:
                                measurement_items.append(f"{k}={v}")
                        
                        if measurement_items:
                            finding_str += f" (measurements: {', '.join(measurement_items)})"
                        
                        # Add confidence details if available
                        if 'tool_confidence' in measurements and 'final_confidence' in measurements:
                            tool_conf = measurements['tool_confidence']
                            final_conf = measurements['final_confidence']
                            if abs(tool_conf - final_conf) > 0.1:  # Significant difference
                                finding_str += f" (tool: {tool_conf:.0%} → V-CoT adjusted: {final_conf:.0%})"
                    
                    if location:
                        finding_str += f" (location: {location})"
                    
                    if evidence:
                        finding_str += f"\n  Evidence: {evidence}"
                    
                    # Add V-CoT summary if available
                    if visual_cot:
                        # Extract key points from V-CoT for synthesis
                        vcot_summary = self._extract_vcot_summary(visual_cot)
                        if vcot_summary:
                            finding_str += f"\n  V-CoT Assessment: {vcot_summary}"
                    
                    formatted.append(finding_str)
        
        return "\n".join(formatted)
    
    def _format_temporal_findings(self, findings: List[Dict]) -> str:
        """Format findings with temporal context for comparison"""
        # Group findings by pathology and agent
        temporal_groups = {}
        
        for f in findings:
            agent = f.get('source_agent', 'unknown')
            pathology = f.get('pathology', 'unknown')
            temporal = f.get('temporal_context', 'unknown')
            
            key = (agent, pathology)
            if key not in temporal_groups:
                temporal_groups[key] = {'current': None, 'prior': None}
            
            if temporal == 'current':
                temporal_groups[key]['current'] = f
            elif temporal == 'prior':
                temporal_groups[key]['prior'] = f
        
        formatted = []
        formatted.append("\nCOMPARISON ANALYSIS:")
        formatted.append("=" * 50)
        
        agent_order = ['airway', 'breathing', 'cardiac', 'diaphragm', 'everything']
        
        for agent in agent_order:
            agent_findings = [(k, v) for k, v in temporal_groups.items() if k[0] == agent]
            
            if agent_findings:
                formatted.append(f"\n{agent.upper()} AGENT COMPARISON:")
                
                for (ag, pathology), temporal_data in agent_findings:
                    current = temporal_data['current']
                    prior = temporal_data['prior']
                    
                    formatted.append(f"\n  Finding: {pathology}")
                    
                    if current and prior:
                        # Both timepoints present - show comparison
                        curr_conf = current.get('confidence', 0)
                        prior_conf = prior.get('confidence', 0)
                        curr_meas = current.get('measurements', {})
                        prior_meas = prior.get('measurements', {})
                        
                        formatted.append(f"    CURRENT: {curr_conf:.0%} confidence")
                        if curr_meas:
                            for k, v in curr_meas.items():
                                if k not in ['vcot_disagreement', 'tool_confidence', 'final_confidence']:
                                    formatted.append(f"      - {k}: {v}")
                        
                        formatted.append(f"    PRIOR: {prior_conf:.0%} confidence")
                        if prior_meas:
                            for k, v in prior_meas.items():
                                if k not in ['vcot_disagreement', 'tool_confidence', 'final_confidence']:
                                    formatted.append(f"      - {k}: {v}")
                        
                        # Show both timepoints - let the LLM interpret the changes
                        formatted.append(f"    COMPARISON:")
                        formatted.append(f"      Prior → Current confidence: {prior_conf:.0%} → {curr_conf:.0%}")
                        
                        # Show measurement changes if available
                        if curr_meas or prior_meas:
                            # Find all unique measurement keys
                            all_keys = set(list(curr_meas.keys()) + list(prior_meas.keys()))
                            for key in sorted(all_keys):
                                if key not in ['vcot_disagreement', 'tool_confidence', 'final_confidence']:
                                    prior_val = prior_meas.get(key, 'N/A')
                                    curr_val = curr_meas.get(key, 'N/A')
                                    if prior_val != 'N/A' or curr_val != 'N/A':
                                        formatted.append(f"      {key}: {prior_val} → {curr_val}")
                    
                    elif current and not prior:
                        # New finding
                        curr_conf = current.get('confidence', 0)
                        formatted.append(f"    NEW FINDING: {curr_conf:.0%} confidence")
                        curr_meas = current.get('measurements', {})
                        if curr_meas:
                            for k, v in curr_meas.items():
                                if k not in ['vcot_disagreement', 'tool_confidence', 'final_confidence']:
                                    formatted.append(f"      - {k}: {v}")
                    
                    elif prior and not current:
                        # Resolved finding
                        prior_conf = prior.get('confidence', 0)
                        formatted.append(f"    RESOLVED: Was {prior_conf:.0%} confidence in prior")
        
        formatted.append("\n" + "=" * 50)
        return "\n".join(formatted)
    
    def _extract_vcot_summary(self, visual_cot: str) -> str:
        """Extract key points from V-CoT reasoning for synthesis"""
        if not visual_cot:
            return ""
        
        # Look for key patterns in V-CoT output
        summary_points = []
        
        # Check for tool agreement status
        if "disagrees" in visual_cot.lower():
            summary_points.append("Visual analysis contradicts tool result")
        elif "agrees" in visual_cot.lower():
            summary_points.append("Visual analysis confirms tool result")
        elif "uncertain" in visual_cot.lower():
            summary_points.append("Visual analysis shows uncertainty")
        
        # Look for alternative assessments
        if "alternative_assessment" in visual_cot.lower():
            # Try to extract the alternative assessment
            lines = visual_cot.split('\n')
            for line in lines:
                if "alternative" in line.lower():
                    summary_points.append(f"Alternative: {line.strip()}")
                    break
        
        # Look for visual quality issues
        quality_keywords = ["poor quality", "unclear", "difficult to see", "ambiguous"]
        for keyword in quality_keywords:
            if keyword in visual_cot.lower():
                summary_points.append(f"Visual quality concern: {keyword}")
                break
        
        return "; ".join(summary_points) if summary_points else "Visual verification performed"
    
    def _format_clinical_context(self, clinical_context: Dict) -> str:
        """Format clinical context for LLM"""
        if not clinical_context:
            return "No clinical context provided."
        
        formatted = []
        
        if 'age' in clinical_context:
            formatted.append(f"Age: {clinical_context['age']}")
        
        if 'symptoms' in clinical_context:
            symptoms = clinical_context['symptoms']
            if isinstance(symptoms, list):
                formatted.append(f"Symptoms: {', '.join(symptoms)}")
            else:
                formatted.append(f"Symptoms: {symptoms}")
        
        if 'history' in clinical_context:
            history = clinical_context['history']
            if isinstance(history, list):
                formatted.append(f"Medical History: {', '.join(history)}")
            else:
                formatted.append(f"Medical History: {history}")
        
        if 'labs' in clinical_context:
            labs = clinical_context['labs']
            if isinstance(labs, dict):
                lab_str = ", ".join([f"{k}: {v}" for k, v in labs.items()])
                formatted.append(f"Laboratory Results: {lab_str}")
            else:
                formatted.append(f"Laboratory Results: {labs}")
        
        if 'vitals' in clinical_context:
            vitals = clinical_context['vitals']
            if isinstance(vitals, dict):
                vital_str = ", ".join([f"{k}: {v}" for k, v in vitals.items()])
                formatted.append(f"Vital Signs: {vital_str}")
            else:
                formatted.append(f"Vital Signs: {vitals}")
        
        return "\n".join(formatted) if formatted else "No clinical context provided."
    
    def _extract_measurements(self, findings: List[Dict]) -> Dict[str, Any]:
        """Extract all measurements from findings"""
        measurements = {}
        
        for finding in findings:
            if finding.get('measurements'):
                measurements.update(finding['measurements'])
        
        return measurements
    
    def _format_measurements(self, measurements: Dict[str, Any]) -> str:
        """Format measurements for LLM"""
        if not measurements:
            return "No specific measurements available."
        
        formatted = []
        for key, value in measurements.items():
            if isinstance(value, (int, float)):
                formatted.append(f"{key}: {value:.3f}")
            else:
                formatted.append(f"{key}: {value}")
        
        return "\n".join(formatted)
    
    def _format_findings_by_agent(self, agent_results: Dict) -> str:
        """Format findings grouped by agent for report generation"""
        formatted = []
        
        agent_order = ['airway', 'breathing', 'cardiac', 'diaphragm', 'everything']
        
        for agent_name in agent_order:
            if agent_name in agent_results:
                analysis = agent_results[agent_name]
                findings = analysis.get('findings', []) if isinstance(analysis, dict) else []
                
                if findings:
                    formatted.append(f"\n{agent_name.upper()}:")
                    for finding in findings:
                        if isinstance(finding, dict):
                            pathology = finding.get('pathology', 'unknown')
                            confidence = finding.get('confidence', 0)
                            evidence = finding.get('evidence', '')
                            
                            finding_str = f"- {pathology} ({confidence:.0%} confidence)"
                            if evidence:
                                finding_str += f": {evidence}"
                            
                            formatted.append(finding_str)
                else:
                    formatted.append(f"\n{agent_name.upper()}: No significant findings")
        
        return "\n".join(formatted)
    
    def _summarize_findings(self, findings: List[Dict]) -> str:
        """Create a concise summary of findings"""
        if not findings:
            return "No significant findings detected"
        
        # Check if this is temporal comparison data
        has_temporal = any(f.get('temporal_context') for f in findings)
        
        if has_temporal:
            # For comparison, summarize by timepoint
            current_findings = [f for f in findings if f.get('temporal_context') == 'current']
            prior_findings = [f for f in findings if f.get('temporal_context') == 'prior']
            
            summary_parts = []
            if current_findings:
                pathologies = list(set(f.get('pathology', 'unknown') for f in current_findings))
                summary_parts.append(f"Current image findings: {', '.join(pathologies)}")
            
            if prior_findings:
                pathologies = list(set(f.get('pathology', 'unknown') for f in prior_findings))
                summary_parts.append(f"Prior image findings: {', '.join(pathologies)}")
            
            if not summary_parts:
                summary_parts.append("Temporal comparison data available but no specific findings")
            
            return " | ".join(summary_parts)
        else:
            # Regular summary for non-comparison cases
            # Count findings by confidence level
            high_conf = [f for f in findings if f.get('confidence', 0) > 0.7]
            med_conf = [f for f in findings if 0.4 <= f.get('confidence', 0) <= 0.7]
            low_conf = [f for f in findings if f.get('confidence', 0) < 0.4]
            
            summary_parts = []
            
            if high_conf:
                pathologies = list(set(f['pathology'] for f in high_conf))
                summary_parts.append(f"High confidence: {', '.join(pathologies)}")
            
            if med_conf:
                pathologies = list(set(f['pathology'] for f in med_conf))
                summary_parts.append(f"Moderate confidence: {', '.join(pathologies)}")
            
            if low_conf:
                summary_parts.append(f"Low confidence findings: {len(low_conf)}")
            
            return "; ".join(summary_parts)
    
    def _simple_synthesis(self, state: MultiAgentState, agent_results: Dict[str, AgentAnalysis]) -> str:
        """Simple fallback synthesis"""
        findings_count = sum(
            len(analysis.get('findings', [])) 
            for analysis in agent_results.values()
            if isinstance(analysis, dict)
        )
        
        if findings_count == 0:
            return "No significant abnormalities detected in the chest X-ray."
        else:
            return f"Analysis complete. {findings_count} findings detected. Clinical correlation recommended."
    
    def _confidence_to_level(self, confidence: float) -> str:
        """Convert numeric confidence to level"""
        if confidence >= 0.8:
            return "high"
        elif confidence >= 0.5:
            return "medium"
        else:
            return "low" 