"""Breathing specialist agent for lung and pleural analysis using ReAct mode"""

from typing import List, Dict, Any, Optional, Union
from langchain_core.language_models import BaseLanguageModel
from langchain_core.prompts import PromptTemplate, ChatPromptTemplate
from langchain.agents import AgentExecutor, create_react_agent
from langchain_core.messages import HumanMessage, ToolMessage, SystemMessage
from pydantic import BaseModel, Field
import json

from .base_abcde import ABCDEAgent
from ..orchestrator.state import MultiAgentState, AgentAnalysis, Finding
from ...tools import ChestXRayClassifierTool, ChestXRaySegmentationTool, XRayPhraseGroundingTool, XRayVQATool


class BreathingTaskParameters(BaseModel):
    """Parameters for a breathing task"""
    focus: Optional[str] = Field(default=None, description="Focus area for the task")
    phrase: Optional[str] = Field(default=None, description="Phrase to ground/localize")
    phrases: Optional[List[str]] = Field(default=None, description="Multiple phrases to ground")
    image_path: Optional[str] = Field(default=None, description="Path to the image")
    organs: Optional[List[str]] = Field(default=None, description="Specific organs to segment")
    
    class Config:
        extra = "forbid"


class BreathingSubtask(BaseModel):
    """A single subtask in the breathing analysis plan"""
    task_id: str = Field(description="Unique identifier for this subtask")
    description: str = Field(description="What this subtask accomplishes")
    tool: str = Field(description="Which tool to use: chest_xray_classifier, chest_xray_segmentation, or xray_phrase_grounding")
    parameters: BreathingTaskParameters = Field(default_factory=BreathingTaskParameters, description="Parameters for the tool")
    depends_on: List[str] = Field(default_factory=list, description="List of task_ids this task depends on")
    clinical_priority: str = Field(default="medium", description="Clinical priority: high, medium, low")
    
    class Config:
        extra = "forbid"


class BreathingPlan(BaseModel):
    """Dynamic plan for breathing analysis"""
    subtasks: List[BreathingSubtask] = Field(description="Ordered list of subtasks to execute")
    reasoning: str = Field(description="Brief explanation of why this plan was chosen")
    clinical_focus: List[str] = Field(description="Primary clinical conditions this plan addresses")
    
    class Config:
        extra = "forbid"


class FindingLocation(BaseModel):
    """Structured location information for findings"""
    side: str = Field(description="Anatomical side: left, right, bilateral, or midline")
    zone: Optional[str] = Field(default=None, description="Lung zone: upper, middle, lower, perihilar, peripheral, apical")
    lobe: Optional[str] = Field(default=None, description="Specific lobe if identifiable")
    position: Optional[str] = Field(default=None, description="Additional position description")


class FindingExtent(BaseModel):
    """Structured extent information for findings"""
    distribution: str = Field(description="Distribution pattern: focal, multifocal, lobar, diffuse")
    size: Optional[str] = Field(default=None, description="Size category: small, moderate, large")
    percentage: Optional[float] = Field(default=None, description="Percentage of affected area if measurable")
    involvement: Optional[str] = Field(default=None, description="Involvement pattern: limited, basal-predominant, diffuse")



class BreathingAgent(ABCDEAgent):
    """Specialist agent for breathing/lung analysis with ReAct mode for complex lung findings"""
    
    def __init__(
        self, 
        llm: BaseLanguageModel,
        classification_tool: ChestXRayClassifierTool,
        segmentation_tool: ChestXRaySegmentationTool,
        grounding_tool: XRayPhraseGroundingTool,  # Now required, not optional
        vqa_tool: Optional[XRayVQATool] = None,
        vcot_module: Optional[Any] = None
    ):
        # Grounding tool is now required for pathology localization
        if grounding_tool is None:
            raise ValueError("Grounding tool is required for pathology localization in BreathingAgent")
        
        # Create tools list (VQA tool is optional for exploratory questions)
        tools = [classification_tool, segmentation_tool, grounding_tool]
        if vqa_tool:
            tools.append(vqa_tool)
            
        super().__init__(
            agent_name="BreathingAgent",
            llm=llm,
            tools=tools,
            mode="function_calling",  # Function calling mode for efficient analysis
            vcot_policy="on_low_conf"
        )
        self.vcot_module = vcot_module
        self.grounding_tool = grounding_tool  # Store reference
        self.has_vqa = vqa_tool is not None
        
        # Track findings for comprehensive synthesis information
        self.anatomical_measurements = {}
        self.pathology_locations = {}
        self.confidence_scores = {}
        
        # Initialize caches for efficient tool usage
        self._segmentation_cache = {}
        self._classification_cache = {}
        self._findings_dedup = set()
        
        # Initialize temp directory for ROI cropping
        from pathlib import Path
        import tempfile
        self.temp_dir = Path(tempfile.mkdtemp(prefix="breathing_agent_"))
        self.temp_dir.mkdir(exist_ok=True)
        
        # Build tools description and subtask templates
        self._build_tools_description()
        self.subtask_templates = self._define_subtask_templates()
        
        # Create structured planner for plan-execute mode
        self.planner = self._create_planner()
        
        # ReAct mode setup is handled by base class
    
    def set_mode(self, mode: str):
        """Dynamically set the execution mode for this agent"""
        valid_modes = ["function_calling", "react", "plan_execute"]
        if mode not in valid_modes:
            print(f"Warning: Invalid mode '{mode}' for BreathingAgent. Using 'function_calling'")
            mode = "function_calling"
        
        print(f"BreathingAgent: Switching to {mode} mode")
        self.mode = mode
        
        # If switching to react mode, ensure agent executor is set up
        if mode == "react" and not hasattr(self, 'agent_executor'):
            self._setup_react_agent()
        elif mode == "plan_execute" and not hasattr(self, 'plan_execute_workflow'):
            self._setup_plan_execute_workflow()
    
    def _build_tools_description(self):
        """Build tools description string once during init"""
        tools_desc = [
            "- chest_xray_classifier: Detects respiratory pathologies (pneumothorax, effusion, consolidation, atelectasis, pneumonia, edema)",
            "- chest_xray_segmentation: Segments lung structures, provides measurements and anatomical analysis"
        ]
        if self.grounding_tool:
            tools_desc.append("- xray_phrase_grounding: Localizes specific respiratory findings in the image")
        if self.has_vqa:
            tools_desc.append("- xray_vqa: Provides detailed visual analysis and description of findings")
        
        self.tools_available_desc = "\n".join(tools_desc)
    
    def _define_subtask_templates(self) -> str:
        """Define available subtask templates for breathing analysis focusing on clinically significant conditions"""
        return """
Available Breathing Subtask Templates - Focus on Most Clinically Significant Conditions:

1. ACUTE LIFE-THREATENING CONDITIONS (HIGHEST PRIORITY):
   - detect_pneumothorax: Identify pneumothorax using classification + grounding
     * High clinical priority - can be life-threatening
     * Use grounding to localize (percentage calculation not reliable)
   
   - detect_tension_pneumothorax: Assess for tension pneumothorax signs
     * Look for mediastinal shift using segmentation
     * Measure tracheal deviation
     * Check for hemidiaphragm flattening
   
   - detect_massive_effusion: Identify large pleural effusions
     * Use grounding to localize (percentage calculation not reliable)
     * Assess for mediastinal shift
     * Check costophrenic angle blunting

2. ACUTE RESPIRATORY FAILURE CONDITIONS (HIGH PRIORITY):
   - detect_pulmonary_edema: Identify pulmonary edema patterns
     * Look for bilateral perihilar infiltrates
     * Assess for cardiomegaly (heart failure vs non-cardiogenic)
     * Check for Kerley B lines, bat wing pattern
   
   - detect_consolidation: Identify consolidation (pneumonia, infarct)
     * Use grounding to localize consolidation
     * Assess distribution pattern (lobar vs bronchopneumonia)
     * Check for air bronchograms
   
   - detect_atelectasis: Identify volume loss/collapse
     * Measure lung volume reduction
     * Check for compensatory hyperinflation
     * Assess for underlying obstruction

3. RESPIRATORY PATHOLOGY ASSESSMENT (MEDIUM PRIORITY):
   - detect_interstitial_infiltrates: Identify interstitial patterns
     * Look for reticular, nodular, or reticulonodular patterns
     * Assess distribution (upper vs lower zone predominance)
     * Check for honeycombing in advanced cases
   
   - assess_pleural_abnormalities: Comprehensive pleural assessment
     * Effusion quantification and characterization
     * Pleural thickening assessment
     * Pneumothorax evaluation
   
   - evaluate_lung_opacity: Assess lung opacities
     * Differentiate ground-glass vs consolidation
     * Assess distribution and extent
     * Check for cavitation or mass lesions

4. MEASUREMENT AND QUANTIFICATION TASKS:
   - segment_respiratory_structures: Segment lungs, pleura, airways
     * Optimized organ selection: ["Left Lung", "Right Lung", "Pleura", "Trachea"]
     * Calculate lung volumes and ratios
     * Assess symmetry and position
   
   - measure_effusion_volume: V-CoT percentage estimation using pleural space reference
     * Uses grounding to locate pleural space and effusion
     * Calculates percentage relative to pleural cavity (anatomically correct)
     * V-CoT provides visual assessment of pleural involvement
   
   - measure_pneumothorax_extent: V-CoT percentage estimation using pleural space reference
     * Uses grounding to locate pleural space and pneumothorax
     * Calculates percentage relative to pleural cavity (anatomically correct)
     * V-CoT provides visual assessment of pleural involvement

5. LOCALIZATION AND CHARACTERIZATION:
   - localize_respiratory_finding: Precise anatomical localization
     * Use grounding to find specific pathology
     * Describe location with anatomical precision
     * Assess extent and distribution
   
   - characterize_finding_attributes: Detailed finding description
     * Location: side, zone, lobe, position
     * Extent: distribution, size, percentage, involvement
     * Morphology: shape, margins, internal characteristics

6. ADVANCED ANALYSIS:
   - cross_validate_findings: Compare findings across tools
     * Validate classification with grounding
     * Confirm measurements with visual analysis
     * Resolve discrepancies
   
   - visual_reasoning_vcot: Apply V-CoT for uncertain findings
     * Use cropped regions of interest
     * Focus on specific anatomical areas
     * Enhance confidence through detailed visual analysis

CLINICAL PRIORITIZATION:
- Life-threatening: Pneumothorax, massive effusion, tension pneumothorax
- Respiratory failure: Pulmonary edema, extensive consolidation, severe atelectasis
- Infectious/inflammatory: Pneumonia, interstitial infiltrates
- Quantitative assessment: Always include measurements for objective evaluation
- Localization: Precise anatomical description for clinical correlation

TOOL OPTIMIZATION:
- Classification: Use for broad screening of respiratory pathologies
- Segmentation: Optimize organ selection based on clinical focus
- Grounding: Essential for precise localization of acute findings
- VQA: For complex pattern recognition and detailed description
- V-CoT: Triggered by low confidence grounding results (<0.6)"""
    
    def _create_planner(self):
        """Create the LLM-based planner with structured output for breathing analysis"""
        
        planner_prompt = ChatPromptTemplate.from_messages([
            ("system", """You are a pulmonary imaging specialist planning a breathing analysis workflow.
Given a query about respiratory findings, create a detailed plan using available tools.

{subtask_templates}

Tools available:
{tools_available}

CLINICAL PRIORITIES FOR BREATHING ANALYSIS:
1. Life-threatening conditions (pneumothorax, massive effusion) - HIGHEST PRIORITY
2. Acute respiratory failure (pulmonary edema, consolidation) - HIGH PRIORITY  
3. Infectious/inflammatory conditions (pneumonia, infiltrates) - HIGH PRIORITY
4. Quantitative measurements for objective assessment - ALWAYS INCLUDE
5. Precise anatomical localization - ESSENTIAL FOR CLINICAL CORRELATION

INTELLIGENT TOOL SELECTION:
- For pneumothorax queries: classify → segment lungs → ground "pneumothorax" → measure extent
- For effusion queries: classify → segment lungs + pleura → ground "pleural effusion" → quantify volume
- For consolidation/pneumonia: classify → ground "consolidation" → segment for extent → characterize location
- For comprehensive assessment: classify → segment → ground multiple findings → quantify + localize

FINDING ATTRIBUTE REQUIREMENTS:
For each finding, ensure the plan includes:
- Location: Describe anatomical position (side, zone, lobe)
- Extent: Describe distribution (focal/multifocal/diffuse) and size (small/moderate/large)
- Clinical significance: Relate to acute vs chronic conditions

V-COT TRIGGERING:
- Automatically trigger V-CoT for grounding confidence < 0.6
- Use cropped regions of interest based on grounding bounding boxes
- Focus on specific lung zones for detailed analysis

Create a plan that:
1. Addresses the specific clinical query
2. Prioritizes life-threatening conditions
3. Includes quantitative measurements
4. Provides precise anatomical localization
5. Uses efficient tool combinations
6. Considers clinical workflow and urgency

IMPORTANT: Structure findings with both location and extent attributes for clinical utility."""),
            ("human", "Query: {query}\n\nCreate a plan to analyze the respiratory findings with clinical priority and detailed anatomical characterization.")
        ])
        
        return planner_prompt | self.llm.with_structured_output(BreathingPlan)
    
    def _setup_react_agent(self):
        """Set up ReAct agent executor for breathing analysis"""
        from langchain.agents import create_react_agent, AgentExecutor
        from langchain_core.prompts import PromptTemplate
        
        # Create ReAct prompt template
        prompt = PromptTemplate.from_template(self.get_react_prompt_template())
        
        # Create ReAct agent
        agent = create_react_agent(
            llm=self.llm,
            tools=list(self.tools.values()),
            prompt=prompt
        )
        
        # Create agent executor
        self.agent_executor = AgentExecutor(
            agent=agent,
            tools=list(self.tools.values()),
            verbose=True,
            max_iterations=10,
            max_execution_time=300,  # 5 minutes timeout
            handle_parsing_errors=True
        )
    
    def _setup_plan_execute_workflow(self):
        """Set up plan-execute workflow for complex breathing analysis"""
        from langgraph.graph import StateGraph, END
        from langchain_core.messages import HumanMessage
        from langchain_core.prompts import PromptTemplate
        
        # Create plan-execute workflow
        workflow = StateGraph(dict)
        
        # Add nodes
        workflow.add_node("plan", self._plan_analysis)
        workflow.add_node("execute_classification", self._execute_classification)
        workflow.add_node("execute_segmentation", self._execute_segmentation)
        workflow.add_node("execute_grounding", self._execute_grounding)
        workflow.add_node("execute_vqa", self._execute_vqa)
        workflow.add_node("synthesize_findings", self._synthesize_findings)
        
        # Add conditional edges based on plan
        workflow.add_conditional_edges(
            "plan",
            self._should_continue_execution,
            {
                "classification": "execute_classification",
                "segmentation": "execute_segmentation", 
                "grounding": "execute_grounding",
                "vqa": "execute_vqa",
                "synthesize": "synthesize_findings",
                "end": END
            }
        )
        
        # Add edges from execution nodes back to decision point
        workflow.add_edge("execute_classification", "plan")
        workflow.add_edge("execute_segmentation", "plan")
        workflow.add_edge("execute_grounding", "plan")
        workflow.add_edge("execute_vqa", "plan")
        workflow.add_edge("synthesize_findings", END)
        
        # Set entry point
        workflow.set_entry_point("plan")
        
        self.plan_execute_workflow = workflow.compile()
    


    
    def get_react_prompt_template(self) -> str:
        """Get ReAct prompt template for breathing analysis"""
        return """You are a radiologist analyzing the breathing/lung aspects of a chest X-ray.
        
Available tools:
{tools}

Tool names: {tool_names}

Use the following format:
Thought: Consider what lung pathologies to check for
Action: the action to take, should be one of [{tool_names}]
Action Input: the input to the action
Observation: the result of the action
... (repeat Thought/Action/Observation as needed)
Thought: I now have enough information about the lung findings
Final Answer: comprehensive summary of lung findings with confidence levels

TOOL USAGE EXAMPLES:
- For classification: Action Input: {{}}
- For segmentation: Action Input: {{}}
- For grounding: Action Input: {{"phrase": "pneumothorax"}}
- For VQA: Action Input: {{"question": "Is there pneumothorax?"}}

CRITICAL ANALYSIS PROTOCOL:
1. ALWAYS start with the classification tool for broad screening
2. ALWAYS use grounding tool for these critical pathologies regardless of classification confidence:
   - pneumothorax (life-threatening) - use {{"phrase": "pneumothorax"}}
   - pleural effusion (clinically significant) - use {{"phrase": "pleural effusion"}}
   - pneumonia (infectious concern) - use {{"phrase": "pneumonia"}}
   - consolidation (respiratory compromise) - use {{"phrase": "consolidation"}}
3. Use segmentation tool for measurements and percentage calculations
4. Multiple tools may disagree - this is normal and valuable for comprehensive analysis

Focus on these breathing-related pathologies:
- LUNG FIELDS: Pneumothorax, Consolidation, Atelectasis, Infiltrates, Pneumonia, Nodules
- PLEURAL: Pleural Effusion, Pleural Thickening, Pneumothorax
- COSTOPHRENIC ANGLES: Blunting, sharp angles (per ABCDEF B: Breathing)
- VASCULAR: Pulmonary Edema, Vascular Redistribution, Cephalization
- INTERSTITIAL: Interstitial patterns, Fibrosis

IMPORTANT: 
- Even if classification gives low confidence, STILL ground critical pathologies
- Different tools have different strengths - use multiple perspectives
- Combine evidence from all tools for final assessment
- Action Input must be valid JSON without extra quotes or newlines
- Image path is automatically provided to all tools
- For grounding tool, you MUST provide the "phrase" parameter

Query: {input}
Image path: {image_path} (automatically injected into all tool calls)

Begin your systematic breathing analysis:

{agent_scratchpad}"""
    
    def create_plan(self, state: MultiAgentState) -> List[Dict[str, Any]]:
        """Create dynamic plan using LLM with structured output for breathing analysis"""
        query = state.get("query", "")
        
        # If in comparison mode, modify query to avoid comparison within agent
        comparison_mode = state.get("comparison_mode")
        if comparison_mode:
            # Simplify query for single image analysis
            if "pneumothorax" in query.lower():
                query = "Detect pneumothorax and assess lung fields"
            elif "effusion" in query.lower():
                query = "Detect pleural effusion and assess pleural space"
            elif "pneumonia" in query.lower() or "consolidation" in query.lower():
                query = "Detect pneumonia, consolidation, and lung pathologies"
            else:
                query = "Perform comprehensive lung and pleural assessment"
        
        try:
            # Use LLM to generate structured plan
            plan_response = self.planner.invoke({
                "query": query,
                "subtask_templates": self.subtask_templates,
                "tools_available": self.tools_available_desc
            })
            
            # Convert structured plan to execution format
            execution_plan = []
            for subtask in plan_response.subtasks:
                # Convert parameters to dict for execution
                params_dict = subtask.parameters.dict(exclude_none=True)
                
                execution_plan.append({
                    "task_id": subtask.task_id,
                    "description": subtask.description,
                    "tool": subtask.tool,
                    "parameters": params_dict,
                    "depends_on": subtask.depends_on,
                    "clinical_priority": subtask.clinical_priority
                })
            
            # Store planning information for transparency
            state["breathing_planning_reasoning"] = plan_response.reasoning
            state["breathing_clinical_focus"] = plan_response.clinical_focus
            
            return execution_plan
            
        except Exception as e:
            print(f"Error in LLM planning, falling back to basic plan: {e}")
            # Fallback to a basic comprehensive plan
            return self._get_fallback_plan(query)
    
    def _get_fallback_plan(self, query: str) -> List[Dict[str, Any]]:
        """Minimal fallback plan if LLM planning fails"""
        plan = [
            {
                "task_id": "classify_respiratory",
                "description": "General respiratory pathology detection",
                "tool": "chest_xray_classifier",
                "parameters": {"focus": "respiratory"},
                "depends_on": [],
                "clinical_priority": "high"
            },
            {
                "task_id": "segment_lungs",
                "description": "Segment lung structures for measurements",
                "tool": "chest_xray_segmentation",
                "parameters": {"organs": ["Left Lung", "Right Lung", "Pleura"]},
                "depends_on": [],
                "clinical_priority": "medium"
            }
        ]
        
        # Add grounding tasks for critical pathologies if tool is available
        if self.grounding_tool:
            critical_pathologies = ["pneumothorax", "pleural effusion", "consolidation"]
            for pathology in critical_pathologies:
                if pathology in query.lower():
                    plan.append({
                        "task_id": f"localize_{pathology.replace(' ', '_')}",
                        "description": f"Localize {pathology}",
                        "tool": "xray_phrase_grounding",
                        "parameters": {"phrase": pathology},
                        "depends_on": [],
                        "clinical_priority": "high"
                    })
        
        return plan
    
    def analyze(self, state: MultiAgentState) -> MultiAgentState:
        """Perform breathing analysis using configured mode (ReAct or StateGraph)"""
        print(f"\n{'='*60}")
        print(f"BREATHING AGENT: Starting {self.mode} analysis...")
        
        # Clean image path
        image_path = state["image_path"]
        if '\n' in image_path:
            print(f"WARNING: Image path contains newline character! Cleaning it...")
            image_path = image_path.strip()
            state["image_path"] = image_path
        
        print(f"Image path: '{image_path}'")
        print(f"Query: '{state.get('query', '')}'")
        
        # Reset tracking for new analysis
        self.anatomical_measurements = {}
        self.pathology_locations = {}
        self.confidence_scores = {}
        
        if self.mode == "function_calling":
            return self._analyze_function_calling(state, image_path)
        elif self.mode == "react":
            return self._analyze_react(state, image_path)
        elif self.mode == "plan_execute":
            return self._analyze_plan_execute_structured(state, image_path)
        else:
            raise NotImplementedError(f"Mode {self.mode} not implemented yet")
    
    def _process_request(self, state):
        """Process request using function calling (following main.py pattern)"""
        messages = state["messages"]
        
        # Add system message with agent context
        system_msg = SystemMessage(content=f"""You are a {self.agent_name} specialist analyzing medical images.
Available tools: {list(self.tools.keys())}

Focus on your specialty area and use the appropriate tools to analyze the image.
Current image: {state.get('image_path', 'Unknown')}

CRITICAL ANALYSIS PROTOCOL for breathing/lung analysis:
1. ALWAYS start with chest_xray_classifier for broad screening
2. ALWAYS use xray_phrase_grounding for these critical pathologies regardless of classification confidence:
   - pneumothorax (life-threatening)
   - pleural effusion (clinically significant)
   - pneumonia (infectious concern)
   - consolidation (respiratory compromise)
3. Use chest_xray_segmentation for measurements and percentage calculations
4. Multiple tools may disagree - this is normal and valuable for comprehensive analysis

Be systematic and thorough in your analysis.""")
        
        messages_with_system = [system_msg] + messages
        response = self.model_with_tools.invoke(messages_with_system)
        
        return {"messages": [response]}
    
    def _analyze_function_calling(self, state: MultiAgentState, image_path: str) -> MultiAgentState:
        """Analyze using function calling with StateGraph workflow (following main.py pattern)"""
        try:
            print(f"  Executing function calling analysis with query: '{state.get('query', '')}'")
            print(f"  Available tools: {list(self.tools.keys())}")
            
            # Check if query involves critical pathologies that need grounding
            query = state.get("query", "").lower()
            critical_pathologies = ['pneumothorax', 'pleural effusion', 'pneumonia', 'consolidation']
            needs_grounding = any(pathology in query for pathology in critical_pathologies)
            
            if needs_grounding:
                print(f"  🚨 Critical pathology query detected - forcing comprehensive analysis")
                return self._force_comprehensive_analysis(state, image_path)
            
            # Prepare initial message
            query = state.get("query", "Analyze this chest X-ray for breathing abnormalities")
            initial_message = HumanMessage(content=query)
            
            # Execute function calling workflow (exactly like main.py)
            result = self.function_calling_workflow.invoke({
                "messages": [initial_message],
                "image_path": image_path
            })
            
            # Extract findings from tool messages (simplified)
            findings = []
            messages = result.get("messages", [])
            
            # Process tool messages to extract findings
            for message in messages:
                if isinstance(message, ToolMessage):
                    # Parse tool result and extract findings
                    tool_result = self._parse_tool_message(message)
                    if message.name == "chest_xray_classifier":
                        self._process_classification_findings(tool_result, findings, state)
                    elif message.name == "chest_xray_segmentation":
                        self._process_segmentation_findings(tool_result, findings, state)
                    elif message.name == "xray_phrase_grounding":
                        self._process_grounding_findings(tool_result, findings, {"phrase": "from_tool"})
                    elif message.name == "xray_vqa":
                        self._process_vqa_findings(tool_result, findings, {"question": "from_tool"})
            
            # If no findings from tools, extract from final response
            if not findings:
                final_message = messages[-1] if messages else None
                if final_message and hasattr(final_message, 'content'):
                    findings = self._extract_findings_from_response(final_message.content, state)
            
            # Generate synthesis information
            synthesis_info = self._prepare_synthesis_information(findings)
            confidence_level = self._assess_confidence(findings)
            
            state["breathing_analysis"] = AgentAnalysis(
                agent_name="BreathingAgent",
                findings=findings,
                plan_executed=[],
                react_steps=[],
                visual_cot_triggered=any(f.get("visual_cot") for f in findings if isinstance(f, dict)),
                confidence_level=confidence_level,
                needs_human_review=self._needs_review(findings),
                synthesis_info=synthesis_info
            )
            
            print(f"✓ Function calling analysis complete: {len(findings)} findings")
            return state
            
        except Exception as e:
            print(f"Error in function calling analysis: {e}")
            import traceback
            traceback.print_exc()
            
            # Return error state
            state["breathing_analysis"] = AgentAnalysis(
                agent_name="BreathingAgent",
                findings=[],
                plan_executed=[],
                react_steps=[],
                visual_cot_triggered=False,
                confidence_level="error",
                needs_human_review=True,
                synthesis_info={"error": str(e)}
            )
            return state
    
    def _force_comprehensive_analysis(self, state: MultiAgentState, image_path: str) -> MultiAgentState:
        """Force comprehensive analysis with all tools for critical pathologies"""
        print(f"  🔬 Starting forced comprehensive analysis...")
        
        findings = []
        executed_tools = []
        
        # Step 1: Always run classification first
        print(f"  🔍 Step 1: Running classification...")
        try:
            classifier_result = self.tools["chest_xray_classifier"].invoke({"image_path": image_path})
            self._process_classification_findings(classifier_result, findings, state)
            executed_tools.append("chest_xray_classifier")
            print(f"    ✓ Classification complete, found {len(findings)} findings so far")
        except Exception as e:
            print(f"    ✗ Classification failed: {e}")
        
        # Step 2: Always run segmentation
        print(f"  📏 Step 2: Running segmentation...")
        try:
            segmentation_result = self.tools["chest_xray_segmentation"].invoke({"image_path": image_path})
            self._process_segmentation_findings(segmentation_result, findings, state)
            executed_tools.append("chest_xray_segmentation")
            print(f"    ✓ Segmentation complete, found {len(findings)} findings so far")
        except Exception as e:
            print(f"    ✗ Segmentation failed: {e}")
        
        # Step 3: Always run grounding for critical pathologies
        print(f"  🎯 Step 3: Running grounding for critical pathologies...")
        critical_pathologies = ['pneumothorax', 'pleural effusion', 'pneumonia', 'consolidation']
        
        query = state.get("query", "").lower()
        for pathology in critical_pathologies:
            if pathology in query:
                print(f"    🎯 Grounding for: {pathology}")
                try:
                    grounding_result = self.tools["xray_phrase_grounding"].invoke({
                        "image_path": image_path,
                        "phrase": pathology
                    })
                    self._process_grounding_findings(grounding_result, findings, {"phrase": pathology})
                    executed_tools.append(f"xray_phrase_grounding({pathology})")
                    print(f"      ✓ Grounding for {pathology} complete")
                except Exception as e:
                    print(f"      ✗ Grounding for {pathology} failed: {e}")
        
        # Generate synthesis information
        synthesis_info = self._prepare_synthesis_information(findings)
        synthesis_info["forced_comprehensive"] = True
        synthesis_info["executed_tools"] = executed_tools
        
        confidence_level = self._assess_confidence(findings)
        
        state["breathing_analysis"] = AgentAnalysis(
            agent_name="BreathingAgent",
            findings=findings,
            plan_executed=[{"tool": tool, "forced": True} for tool in executed_tools],
            react_steps=[],
            visual_cot_triggered=any(f.get("visual_cot") for f in findings if isinstance(f, dict)),
            confidence_level=confidence_level,
            needs_human_review=self._needs_review(findings),
            synthesis_info=synthesis_info
        )
        
        print(f"✓ Forced comprehensive analysis complete: {len(findings)} findings from {len(executed_tools)} tools")
        return state
    
    def _parse_tool_message(self, tool_message: ToolMessage):
        """Parse tool message content into structured data"""
        try:
            content = tool_message.content
            
            # Try to parse as JSON if it looks like structured data
            if content.startswith('{') or content.startswith('['):
                try:
                    import json
                    return json.loads(content)
                except:
                    return {"raw_content": content}
            else:
                return {"raw_content": content}
        except Exception as e:
            print(f"Error parsing tool message: {e}")
            return {"raw_content": str(tool_message.content)}
    
    def _analyze_react(self, state: MultiAgentState, image_path: str) -> MultiAgentState:
        """Analyze using ReAct mode"""
        try:
            print(f"  Executing ReAct analysis with query: '{state.get('query', '')}'")
            print(f"  Available tools: {list(self.tools.keys())}")
            
            # Debug tool names
            print(f"  Tool names for ReAct: {[tool.name for tool in self.tools.values()]}")
            
            # Set current image path for auto-injection
            self.set_current_image_path(image_path.strip())
            print(f"  Set current image path to: {image_path.strip()}")
            
            # Execute ReAct analysis
            result = self.agent_executor.invoke({
                "input": state.get("query", "").strip(),
                "image_path": image_path.strip()
            })
            
            findings = []
            react_steps = []
            
            # Process intermediate steps
            intermediate_steps = result.get("intermediate_steps", [])
            print(f"  Processed {len(intermediate_steps)} ReAct steps")
            
            for i, step in enumerate(intermediate_steps):
                action, observation = step
                tool_name = action.tool
                tool_input = action.tool_input
                
                print(f"  Step {i+1}: {tool_name} with input {tool_input}")
                react_steps.append(f"{tool_name}: {tool_input}")
                
                # Extract findings from each tool's results
                # Handle both tuple and direct results
                if isinstance(observation, tuple):
                    tool_result, metadata = observation
                    print(f"    Tool returned tuple: {type(tool_result)}, {type(metadata)}")
                else:
                    tool_result = observation
                    metadata = {}
                    print(f"    Tool returned direct result: {type(tool_result)}")
                
                # Process results based on tool name (use actual tool names)
                if tool_name in ["chest_xray_classifier", "ChestXRayClassifierTool"]:
                    print(f"    Processing classification results...")
                    self._process_classification_findings(tool_result, findings, state)
                elif tool_name in ["chest_xray_segmentation", "ChestXRaySegmentationTool"]:
                    print(f"    Processing segmentation results...")
                    self._process_segmentation_findings(tool_result, findings, state)
                elif tool_name in ["xray_phrase_grounding", "XRayPhraseGroundingTool"]:
                    print(f"    Processing grounding results...")
                    self._process_grounding_findings(tool_result, findings, tool_input)
                elif tool_name in ["xray_vqa", "XRayVQATool"]:
                    print(f"    Processing VQA results...")
                    self._process_vqa_findings(tool_result, findings, tool_input)
                else:
                    print(f"    Unknown tool: {tool_name}")
            
            # Also extract findings from final answer if available
            final_answer = result.get("output", "")
            if final_answer and not findings:
                print(f"  Extracting findings from final answer: {final_answer}")
                extracted_findings = self._extract_findings_from_response(final_answer, state)
                findings.extend(extracted_findings)
            
            # Generate synthesis information
            synthesis_info = self._prepare_synthesis_information(findings)
            confidence_level = self._assess_confidence(findings)
            
            state["breathing_analysis"] = AgentAnalysis(
                agent_name="BreathingAgent",
                findings=findings,
                plan_executed=[],
                react_steps=react_steps,
                visual_cot_triggered=any(f.get("visual_cot") for f in findings if isinstance(f, dict)),
                confidence_level=confidence_level,
                needs_human_review=self._needs_review(findings),
                synthesis_info=synthesis_info
            )
            
            print(f"✓ ReAct analysis complete: {len(findings)} findings from {len(react_steps)} steps")
            return state
            
        except Exception as e:
            print(f"Error in breathing ReAct analysis: {e}")
            import traceback
            traceback.print_exc()
            
            # Create fallback analysis
            state["breathing_analysis"] = AgentAnalysis(
                agent_name="BreathingAgent",
                findings=[],
                plan_executed=[],
                react_steps=[f"Error: {str(e)}"],
                visual_cot_triggered=False,
                confidence_level="low",
                needs_human_review=True,
                synthesis_info={}
            )
        
        return state
    
    def _analyze_plan_execute_structured(self, state: MultiAgentState, image_path: str) -> MultiAgentState:
        """Analyze using structured plan-execute mode with clinical prioritization"""
        try:
            print(f"  Executing structured plan-execute analysis with query: '{state.get('query', '')}'")
            print(f"  Available tools: {list(self.tools.keys())}")
            
            # Generate structured plan
            plan = self.create_plan(state)
            print(f"BreathingAgent: Executing plan with {len(plan)} tasks")
            for t in plan:
                print(f"  - {t['task_id']}: {t['description']} (priority: {t.get('clinical_priority', 'medium')})")
            
            findings = []
            executed_plan = []
            measurements = {}
            task_results = {}
            
            # Reset deduplication set for this analysis
            self._findings_dedup.clear()
            
            # Sort tasks by clinical priority
            sorted_plan = sorted(plan, key=lambda x: {"high": 0, "medium": 1, "low": 2}.get(x.get("clinical_priority", "medium"), 1))
            
            # Execute plan with dependency handling
            for task in sorted_plan:
                task_id = task["task_id"]
                
                # Check dependencies
                deps_met = all(dep in task_results for dep in task.get("depends_on", []))
                if not deps_met:
                    print(f"Skipping {task_id} - dependencies not met")
                    continue
                
                print(f"\n🔍 Executing task: {task_id} (priority: {task.get('clinical_priority', 'medium')})")
                
                # Execute task based on tool type
                if task["tool"] == "chest_xray_classifier":
                    result = self._execute_classification_task_structured(state, task, task_results)
                elif task["tool"] == "chest_xray_segmentation":
                    result = self._execute_segmentation_task_structured(state, task, task_results)
                elif task["tool"] == "xray_phrase_grounding":
                    result = self._execute_grounding_task_structured(state, task, task_results)
                elif task["tool"] == "xray_vqa":
                    result = self._execute_vqa_task_structured(state, task, task_results)
                elif task["tool"] == "visual_reasoning":
                    result = self._execute_vcot_task_structured(state, task, task_results, findings)
                else:
                    result = {"success": False, "error": f"Unknown tool: {task['tool']}"}
                
                print(f"Task {task_id} result: success={result.get('success', False)}")
                
                # Store result
                task_results[task_id] = result
                executed_plan.append({
                    "task_id": task_id,
                    "description": task["description"],
                    "result": result,
                    "clinical_priority": task.get("clinical_priority", "medium")
                })
                
                # Process results into findings with structured attributes
                self._process_task_results_structured(task, result, findings, measurements)
            
            print(f"\n✓ BreathingAgent: Generated {len(findings)} findings")
            for f in findings:
                if isinstance(f, dict):
                    location_info = f.get("location_structured", {})
                    extent_info = f.get("extent_structured", {})
                    print(f"  - {f['pathology']}: {f['confidence']:.2f} [{location_info.get('side', 'N/A')}] [{extent_info.get('distribution', 'N/A')}]")
            
            # Update state with breathing analysis
            try:
                confidence_level = self._assess_confidence(findings)
                needs_review = self._needs_review(findings)
                visual_cot_triggered = any(f.get("visual_cot") is not None for f in findings if isinstance(f, dict))
            except Exception as e:
                print(f"Warning: Error in confidence assessment: {e}")
                confidence_level = "medium"
                needs_review = True
                visual_cot_triggered = False
            
            # Generate synthesis information
            synthesis_info = self._prepare_synthesis_information(findings)
            synthesis_info["plan_execute_structured"] = True
            synthesis_info["executed_plan"] = executed_plan
            synthesis_info["clinical_focus"] = state.get("breathing_clinical_focus", [])
            synthesis_info["planning_reasoning"] = state.get("breathing_planning_reasoning", "")
            
            state["breathing_analysis"] = AgentAnalysis(
                agent_name="BreathingAgent",
                findings=findings,
                plan_executed=executed_plan,
                react_steps=[],
                visual_cot_triggered=visual_cot_triggered,
                confidence_level=confidence_level,
                needs_human_review=needs_review,
                synthesis_info=synthesis_info
            )
            
            print(f"✓ Structured plan-execute analysis complete: {len(findings)} findings from {len(executed_plan)} tasks")
            return state
            
        except Exception as e:
            print(f"Error in structured plan-execute analysis: {e}")
            import traceback
            traceback.print_exc()
            
            # Return error state
            state["breathing_analysis"] = AgentAnalysis(
                agent_name="BreathingAgent",
                findings=[],
                plan_executed=[],
                react_steps=[],
                visual_cot_triggered=False,
                confidence_level="error",
                needs_human_review=True,
                synthesis_info={"error": str(e)}
            )
            return state
    
    # Structured task execution methods
    def _execute_classification_task_structured(self, state: MultiAgentState, task: Dict, task_results: Dict) -> Dict:
        """Execute classification task with structured processing"""
        try:
            parameters = task.get("parameters", {})
            if "image_path" not in parameters:
                parameters["image_path"] = state["image_path"]
            
            # Check cache
            cache_key = f"classification_{parameters.get('focus', 'respiratory')}"
            if cache_key in self._classification_cache:
                return self._classification_cache[cache_key]
            
            print(f"  🔍 Calling classifier with params: {parameters}")
            result = self.tools["chest_xray_classifier"].invoke(parameters)
            
            # Handle tuple return
            if isinstance(result, tuple):
                classification, metadata = result
            else:
                classification = result
                metadata = {}
            
            # Convert numpy types to Python types
            if isinstance(classification, dict):
                classification_clean = {}
                for k, v in classification.items():
                    if hasattr(v, 'item'):
                        classification_clean[k] = float(v.item())
                    else:
                        classification_clean[k] = float(v) if isinstance(v, (int, float)) else v
                classification = classification_clean
            
            result_dict = {"success": True, "classification": classification, "metadata": metadata}
            self._classification_cache[cache_key] = result_dict
            return result_dict
            
        except Exception as e:
            print(f"Error in classification task {task['task_id']}: {e}")
            return {"success": False, "error": str(e)}
    
    def _execute_segmentation_task_structured(self, state: MultiAgentState, task: Dict, task_results: Dict) -> Dict:
        """Execute segmentation task with structured processing"""
        try:
            parameters = task.get("parameters", {})
            if "image_path" not in parameters:
                parameters["image_path"] = state["image_path"]
            
            # Optimize organ selection if not specified
            if "organs" not in parameters:
                parameters["organs"] = self._get_optimal_organs_for_breathing_task(task["task_id"])
            
            # Check cache
            organs_sorted = sorted(parameters["organs"])
            cache_key = f"segmentation_{','.join(organs_sorted)}"
            if cache_key in self._segmentation_cache:
                return self._segmentation_cache[cache_key]
            
            print(f"  📏 Calling segmentation with organs: {parameters['organs']}")
            result = self.tools["chest_xray_segmentation"].invoke(parameters)
            
            # Handle tuple return
            if isinstance(result, tuple):
                segmentation_data, metadata = result
            else:
                segmentation_data = result
                metadata = {}
            
            # Calculate breathing-specific measurements
            measurements = self._calculate_breathing_measurements(segmentation_data, task["task_id"])
            segmentation_data['breathing_measurements'] = measurements
            
            result_dict = {"success": True, "segmentation": segmentation_data, "metadata": metadata, "measurements": measurements}
            self._segmentation_cache[cache_key] = result_dict
            return result_dict
            
        except Exception as e:
            print(f"Error in segmentation task {task['task_id']}: {e}")
            return {"success": False, "error": str(e)}
    
    def _execute_grounding_task_structured(self, state: MultiAgentState, task: Dict, task_results: Dict) -> Dict:
        """Execute grounding task with structured processing and V-CoT triggering"""
        try:
            if not self.grounding_tool:
                return {"success": False, "error": "Grounding tool not available"}
            
            parameters = task.get("parameters", {})
            if "image_path" not in parameters:
                parameters["image_path"] = state["image_path"]
            
            phrase = parameters.get("phrase", "pneumothorax")
            print(f"  🎯 Calling grounding for phrase: {phrase}")
            
            result = self.tools["xray_phrase_grounding"].invoke(parameters)
            
            # Handle tuple return
            if isinstance(result, tuple):
                grounding_data, metadata = result
            else:
                grounding_data = result
                metadata = {}
            
            # Extract bounding boxes (no reliable confidence available)
            bboxes = []
            
            if "predictions" in grounding_data and grounding_data["predictions"]:
                prediction = grounding_data["predictions"][0]
                
                if "bounding_boxes" in prediction:
                    bbox_data = prediction["bounding_boxes"].get("image_coordinates", [])
                    if bbox_data:
                        bboxes = bbox_data
            
            # Always trigger V-CoT for grounding results (no reliable confidence threshold)
            visual_cot = None
            percentage_analysis = None
            density_analysis = None
            location_analysis = None
            extent_analysis = None
            
            if bboxes:
                print(f"  🔍 Triggering comprehensive V-CoT analysis")
                visual_cot = self._execute_vcot_with_cropped_region(
                    state, phrase, bboxes[0], 0.5  # Default confidence for V-CoT
                )
                
                # Comprehensive location analysis for all findings
                location_analysis = self._execute_vcot_comprehensive_location_analysis(
                    state, phrase, bboxes[0], 0.5
                )
                
                # Comprehensive extent analysis for all findings
                extent_analysis = self._execute_vcot_comprehensive_extent_analysis(
                    state, phrase, bboxes[0], 0.5
                )
                
                # Optional: Add percentage estimation for pathological findings
                if phrase.lower() in ["pleural effusion", "pneumothorax", "consolidation", "atelectasis"]:
                    percentage_analysis = self._execute_vcot_percentage_estimation(
                        state, phrase, bboxes[0], 0.5
                    )
                    # Log the anatomical reference used
                    if percentage_analysis and "anatomical_reference" in percentage_analysis:
                        print(f"      📊 Percentage estimation using {percentage_analysis['anatomical_reference']} reference")
                
                # Optional: Add density analysis for opacity-based findings
                if phrase.lower() in ["consolidation", "pneumonia", "infiltration", "lung opacity"]:
                    density_analysis = self._execute_vcot_density_analysis(
                        state, phrase, bboxes[0]
                    )
            
            result_dict = {
                "success": True,
                "grounding": grounding_data,
                "confidence": 0.5,  # Default confidence since not reliably available
                "bboxes": bboxes,
                "visual_cot": visual_cot,
                "location_analysis": location_analysis,
                "extent_analysis": extent_analysis,
                "percentage_analysis": percentage_analysis,
                "density_analysis": density_analysis,
                "metadata": metadata
            }
            
            return result_dict
            
        except Exception as e:
            print(f"Error in grounding task {task['task_id']}: {e}")
            return {"success": False, "error": str(e)}
    
    def _execute_vqa_task_structured(self, state: MultiAgentState, task: Dict, task_results: Dict) -> Dict:
        """Execute VQA task with structured processing"""
        try:
            if not self.has_vqa:
                return {"success": False, "error": "VQA tool not available"}
            
            parameters = task.get("parameters", {})
            if "image_path" not in parameters:
                parameters["image_path"] = state["image_path"]
            
            # Generate question if not provided
            if "question" not in parameters:
                parameters["question"] = self._generate_breathing_vqa_question(task["task_id"], state["query"])
            
            print(f"  🤔 Calling VQA with question: {parameters['question']}")
            result = self.tools["xray_vqa"].invoke(parameters)
            
            # Handle tuple return
            if isinstance(result, tuple):
                vqa_data, metadata = result
            else:
                vqa_data = result
                metadata = {}
            
            return {"success": True, "vqa": vqa_data, "metadata": metadata}
            
        except Exception as e:
            print(f"Error in VQA task {task['task_id']}: {e}")
            return {"success": False, "error": str(e)}
    
    def _execute_vcot_task_structured(self, state: MultiAgentState, task: Dict, task_results: Dict, findings: List[Finding]) -> Dict:
        """Execute V-CoT task with structured processing"""
        try:
            if not self.vcot_module:
                return {"success": False, "error": "V-CoT module not available"}
            
            # Get ROI bbox from previous grounding results
            roi_bbox = None
            for task_id, result in task_results.items():
                if result.get("success") and result.get("bboxes"):
                    roi_bbox = result["bboxes"][0]
                    break
            
            # Get measurements from segmentation results
            measurements = {}
            for task_id, result in task_results.items():
                if result.get("success") and result.get("measurements"):
                    measurements.update(result["measurements"])
            
            # Determine task focus
            focus = task.get("parameters", {}).get("focus", "respiratory findings")
            
            # Get confidence from most relevant finding
            primary_conf = 0.5
            for finding in findings:
                if isinstance(finding, dict):
                    primary_conf = finding.get("confidence", 0.5)
                    break
            
            print(f"  🔬 Executing V-CoT for {focus}")
            visual_cot = self.vcot_module.generate(
                image_path=state["image_path"],
                roi_bbox=roi_bbox,
                measurements=measurements,
                task=f"Visual assessment: {focus}",
                confidence=primary_conf
            )
            
            return {"success": True, "visual_cot": visual_cot}
            
        except Exception as e:
            print(f"Error in V-CoT task {task['task_id']}: {e}")
            return {"success": False, "error": str(e)}
    
    def _execute_vcot_with_cropped_region(self, state: MultiAgentState, phrase: str, bbox: List[float], confidence: float) -> Optional[str]:
        """Execute V-CoT with cropped region for low-confidence grounding results"""
        try:
            if not self.vcot_module:
                return None
            
            # Determine lung zone for cropping context
            lung_zone = self._determine_lung_zone_from_bbox(bbox)
            
            print(f"    🔍 V-CoT analysis for {phrase} in {lung_zone} (confidence: {confidence:.2f})")
            
            # Execute V-CoT with cropped region
            visual_cot = self.vcot_module.generate(
                image_path=state["image_path"],
                roi_bbox=bbox,
                measurements={},
                task=f"Detailed analysis of {phrase} in {lung_zone}",
                target=f"{phrase} in {lung_zone}",
                confidence=confidence
            )
            
            return visual_cot
            
        except Exception as e:
            print(f"Error in V-CoT with cropped region: {e}")
            return None
    
    def _execute_vcot_percentage_estimation(self, state: MultiAgentState, phrase: str, pathology_bbox: List[float], confidence: float) -> Optional[Dict]:
        """Execute V-CoT for VQA-style percentage estimation using appropriate anatomical reference"""
        try:
            if not self.vcot_module:
                return None
            
            print(f"    📊 V-CoT percentage estimation for {phrase}")
            
            # Determine if pathology is pleural or parenchymal
            pleural_pathologies = ["pleural effusion", "pneumothorax", "pleural thickening", "pleural mass"]
            is_pleural = any(pleural_path in phrase.lower() for pleural_path in pleural_pathologies)
            
            # Step 1: Ground appropriate anatomical reference
            reference_bboxes = {}
            if is_pleural:
                # For pleural pathologies, use pleural space and lung boundaries
                print(f"    🫁 Grounding pleural space for pleural pathology: {phrase}")
                
                # Ground pleural space
                try:
                    pleural_result = self.tools["xray_phrase_grounding"].invoke({
                        "image_path": state["image_path"],
                        "phrase": "pleural space"
                    })
                    if pleural_result and "predictions" in pleural_result:
                        for pred in pleural_result["predictions"]:
                            if pred.get("bounding_boxes", {}).get("image_coordinates"):
                                reference_bboxes["pleural_space"] = pred["bounding_boxes"]["image_coordinates"][0]
                                break
                except Exception as e:
                    print(f"    Warning: Could not ground pleural space: {e}")
                
                # Also ground lung boundaries for context
                for lung_side in ["left lung", "right lung"]:
                    try:
                        lung_result = self.tools["xray_phrase_grounding"].invoke({
                            "image_path": state["image_path"],
                            "phrase": lung_side
                        })
                        if lung_result and "predictions" in lung_result:
                            for pred in lung_result["predictions"]:
                                if pred.get("bounding_boxes", {}).get("image_coordinates"):
                                    reference_bboxes[lung_side] = pred["bounding_boxes"]["image_coordinates"][0]
                                    break
                    except Exception as e:
                        print(f"    Warning: Could not ground {lung_side}: {e}")
            else:
                # For parenchymal pathologies, use lung information
                print(f"    🫁 Grounding lung parenchyma for parenchymal pathology: {phrase}")
                for lung_side in ["left lung", "right lung"]:
                    try:
                        lung_result = self.tools["xray_phrase_grounding"].invoke({
                            "image_path": state["image_path"],
                            "phrase": lung_side
                        })
                        if lung_result and "predictions" in lung_result:
                            for pred in lung_result["predictions"]:
                                if pred.get("bounding_boxes", {}).get("image_coordinates"):
                                    reference_bboxes[lung_side] = pred["bounding_boxes"]["image_coordinates"][0]
                                    break
                    except Exception as e:
                        print(f"    Warning: Could not ground {lung_side}: {e}")
            
            # Step 2: Calculate spatial relationships
            spatial_measurements = {}
            if reference_bboxes:
                spatial_measurements = self._calculate_spatial_relationships(pathology_bbox, reference_bboxes)
            
            # Step 3: Create evidence list with appropriate anatomical reference
            from ..reasoning.visual_cot import VisualEvidence, VisualEvidenceType
            evidence_list = [
                VisualEvidence(
                    evidence_type=VisualEvidenceType.BOUNDING_BOX,
                    tool_name="grounding_tool",
                    confidence=confidence,
                    data={
                        "pathology_bbox": pathology_bbox,
                        "reference_bboxes": reference_bboxes,
                        "spatial_measurements": spatial_measurements,
                        "is_pleural": is_pleural
                    },
                    description=f"Grounded {phrase} and {'pleural space' if is_pleural else 'lung parenchyma'} with spatial relationships"
                )
            ]
            
            # Step 4: V-CoT with anatomically appropriate percentage estimation task
            if is_pleural:
                task_description = f"Estimate the percentage of {phrase} relative to the affected pleural space. " \
                                 f"For pleural pathologies, assess the extent within the pleural cavity. " \
                                 f"Consider the spatial relationship between the pathology and pleural boundaries. " \
                                 f"Provide a percentage estimate (0-100%) and confidence level."
                target_description = f"{phrase} extent and percentage in pleural space"
            else:
                task_description = f"Estimate the percentage of {phrase} relative to the affected lung volume. " \
                                 f"Consider the spatial overlap between the pathology and lung parenchyma. " \
                                 f"Provide a percentage estimate (0-100%) and confidence level."
                target_description = f"{phrase} extent and percentage in lung parenchyma"
            
            visual_cot_result = self.vcot_module.generate(
                image_path=state["image_path"],
                task=task_description,
                target=target_description,
                evidence_list=evidence_list,
                roi_bbox=pathology_bbox,
                measurements=spatial_measurements
            )
            
            # Step 5: Extract percentage from V-CoT result
            percentage_estimate = self._extract_percentage_from_vcot(visual_cot_result)
            
            return {
                "visual_cot": visual_cot_result,
                "percentage_estimate": percentage_estimate,
                "spatial_measurements": spatial_measurements,
                "reference_bboxes": reference_bboxes,
                "anatomical_reference": "pleural_space" if is_pleural else "lung_parenchyma"
            }
            
        except Exception as e:
            print(f"Error in V-CoT percentage estimation: {e}")
            return None
    
    def _execute_vcot_density_analysis(self, state: MultiAgentState, phrase: str, bbox: List[float]) -> Optional[Dict]:
        """Execute V-CoT with cropped region for density/severity analysis"""
        try:
            if not self.vcot_module:
                return None
            
            print(f"    🔬 V-CoT density analysis for {phrase}")
            
            # Create cropped region for detailed analysis
            roi_image_path = self._create_roi_image(state["image_path"], bbox)
            
            # V-CoT with density-focused analysis
            visual_cot_result = self.vcot_module.generate(
                image_path=roi_image_path,
                task=f"Analyze the radiographic density and clinical severity of {phrase}. "
                      f"Assess opacity patterns, margins, and internal characteristics. "
                      f"Provide severity assessment (mild/moderate/severe) and confidence.",
                target=f"radiographic density and clinical severity of {phrase}",
                evidence_list=[],
                roi_bbox=None,  # Using cropped image
                measurements={}
            )
            
            # Extract density/severity assessment
            density_assessment = self._extract_density_from_vcot(visual_cot_result)
            
            return {
                "visual_cot": visual_cot_result,
                "density_assessment": density_assessment,
                "roi_image_path": roi_image_path
            }
            
        except Exception as e:
            print(f"Error in V-CoT density analysis: {e}")
            return None
    
    def _calculate_spatial_relationships(self, pathology_bbox: List[float], reference_bboxes: Dict[str, List[float]]) -> Dict:
        """Calculate spatial relationships between pathology and anatomical reference boundaries"""
        measurements = {}
        
        try:
            px1, py1, px2, py2 = pathology_bbox  # Pathology bbox
            pathology_area = (px2 - px1) * (py2 - py1)
            
            # Check if we have pleural space reference
            has_pleural_space = "pleural_space" in reference_bboxes
            
            for ref_name, ref_bbox in reference_bboxes.items():
                rx1, ry1, rx2, ry2 = ref_bbox  # Reference bbox
                
                # Calculate overlap area
                overlap_x1 = max(px1, rx1)
                overlap_y1 = max(py1, ry1)
                overlap_x2 = min(px2, rx2)
                overlap_y2 = min(py2, ry2)
                
                if overlap_x1 < overlap_x2 and overlap_y1 < overlap_y2:
                    # There is overlap
                    overlap_area = (overlap_x2 - overlap_x1) * (overlap_y2 - overlap_y1)
                    ref_area = (rx2 - rx1) * (ry2 - ry1)
                    
                    # Calculate percentages
                    pathology_overlap_percent = (overlap_area / pathology_area) * 100 if pathology_area > 0 else 0
                    ref_affected_percent = (overlap_area / ref_area) * 100 if ref_area > 0 else 0
                    
                    # Use appropriate naming based on reference type
                    if ref_name == "pleural_space":
                        measurement_key = f"pleural_space_overlap"
                        affected_key = "pleural_space_affected_percent"
                    else:
                        measurement_key = f"{ref_name}_overlap"
                        affected_key = f"{ref_name.replace(' ', '_')}_affected_percent"
                    
                    measurements[measurement_key] = {
                        "pathology_overlap_percent": pathology_overlap_percent,
                        affected_key: ref_affected_percent,
                        "overlap_area": overlap_area,
                        "has_overlap": True,
                        "reference_type": ref_name
                    }
                else:
                    # No overlap
                    if ref_name == "pleural_space":
                        measurement_key = f"pleural_space_overlap"
                        affected_key = "pleural_space_affected_percent"
                    else:
                        measurement_key = f"{ref_name}_overlap"
                        affected_key = f"{ref_name.replace(' ', '_')}_affected_percent"
                    
                    measurements[measurement_key] = {
                        "pathology_overlap_percent": 0,
                        affected_key: 0,
                        "overlap_area": 0,
                        "has_overlap": False,
                        "reference_type": ref_name
                    }
            
            # For pleural pathologies, calculate pleural space ratio if available
            if has_pleural_space and "pleural_space_overlap" in measurements:
                pleural_measurements = measurements["pleural_space_overlap"]
                measurements["pleural_space_ratio"] = {
                    "pathology_to_pleural_ratio": pleural_measurements["pathology_overlap_percent"],
                    "pleural_involvement_percent": pleural_measurements["pleural_space_affected_percent"],
                    "assessment_type": "pleural_space_analysis"
                }
            
            return measurements
            
        except Exception as e:
            print(f"Error calculating spatial relationships: {e}")
            return {}
    
    def _extract_percentage_from_vcot(self, vcot_result) -> Optional[Dict]:
        """Extract percentage estimate from V-CoT result"""
        try:
            if hasattr(vcot_result, 'direct_visual_assessment'):
                assessment = vcot_result.direct_visual_assessment
            elif hasattr(vcot_result, 'full_reasoning'):
                assessment = vcot_result.full_reasoning
            else:
                assessment = str(vcot_result)
            
            # Simple regex to extract percentage (could be enhanced with NLP)
            import re
            percentage_pattern = r'(\d+(?:\.\d+)?)\s*%'
            matches = re.findall(percentage_pattern, assessment)
            
            if matches:
                percentage = float(matches[0])
                return {
                    "percentage": percentage,
                    "confidence": getattr(vcot_result, 'final_confidence', 0.5),
                    "assessment_text": assessment
                }
            
            return None
            
        except Exception as e:
            print(f"Error extracting percentage from V-CoT: {e}")
            return None
    
    def _extract_density_from_vcot(self, vcot_result) -> Optional[Dict]:
        """Extract density/severity assessment from V-CoT result"""
        try:
            if hasattr(vcot_result, 'direct_visual_assessment'):
                assessment = vcot_result.direct_visual_assessment
            elif hasattr(vcot_result, 'full_reasoning'):
                assessment = vcot_result.full_reasoning
            else:
                assessment = str(vcot_result)
            
            # Extract severity keywords
            severity_keywords = {
                "mild": ["mild", "minor", "small", "limited"],
                "moderate": ["moderate", "medium", "intermediate"],
                "severe": ["severe", "extensive", "large", "significant", "marked"]
            }
            
            assessment_lower = assessment.lower()
            severity = "unknown"
            
            for severity_level, keywords in severity_keywords.items():
                if any(keyword in assessment_lower for keyword in keywords):
                    severity = severity_level
                    break
            
            return {
                "severity": severity,
                "confidence": getattr(vcot_result, 'final_confidence', 0.5),
                "assessment_text": assessment
            }
            
        except Exception as e:
            print(f"Error extracting density from V-CoT: {e}")
            return None
    
    def _create_roi_image(self, image_path: str, bbox: List[float]) -> str:
        """Create cropped ROI image from bounding box"""
        try:
            from PIL import Image
            import uuid
            
            # Load image
            image = Image.open(image_path)
            width, height = image.size
            
            # Convert normalized coordinates to pixel coordinates
            x1 = int(bbox[0] * width)
            y1 = int(bbox[1] * height)
            x2 = int(bbox[2] * width)
            y2 = int(bbox[3] * height)
            
            # Add padding around ROI
            padding = 20
            x1 = max(0, x1 - padding)
            y1 = max(0, y1 - padding)
            x2 = min(width, x2 + padding)
            y2 = min(height, y2 + padding)
            
            # Crop image
            cropped = image.crop((x1, y1, x2, y2))
            
            # Save cropped image
            roi_path = self.temp_dir / f"roi_{uuid.uuid4().hex[:8]}.png"
            cropped.save(roi_path)
            
            return str(roi_path)
            
        except Exception as e:
            print(f"Error creating ROI image: {e}")
            return image_path  # Return original if cropping fails
    
    def _determine_lung_zone_from_bbox(self, bbox: List[float]) -> str:
        """Determine lung zone from bounding box coordinates"""
        x1, y1, x2, y2 = bbox
        center_y = (y1 + y2) / 2
        center_x = (x1 + x2) / 2
        
        # Determine vertical zone
        if center_y < 0.33:
            vertical_zone = "upper"
        elif center_y < 0.67:
            vertical_zone = "middle"
        else:
            vertical_zone = "lower"
        
        # Determine horizontal side
        if center_x < 0.5:
            side = "left"
        else:
            side = "right"
        
        return f"{side} {vertical_zone} lung zone"
    
    def _get_optimal_organs_for_breathing_task(self, task_id: str) -> List[str]:
        """Get optimal organs for breathing-specific tasks"""
        task_organ_mapping = {
            "pneumothorax": ["Left Lung", "Right Lung", "Pleura"],
            "effusion": ["Left Lung", "Right Lung", "Pleura"],
            "consolidation": ["Left Lung", "Right Lung"],
            "atelectasis": ["Left Lung", "Right Lung"],
            "edema": ["Left Lung", "Right Lung", "Heart"],
            "comprehensive": ["Left Lung", "Right Lung", "Pleura", "Trachea"]
        }
        
        # Match task to organ set
        for key, organs in task_organ_mapping.items():
            if key in task_id.lower():
                return organs
        
        # Default to comprehensive lung assessment
        return task_organ_mapping["comprehensive"]
    
    def _calculate_breathing_measurements(self, segmentation_data: Dict, task_id: str) -> Dict:
        """Calculate breathing-specific measurements from segmentation data - DISABLED unreliable measurements"""
        measurements = {}
        
        if not isinstance(segmentation_data, dict) or "metrics" not in segmentation_data:
            return measurements
        
        metrics = segmentation_data["metrics"]
        
        # DISABLED: Pneumothorax percentage calculation
        # Reason: Segmentation tool cannot segment "Pneumothorax" (it's stubbed)
        # Inferring from normal lung segmentation is unreliable
        
        # DISABLED: Pleural effusion percentage calculation  
        # Reason: Segmentation tool cannot segment "Pleural Effusion" (it's stubbed)
        # Inferring from normal lung segmentation is unreliable
        
        # Calculate lung volume asymmetry (RELIABLE - uses normal anatomy)
        if "Left Lung" in metrics and "Right Lung" in metrics:
            left_volume = metrics["Left Lung"]["area_pixels"]
            right_volume = metrics["Right Lung"]["area_pixels"]
            total_volume = left_volume + right_volume
            
            if total_volume > 0:
                asymmetry = abs(left_volume - right_volume) / total_volume
                measurements["lung_volume_asymmetry"] = asymmetry
                
                # Add basic lung area measurements (RELIABLE)
                measurements["left_lung_area_pixels"] = left_volume
                measurements["right_lung_area_pixels"] = right_volume
                measurements["total_lung_area_pixels"] = total_volume
        
        return measurements
    
    def _generate_breathing_vqa_question(self, task_id: str, query: str) -> str:
        """Generate appropriate VQA question based on task and query"""
        task_questions = {
            "pneumothorax": "Is there evidence of pneumothorax in this chest X-ray?",
            "effusion": "Is there evidence of pleural effusion in this chest X-ray?",
            "consolidation": "Is there evidence of consolidation or pneumonia in this chest X-ray?",
            "atelectasis": "Is there evidence of atelectasis or lung collapse in this chest X-ray?",
            "edema": "Is there evidence of pulmonary edema in this chest X-ray?",
            "comprehensive": "What respiratory abnormalities are visible in this chest X-ray?"
        }
        
        # Match task to question
        for key, question in task_questions.items():
            if key in task_id.lower():
                return question
        
        # Default to query-based question
        return f"Based on this query: {query}, what respiratory findings can you observe?"
    
    def _process_task_results_structured(self, task: Dict, result: Dict, findings: List[Finding], measurements: Dict):
        """Process task results into structured findings with location and extent attributes"""
        if not result.get("success"):
            return
        
        task_id = task["task_id"]
        clinical_priority = task.get("clinical_priority", "medium")
        
        # Process classification results
        if "classification" in result:
            self._process_classification_results_structured(
                result["classification"], task_id, clinical_priority, findings
            )
        
        # Process grounding results
        if "grounding" in result:
            self._process_grounding_results_structured(
                result["grounding"], result.get("confidence", 0.5), 
                result.get("bboxes", []), result.get("visual_cot"), 
                task_id, clinical_priority, findings
            )
            
            # Enhance findings with V-CoT location and extent analysis if available
            if result.get("location_analysis") or result.get("extent_analysis"):
                self._enhance_findings_with_vcot_analysis(
                    findings, result.get("location_analysis"), result.get("extent_analysis"),
                    result.get("bboxes", []), task_id
                )
        
        # Process segmentation measurements
        if "measurements" in result:
            measurements.update(result["measurements"])
            self._process_segmentation_measurements_structured(
                result["measurements"], task_id, clinical_priority, findings
            )
        
        # Process VQA results
        if "vqa" in result:
            self._process_vqa_results_structured(
                result["vqa"], task_id, clinical_priority, findings
            )
    
    def _process_classification_results_structured(self, classification: Dict, task_id: str, priority: str, findings: List[Finding]):
        """Process classification results with structured attributes"""
        breathing_pathologies = {
            "Pneumothorax": "pneumothorax",
            "Effusion": "pleural_effusion",
            "Consolidation": "consolidation",
            "Atelectasis": "atelectasis",
            "Pneumonia": "pneumonia",
            "Edema": "pulmonary_edema",
            "Infiltration": "infiltration",
            "Lung Opacity": "lung_opacity"
        }
        
        for classification_name, pathology_name in breathing_pathologies.items():
            if classification_name in classification:
                conf = classification[classification_name]
                if conf > 0.3:  # Threshold for reporting
                    # Create structured finding
                    finding = {
                        "pathology": pathology_name,
                        "confidence": conf,
                        "location": None,  # Will be enhanced by grounding
                        "location_structured": FindingLocation(
                            side="unknown",
                            zone=None,
                            lobe=None,
                            position=None
                        ).dict(),
                        "extent_structured": FindingExtent(
                            distribution="unknown",
                            size=None,
                            percentage=None,
                            involvement=None
                        ).dict(),
                        "measurements": None,
                        "visual_cot": None,
                        "evidence": f"{classification_name} detected by classification (confidence: {conf:.3f})",
                        "clinical_priority": priority,
                        "task_source": task_id
                    }
                    
                    # Deduplicate
                    finding_key = f"{pathology_name}_{task_id}"
                    if finding_key not in self._findings_dedup:
                        self._findings_dedup.add(finding_key)
                        findings.append(finding)
    
    def _process_grounding_results_structured(self, grounding: Dict, confidence: float, bboxes: List, visual_cot: Optional[str], task_id: str, priority: str, findings: List[Finding]):
        """Process grounding results with structured location attributes"""
        if not grounding.get("predictions"):
            return
        
        for prediction in grounding["predictions"]:
            phrase = prediction.get("phrase", "unknown")
            bbox_data = prediction.get("bounding_boxes", {}).get("image_coordinates", [])
            
            if bbox_data:
                bbox = bbox_data[0]
                
                # Extract V-CoT enhanced location and extent if available
                # Check if we have V-CoT analysis results from the task result
                vcot_location_analysis = None
                vcot_extent_analysis = None
                
                # These will be passed through the task result processing
                # For now, fall back to basic extraction
                location_structured = self._extract_location_from_bbox(bbox)
                extent_structured = self._extract_extent_from_bbox(bbox)
                
                # Create structured finding (use default confidence since not reliably available)
                pathology_name = phrase.lower().replace(" ", "_")
                finding = {
                    "pathology": pathology_name,
                    "confidence": 0.5,  # Default confidence since grounding confidence is not reliable
                    "location": bbox,
                    "location_structured": location_structured.dict(),
                    "extent_structured": extent_structured.dict(),
                    "measurements": None,
                    "visual_cot": visual_cot,
                    "evidence": f"Grounded finding: {phrase} located (confidence not reliably available)",
                    "clinical_priority": priority,
                    "task_source": task_id
                }
                
                # Deduplicate
                finding_key = f"{pathology_name}_{task_id}_{bbox[0]:.2f}_{bbox[1]:.2f}"
                if finding_key not in self._findings_dedup:
                    self._findings_dedup.add(finding_key)
                    findings.append(finding)
    
    def _process_segmentation_measurements_structured(self, measurements: Dict, task_id: str, priority: str, findings: List[Finding]):
        """Process segmentation measurements with structured attributes - DISABLED unreliable percentage measurements"""
        # Process reliable measurements only
        for measurement_name, value in measurements.items():
            # Only process reliable measurements (lung volume asymmetry, basic areas)
            if measurement_name == "lung_volume_asymmetry" and value > 0.2:  # >20% asymmetry is significant
                extent_structured = FindingExtent(
                    distribution="measured",
                    size="moderate" if value < 0.4 else "large",
                    percentage=value * 100,  # Convert to percentage
                    involvement=f"{value*100:.1f}% volume difference between lungs"
                ).dict()
                
                finding = {
                    "pathology": "lung_volume_asymmetry",
                    "confidence": 0.8,  # High confidence for quantitative measurements
                    "location": None,
                    "location_structured": FindingLocation(
                        side="bilateral",
                        zone=None,
                        lobe=None,
                        position=None
                    ).dict(),
                    "extent_structured": extent_structured,
                    "measurements": {measurement_name: value},
                    "visual_cot": None,
                    "evidence": f"Lung volume asymmetry: {value*100:.1f}% difference",
                    "clinical_priority": priority,
                    "task_source": task_id
                }
                
                # Deduplicate
                finding_key = f"lung_volume_asymmetry_measurement_{task_id}"
                if finding_key not in self._findings_dedup:
                    self._findings_dedup.add(finding_key)
                    findings.append(finding)
            
            # DISABLED: Pneumothorax and pleural effusion percentage measurements
            # These are unreliable as they try to infer pathology from normal lung segmentation
    
    def _process_vqa_results_structured(self, vqa_data: Dict, task_id: str, priority: str, findings: List[Finding]):
        """Process VQA results with structured attributes"""
        # This is a simplified implementation - could be enhanced with NLP parsing
        answer = vqa_data.get("answer", "")
        confidence = vqa_data.get("confidence", 0.5)
        
        # Simple keyword extraction for pathologies
        pathology_keywords = {
            "pneumothorax": ["pneumothorax", "collapsed lung", "air in pleural"],
            "pleural_effusion": ["pleural effusion", "fluid in pleural", "pleural fluid"],
            "consolidation": ["consolidation", "opacity", "infiltrate"],
            "atelectasis": ["atelectasis", "collapse", "volume loss"]
        }
        
        answer_lower = answer.lower()
        for pathology, keywords in pathology_keywords.items():
            if any(keyword in answer_lower for keyword in keywords):
                finding = {
                    "pathology": pathology,
                    "confidence": confidence,
                    "location": None,
                    "location_structured": FindingLocation(
                        side="unknown",
                        zone=None,
                        lobe=None,
                        position=None
                    ).dict(),
                    "extent_structured": FindingExtent(
                        distribution="unknown",
                        size=None,
                        percentage=None,
                        involvement=None
                    ).dict(),
                    "measurements": None,
                    "visual_cot": None,
                    "evidence": f"VQA finding: {answer}",
                    "clinical_priority": priority,
                    "task_source": task_id
                }
                
                # Deduplicate
                finding_key = f"{pathology}_vqa_{task_id}"
                if finding_key not in self._findings_dedup:
                    self._findings_dedup.add(finding_key)
                    findings.append(finding)
    
    def _extract_location_from_bbox(self, bbox: List[float]) -> FindingLocation:
        """Extract structured location information from bounding box"""
        x1, y1, x2, y2 = bbox
        center_x = (x1 + x2) / 2
        center_y = (y1 + y2) / 2
        
        # Determine side
        if center_x < 0.45:
            side = "left"
        elif center_x > 0.55:
            side = "right"
        else:
            side = "midline"
        
        # Determine zone
        if center_y < 0.33:
            zone = "upper"
        elif center_y < 0.67:
            zone = "middle"
        else:
            zone = "lower"
        
        # Determine position (peripheral vs central)
        if center_x < 0.2 or center_x > 0.8:
            position = "peripheral"
        elif 0.4 < center_x < 0.6:
            position = "central"
        else:
            position = "intermediate"
        
        return FindingLocation(
            side=side,
            zone=zone,
            lobe=None,  # Could be enhanced with lobe detection
            position=position
        )
    
    def _extract_extent_from_bbox(self, bbox: List[float]) -> FindingExtent:
        """Extract structured extent information from bounding box"""
        x1, y1, x2, y2 = bbox
        width = x2 - x1
        height = y2 - y1
        area = width * height
        
        # Determine distribution based on size
        if area < 0.1:
            distribution = "focal"
        elif area < 0.25:
            distribution = "multifocal"
        else:
            distribution = "diffuse"
        
        # Determine size category
        if area < 0.05:
            size = "small"
        elif area < 0.2:
            size = "moderate"
        else:
            size = "large"
        
        return FindingExtent(
            distribution=distribution,
            size=size,
            percentage=None,  # Could be calculated relative to lung area
            involvement=None
        )
    
    def _extract_findings_from_response(self, response: str, state: MultiAgentState) -> List[Finding]:
        """Extract structured findings from the agent's response"""
        findings = []
        
        # This is a simplified extraction - you could make it more sophisticated
        # by parsing the response more carefully or using structured output
        
        # Common breathing pathologies to look for in the response
        pathology_keywords = {
            "pneumothorax": ["pneumothorax", "ptx", "collapsed lung"],
            "pleural_effusion": ["pleural effusion", "fluid in pleural", "pleural fluid"],
            "consolidation": ["consolidation", "consolidation"],
            "atelectasis": ["atelectasis", "collapse", "volume loss"],
            "pneumonia": ["pneumonia", "infection", "inflammatory"],
            "pulmonary_edema": ["pulmonary edema", "edema", "fluid in lungs"],
            "pleural_thickening": ["pleural thickening", "thickened pleura"],
            "costophrenic_blunting": ["costophrenic", "blunted", "angle"],
            "lung_opacity": ["opacity", "opacification", "shadowing"],
            "lung_nodule": ["nodule", "mass", "lesion"]
        }
        
        # Look for pathologies in the response
        response_lower = response.lower()
        
        for pathology, keywords in pathology_keywords.items():
            for keyword in keywords:
                if keyword in response_lower:
                    # Extract confidence if mentioned
                    confidence = 0.5  # Default confidence
                    
                    # Look for confidence patterns
                    if "high confidence" in response_lower:
                        confidence = 0.8
                    elif "low confidence" in response_lower:
                        confidence = 0.3
                    elif "moderate confidence" in response_lower:
                        confidence = 0.6
                    elif "suspicious" in response_lower:
                        confidence = 0.4
                    elif "likely" in response_lower:
                        confidence = 0.7
                    elif "possible" in response_lower:
                        confidence = 0.4
                    elif "probable" in response_lower:
                        confidence = 0.6
                    
                    # Look for negative findings
                    if any(neg in response_lower for neg in ["no", "not", "negative", "absent", "clear"]):
                        confidence = 0.1  # Low confidence for negative findings
                    
                    findings.append(Finding(
                        pathology=pathology,
                        confidence=confidence,
                        location=None,  # Could be extracted from response if available
                        measurements=None,  # Could be extracted from response if available
                        visual_cot=None,
                        evidence=f"Extracted from agent response: {keyword}"
                    ))
                    break  # Only add once per pathology
        
        # If no specific pathologies found, create a general finding
        if not findings:
            findings.append(Finding(
                pathology="general_assessment",
                confidence=0.5,
                location=None,
                measurements=None,
                visual_cot=None,
                evidence="General breathing assessment completed"
            ))
        
        return findings
    

    
    def _process_classification_findings(self, observation: Any, findings: List[Finding], state: MultiAgentState):
        """Process classification results for lung pathologies"""
        if not isinstance(observation, dict):
            return
        
        # Map actual classification output to breathing pathologies
        # Based on the classification tool, it returns these pathologies:
        breathing_pathology_mapping = {
            "Pneumothorax": "pneumothorax",
            "Consolidation": "consolidation", 
            "Atelectasis": "atelectasis",
            "Effusion": "pleural_effusion",  # Tool returns "Effusion" not "Pleural Effusion"
            "Pneumonia": "pneumonia",
            "Infiltration": "infiltration",
            "Edema": "pulmonary_edema",  # Tool returns "Edema" not "Pulmonary Edema"
            "Nodule": "lung_nodule",
            "Mass": "lung_mass",
            "Lung Opacity": "lung_opacity",
            "Lung Lesion": "lung_lesion",
            "Pleural Thickening": "pleural_thickening"
        }
        
        for classification_name, pathology_name in breathing_pathology_mapping.items():
            confidence = observation.get(classification_name, 0)
            
            # Convert numpy types to float if needed
            if hasattr(confidence, 'item'):
                confidence = float(confidence.item())
            else:
                confidence = float(confidence)
            
            if confidence > 0.2:  # Lower threshold for reporting
                
                # Store confidence for synthesis
                self.confidence_scores[pathology_name] = confidence
                
                # Check if V-CoT should be triggered
                visual_cot = None
                if self.should_trigger_vcot(confidence):
                    visual_cot = self._execute_vcot(state, pathology_name, confidence)
                
                findings.append(Finding(
                    pathology=pathology_name,
                    confidence=confidence,
                    location=None,  # Will be filled by grounding
                    measurements=None,
                    visual_cot=visual_cot,
                    evidence=f"Classification confidence: {confidence:.3f} for {classification_name}"
                ))
    
    def _process_segmentation_findings(self, observation: Any, findings: List[Finding], state: MultiAgentState):
        """Process segmentation results for anatomical measurements and percentage calculations"""
        if not isinstance(observation, dict) or "metrics" not in observation:
            return
        
        metrics = observation["metrics"]
        
        # Store anatomical measurements for synthesis
        self.anatomical_measurements = {
            "lung_metrics": {},
            "pleural_metrics": {},
            "vascular_metrics": {}
        }
        
        # Extract lung field measurements
        if "Left Lung" in metrics:
            self.anatomical_measurements["lung_metrics"]["left_lung"] = metrics["Left Lung"]
        if "Right Lung" in metrics:
            self.anatomical_measurements["lung_metrics"]["right_lung"] = metrics["Right Lung"]
        
        # DISABLED: Pleural effusion percentage calculation
        # Reason: Cannot reliably infer effusion from normal lung segmentation
        
        # DISABLED: Pneumothorax percentage calculation  
        # Reason: Cannot reliably infer pneumothorax from normal lung segmentation
        
        # Calculate costophrenic angle measurements
        costophrenic_findings = self._calculate_costophrenic_angles(metrics)
        if costophrenic_findings:
            confidence = costophrenic_findings["confidence"]
            
            visual_cot = None
            if self.should_trigger_vcot(confidence):
                visual_cot = self._execute_vcot(state, "costophrenic_blunting", confidence)
            
            findings.append(Finding(
                pathology="costophrenic_blunting",
                confidence=confidence,
                location=None,
                measurements=costophrenic_findings["measurements"],
                visual_cot=visual_cot,
                evidence=costophrenic_findings["evidence"]
            ))
    
    def _calculate_pleural_effusion_percentage(self, metrics: Dict) -> Optional[float]:
        """DISABLED: Cannot reliably calculate pleural effusion from normal lung segmentation"""
        # Reason: Segmentation tool cannot segment "Pleural Effusion" (it's stubbed)
        # Inferring from lung area reduction is unreliable - could be due to:
        # - Patient positioning, inspiration level, image quality, etc.
        return None
    
    def _calculate_pneumothorax_percentage(self, metrics: Dict) -> Optional[float]:
        """DISABLED: Cannot reliably calculate pneumothorax from normal lung segmentation"""  
        # Reason: Segmentation tool cannot segment "Pneumothorax" (it's stubbed)
        # Inferring from lung area reduction and position changes is unreliable - could be due to:
        # - Patient positioning, inspiration level, image quality, etc.
        return None
    
    def _calculate_costophrenic_angles(self, metrics: Dict) -> Optional[Dict]:
        """Calculate costophrenic angle measurements from segmentation"""
        try:
            # Use diaphragm and lung positions to estimate angles
            diaphragm = metrics.get("Facies Diaphragmatica", {})
            left_lung = metrics.get("Left Lung", {})
            right_lung = metrics.get("Right Lung", {})
            
            if not all([diaphragm, left_lung, right_lung]):
                return None
            
            # Get actual bounding boxes to calculate angles
            diaphragm_bbox = diaphragm.get("bbox", [0, 0, 0, 0])  # [min_y, min_x, max_y, max_x]
            left_bbox = left_lung.get("bbox", [0, 0, 0, 0])
            right_bbox = right_lung.get("bbox", [0, 0, 0, 0])
            
            # Calculate where lung meets diaphragm (costophrenic angle)
            # Left costophrenic angle: left lung bottom-left corner vs diaphragm
            left_lung_bottom = left_bbox[2]  # max_y (bottom)
            left_lung_left = left_bbox[1]    # min_x (left edge)
            diaphragm_top = diaphragm_bbox[0]  # min_y (top)
            
            # Right costophrenic angle: right lung bottom-right corner vs diaphragm  
            right_lung_bottom = right_bbox[2]  # max_y (bottom)
            right_lung_right = right_bbox[3]   # max_x (right edge)
            
            # Calculate overlap/gap between lung and diaphragm
            # Normal sharp angle: lung extends close to diaphragm
            # Blunted angle: gap between lung and diaphragm (filled with fluid)
            
            left_gap = abs(left_lung_bottom - diaphragm_top)
            right_gap = abs(right_lung_bottom - diaphragm_top)
            
            # Convert gap to angle estimate (smaller gap = sharper angle)
            # Normal costophrenic angle is ~90 degrees
            # Blunted angle is <75 degrees
            
            # Gap of 0-5 pixels = sharp (90°), gap of 20+ pixels = blunted (60°)
            max_gap = 25  # pixels
            
            left_angle = 90 - min(left_gap / max_gap * 30, 30)  # 90° down to 60°
            right_angle = 90 - min(right_gap / max_gap * 30, 30)
            
            # Also check lung area reduction (effusion reduces visible lung)
            left_area = left_lung.get("area_cm2", 175)
            right_area = right_lung.get("area_cm2", 175)
            
            # If lung area is significantly reduced, angle is likely blunted
            if left_area < 140:  # <140 cm2 suggests volume loss
                left_angle = min(left_angle, 75)
            if right_area < 140:
                right_angle = min(right_angle, 75)
            
            # Check for blunting (angle < 75°)
            if left_angle < 75 or right_angle < 75:
                confidence = 0.8 if min(left_angle, right_angle) < 70 else 0.6
                return {
                    "confidence": confidence,
                    "measurements": {
                        "left_angle": left_angle,
                        "right_angle": right_angle,
                        "left_gap_pixels": left_gap,
                        "right_gap_pixels": right_gap
                    },
                    "evidence": f"Costophrenic angles: L={left_angle:.1f}°, R={right_angle:.1f}° (per ABCDEF B: Breathing)"
                }
            
            return None
            
        except Exception as e:
            print(f"Error calculating costophrenic angles: {e}")
            return None
    
    def _process_grounding_findings(self, observation: Any, findings: List[Finding], tool_input: Dict):
        """Process grounding results to add precise location information and create new findings"""
        if not isinstance(observation, dict) or not observation.get("predictions"):
            return
        
        # Extract bounding box information
        for prediction in observation["predictions"]:
            phrase = prediction.get("phrase", tool_input.get("phrase", "unknown"))
            bbox_data = prediction.get("bounding_boxes", {}).get("image_coordinates", [])
            
            if bbox_data:
                # Store location for synthesis
                self.pathology_locations[phrase] = bbox_data
                
                # Match and update existing findings
                found_match = False
                for finding in findings:
                    if isinstance(finding, dict) and finding.get("pathology"):
                        pathology = finding["pathology"].replace("_", " ")
                        if phrase.lower() in pathology or pathology in phrase.lower():
                            finding["location"] = bbox_data[0] if bbox_data else None
                            finding["evidence"] += f" | Located at: {bbox_data[0]}" if bbox_data else ""
                            found_match = True
                            break
                
                # If no existing finding matched, create a new one from grounding
                if not found_match:
                    # Convert phrase to standardized pathology name
                    pathology_name = phrase.lower().replace(" ", "_")
                    
                    # Estimate confidence based on grounding success
                    # If grounding found it, it's likely present
                    confidence = 0.75  # High confidence from visual grounding
                    
                    # Calculate location-based measurements if possible
                    measurements = {}
                    if bbox_data:
                        bbox = bbox_data[0]
                        # Calculate size and position metrics
                        width = bbox[2] - bbox[0]  # x2 - x1
                        height = bbox[3] - bbox[1]  # y2 - y1
                        area = width * height
                        center_x = (bbox[0] + bbox[2]) / 2
                        center_y = (bbox[1] + bbox[3]) / 2
                        
                        measurements = {
                            "bbox_width": width,
                            "bbox_height": height,
                            "bbox_area": area,
                            "center_x": center_x,
                            "center_y": center_y
                        }
                    
                    # Trigger V-CoT for grounding-based findings
                    visual_cot = None
                    if self.should_trigger_vcot(confidence):
                        visual_cot = self._execute_vcot(None, pathology_name, confidence)
                    
                    findings.append(Finding(
                        pathology=pathology_name,
                        confidence=confidence,
                        location=bbox_data[0] if bbox_data else None,
                        measurements=measurements,
                        visual_cot=visual_cot,
                        evidence=f"Grounded finding: {phrase} located at {bbox_data[0]}"
                    ))
            
            else:
                # No bounding boxes found - this might be a negative finding
                phrase = prediction.get("phrase", tool_input.get("phrase", "unknown"))
                pathology_name = phrase.lower().replace(" ", "_")
                
                findings.append(Finding(
                    pathology=pathology_name,
                    confidence=0.1,  # Low confidence for negative grounding
                    location=None,
                    measurements=None,
                    visual_cot=None,
                    evidence=f"Grounding tool could not locate: {phrase}"
                ))
    
    def _process_vqa_findings(self, observation: Any, findings: List[Finding], tool_input: Dict):
        """Process VQA results for additional insights"""
        if not isinstance(observation, dict):
            return
        
        question = tool_input.get("question", "")
        answer = observation.get("answer", "")
        confidence = observation.get("confidence", 0.5)
        
        # Extract pathology from question context
        question_lower = question.lower()
        pathology = "lung_finding"
        
        if "pneumothorax" in question_lower:
            pathology = "pneumothorax"
        elif "effusion" in question_lower:
            pathology = "pleural_effusion"
        elif "pneumonia" in question_lower or "consolidation" in question_lower:
            pathology = "pneumonia"
        elif "opacity" in question_lower or "infiltrate" in question_lower:
            pathology = "lung_opacity"
        
        # Only add if answer suggests positive finding
        if any(word in answer.lower() for word in ["yes", "present", "visible", "seen", "shows"]):
            visual_cot = None
            if self.should_trigger_vcot(confidence):
                visual_cot = self._execute_vcot(None, pathology, confidence)
            
            findings.append(Finding(
                pathology=pathology,
                confidence=confidence,
                location=None,
                measurements=None,
                visual_cot=visual_cot,
                evidence=f"VQA - Q: {question} | A: {answer}"
            ))
    
    def _prepare_synthesis_information(self, findings: List[Finding]) -> Dict:
        """Prepare comprehensive information for synthesis agent"""
        synthesis_info = {
            "anatomical_measurements": self.anatomical_measurements,
            "pathology_locations": self.pathology_locations,
            "confidence_scores": self.confidence_scores,
            "clinical_significance": self._assess_clinical_significance(findings),
            "measurement_methods": {
                "pleural_effusion": "vcot_percentage_estimation_pleural_space",  # V-CoT with pleural space reference
                "pneumothorax": "vcot_percentage_estimation_pleural_space",      # V-CoT with pleural space reference
                "consolidation": "vcot_percentage_estimation_lung_parenchyma",   # V-CoT with lung parenchyma reference
                "atelectasis": "vcot_percentage_estimation_lung_parenchyma",     # V-CoT with lung parenchyma reference
                "costophrenic_angles": "geometric_estimation",
                "lung_fields": "area_and_position_analysis"
            },
            "grounding_coverage": len(self.pathology_locations),
            "total_findings": len(findings)
        }
        
        return synthesis_info
    
    def _assess_clinical_significance(self, findings: List[Finding]) -> Dict:
        """Assess clinical significance of findings"""
        significance = {
            "high_priority": [],
            "moderate_priority": [],
            "low_priority": []
        }
        
        for finding in findings:
            if isinstance(finding, dict):
                pathology = finding.get("pathology", "")
                confidence = finding.get("confidence", 0)
                measurements = finding.get("measurements", {}) or {}  # Fix null check
                
                # Assess priority based on pathology type and confidence (no percentage measurements)
                if pathology in ["pneumothorax", "pleural_effusion"]:
                    # Use classification confidence only (no percentage measurements available)
                    if confidence > 0.7:
                        significance["high_priority"].append(pathology)
                    elif confidence > 0.5:
                        significance["moderate_priority"].append(pathology)
                    else:
                        significance["low_priority"].append(pathology)
                elif pathology in ["pneumonia", "consolidation"]:
                    if confidence > 0.8:
                        significance["high_priority"].append(pathology)
                    else:
                        significance["moderate_priority"].append(pathology)
                else:
                    significance["low_priority"].append(pathology)
        
        return significance
    
    def _execute_vcot(self, state: Optional[MultiAgentState], pathology: str, confidence: float) -> Optional[str]:
        """Execute V-CoT analysis for uncertain findings"""
        if not self.vcot_module or not state:
            return None
        
        try:
            # Create evidence list from the finding
            from ..reasoning.visual_cot import VisualEvidence, VisualEvidenceType
            evidence_list = [VisualEvidence(
                evidence_type=VisualEvidenceType.CLASSIFICATION_RESULT,
                tool_name="chest_xray_classifier",
                confidence=confidence,
                data={"pathology": pathology, "confidence": confidence},
                description=f"Classification detected {pathology} with confidence {confidence:.2f}"
            )]
            
            # Define target based on pathology
            target_mapping = {
                "pneumothorax": "pneumothorax in pleural space",
                "pleural_effusion": "pleural effusion in pleural space",
                "consolidation": "consolidation in lung parenchyma",
                "pneumonia": "pneumonia in lung fields",
                "atelectasis": "atelectasis in lung fields",
                "lung_opacity": "lung opacity in lung fields",
                "costophrenic_blunting": "costophrenic angle blunting"
            }
            
            target = target_mapping.get(pathology, f"lung finding related to {pathology}")
            
            result = self.vcot_module.generate(
                image_path=state["image_path"],
                task=f"Verify {pathology} finding in chest X-ray",
                target=target,
                evidence_list=evidence_list,
                roi_bbox=None,
                measurements={}
            )
            
            return result.full_reasoning if hasattr(result, 'full_reasoning') else str(result)
            
        except Exception as e:
            print(f"Error in V-CoT for {pathology}: {e}")
            return None
    
    def _needs_review(self, findings: List[Finding]) -> bool:
        """Determine if human review is needed"""
        # Review needed for significant lung pathologies
        high_priority_pathologies = ["pneumothorax", "pleural_effusion", "pneumonia"]
        
        for finding in findings:
            if isinstance(finding, dict):
                pathology = finding.get("pathology", "")
                confidence = self._extract_confidence_value(finding.get("confidence", 0))
                measurements = finding.get("measurements", {}) or {}  # Fix null check
                
                # High confidence concerning findings (no percentage measurements available)
                if pathology in high_priority_pathologies and confidence > 0.7:
                    return True
        
        return False
    
    def _assess_confidence(self, findings: List[Finding]) -> str:
        """Assess overall confidence level based on findings"""
        if not findings:
            return "high"  # High confidence in negative findings
        
        confidences = [self._extract_confidence_value(f.get("confidence", 0)) for f in findings if isinstance(f, dict)]
        if not confidences:
            return "high"
        
        avg_confidence = sum(confidences) / len(confidences)
        
        # Check for any very uncertain findings
        min_confidence = min(confidences)
        
        if min_confidence < 0.3:
            return "low"
        elif avg_confidence >= 0.7:
            return "high"
        else:
            return "medium"
    
    # Plan-Execute workflow methods
    def _plan_analysis(self, state: dict) -> dict:
        """Create or update the analysis plan based on query and current findings"""
        query = state.get("query", "")
        findings = state.get("findings", [])
        current_step = state.get("current_step", 0)
        
        # Create initial plan if not exists
        if not state.get("plan"):
            plan = self._create_initial_plan(query)
            state["plan"] = plan
            print(f"  📋 Created analysis plan with {len(plan)} steps")
        
        # Check if we need to add more steps based on findings
        plan = state["plan"]
        if findings and current_step < len(plan):
            additional_steps = self._evaluate_additional_steps(findings, query)
            if additional_steps:
                plan.extend(additional_steps)
                state["plan"] = plan
                print(f"  📋 Added {len(additional_steps)} additional steps to plan")
        
        state["current_step"] = current_step
        return state
    
    def _create_initial_plan(self, query: str) -> List[Dict]:
        """Create initial analysis plan based on query"""
        query_lower = query.lower()
        plan = []
        
        # Always start with classification for broad screening
        plan.append({
            "step": "classification",
            "tool": "chest_xray_classifier",
            "purpose": "Broad pathology screening",
            "priority": "high"
        })
        
        # Add segmentation for measurements and anatomical analysis
        plan.append({
            "step": "segmentation", 
            "tool": "chest_xray_segmentation",
            "purpose": "Anatomical measurements and quantification",
            "priority": "medium"
        })
        
        # Add grounding for critical pathologies
        critical_pathologies = ['pneumothorax', 'pleural effusion', 'pneumonia', 'consolidation']
        for pathology in critical_pathologies:
            if pathology in query_lower or "abnormalities" in query_lower or "report" in query_lower:
                plan.append({
                    "step": "grounding",
                    "tool": "xray_phrase_grounding", 
                    "purpose": f"Localize {pathology}",
                    "priority": "high",
                    "phrase": pathology
                })
        
        # Add VQA for complex or report-generation queries
        if any(keyword in query_lower for keyword in ["report", "abnormalities", "describe", "findings", "assessment"]):
            if self.has_vqa:
                plan.append({
                    "step": "vqa",
                    "tool": "xray_vqa",
                    "purpose": "Detailed analysis and description",
                    "priority": "medium"
                })
        
        # Always end with synthesis
        plan.append({
            "step": "synthesize",
            "tool": "synthesize_findings",
            "purpose": "Comprehensive finding synthesis",
            "priority": "high"
        })
        
        return plan
    
    def _evaluate_additional_steps(self, findings: List[Finding], query: str) -> List[Dict]:
        """Evaluate if additional analysis steps are needed based on current findings"""
        additional_steps = []
        
        # If high-confidence pathologies found, add specific grounding
        for finding in findings:
            if isinstance(finding, dict):
                pathology = finding.get("pathology", "")
                confidence = finding.get("confidence", 0)
                
                if confidence > 0.7 and pathology in ["pneumothorax", "pleural_effusion", "consolidation"]:
                    # Check if we already have grounding for this pathology
                    existing_grounding = any(
                        step.get("phrase") == pathology 
                        for step in additional_steps 
                        if step.get("step") == "grounding"
                    )
                    
                    if not existing_grounding:
                        additional_steps.append({
                            "step": "grounding",
                            "tool": "xray_phrase_grounding",
                            "purpose": f"Precise localization of {pathology}",
                            "priority": "high",
                            "phrase": pathology
                        })
        
        return additional_steps
    
    def _should_continue_execution(self, state: dict) -> str:
        """Determine next step in plan-execute workflow"""
        plan = state.get("plan", [])
        current_step = state.get("current_step", 0)
        completed_steps = state.get("completed_steps", [])
        
        # Check if we've completed all steps
        if current_step >= len(plan):
            if not state.get("synthesis_complete", False):
                return "synthesize"
            else:
                return "end"
        
        # Get next step
        next_step = plan[current_step]
        step_type = next_step["step"]
        
        # Skip if already completed
        if step_type in completed_steps:
            state["current_step"] = current_step + 1
            return self._should_continue_execution(state)
        
        return step_type
    
    def _execute_classification(self, state: dict) -> dict:
        """Execute classification tool"""
        try:
            print(f"  🔍 Executing classification...")
            image_path = state["image_path"]
            
            result = self.tools["chest_xray_classifier"].invoke({"image_path": image_path})
            findings = state.get("findings", [])
            
            # Process classification results
            self._process_classification_findings(result, findings, {"image_path": image_path})
            
            state["findings"] = findings
            state["executed_tools"].append("chest_xray_classifier")
            state["completed_steps"].append("classification")
            state["current_step"] += 1
            
            print(f"    ✓ Classification complete, {len(findings)} findings total")
            
        except Exception as e:
            print(f"    ✗ Classification failed: {e}")
        
        return state
    
    def _execute_segmentation(self, state: dict) -> dict:
        """Execute segmentation tool"""
        try:
            print(f"  📏 Executing segmentation...")
            image_path = state["image_path"]
            
            result = self.tools["chest_xray_segmentation"].invoke({"image_path": image_path})
            findings = state.get("findings", [])
            
            # Process segmentation results
            self._process_segmentation_findings(result, findings, {"image_path": image_path})
            
            state["findings"] = findings
            state["executed_tools"].append("chest_xray_segmentation")
            state["completed_steps"].append("segmentation")
            state["current_step"] += 1
            
            print(f"    ✓ Segmentation complete, {len(findings)} findings total")
            
        except Exception as e:
            print(f"    ✗ Segmentation failed: {e}")
        
        return state
    
    def _execute_grounding(self, state: dict) -> dict:
        """Execute grounding tool"""
        try:
            plan = state.get("plan", [])
            current_step = state.get("current_step", 0)
            
            if current_step < len(plan):
                step_info = plan[current_step]
                phrase = step_info.get("phrase", "pneumothorax")  # Default phrase
                
                print(f"  🎯 Executing grounding for: {phrase}")
                image_path = state["image_path"]
                
                result = self.tools["xray_phrase_grounding"].invoke({
                    "image_path": image_path,
                    "phrase": phrase
                })
                findings = state.get("findings", [])
                
                # Process grounding results
                self._process_grounding_findings(result, findings, {"phrase": phrase})
                
                state["findings"] = findings
                state["executed_tools"].append(f"xray_phrase_grounding({phrase})")
                state["completed_steps"].append("grounding")
                state["current_step"] += 1
                
                print(f"    ✓ Grounding for {phrase} complete, {len(findings)} findings total")
            
        except Exception as e:
            print(f"    ✗ Grounding failed: {e}")
        
        return state
    
    def _execute_vqa(self, state: dict) -> dict:
        """Execute VQA tool"""
        try:
            if not self.has_vqa:
                state["completed_steps"].append("vqa")
                state["current_step"] += 1
                return state
            
            print(f"  🤔 Executing VQA...")
            image_path = state["image_path"]
            query = state["query"]
            
            # Generate appropriate VQA question based on query
            if "report" in query.lower():
                question = "What abnormalities are visible in this chest X-ray?"
            elif "abnormalities" in query.lower():
                question = "Describe any pathological findings in this chest X-ray."
            else:
                question = f"Based on this query: {query}, what can you observe in the chest X-ray?"
            
            result = self.tools["xray_vqa"].invoke({
                "image_path": image_path,
                "question": question
            })
            findings = state.get("findings", [])
            
            # Process VQA results
            self._process_vqa_findings(result, findings, {"question": question})
            
            state["findings"] = findings
            state["executed_tools"].append("xray_vqa")
            state["completed_steps"].append("vqa")
            state["current_step"] += 1
            
            print(f"    ✓ VQA complete, {len(findings)} findings total")
            
        except Exception as e:
            print(f"    ✗ VQA failed: {e}")
        
        return state
    
    def _synthesize_findings(self, state: dict) -> dict:
        """Synthesize all findings into final analysis"""
        print(f"  🔬 Synthesizing findings...")
        
        findings = state.get("findings", [])
        executed_tools = state.get("executed_tools", [])
        
        # Remove duplicates and consolidate findings
        consolidated_findings = self._consolidate_findings(findings)
        
        state["findings"] = consolidated_findings
        state["synthesis_complete"] = True
        
        print(f"    ✓ Synthesis complete: {len(consolidated_findings)} consolidated findings")
        print(f"    📊 Executed tools: {executed_tools}")
        
        return state
    
    def _consolidate_findings(self, findings: List[Finding]) -> List[Finding]:
        """Consolidate duplicate findings and enhance with multiple tool evidence"""
        if not findings:
            return findings
        
        # Group findings by pathology
        pathology_groups = {}
        for finding in findings:
            if isinstance(finding, dict):
                pathology = finding.get("pathology", "unknown")
                if pathology not in pathology_groups:
                    pathology_groups[pathology] = []
                pathology_groups[pathology].append(finding)
        
        # Consolidate each group
        consolidated = []
        for pathology, group in pathology_groups.items():
            if len(group) == 1:
                consolidated.extend(group)
            else:
                # Merge multiple findings for same pathology
                merged_finding = self._merge_findings(group)
                consolidated.append(merged_finding)
        
        return consolidated
    
    def _merge_findings(self, findings_group: List[Dict]) -> Dict:
        """Merge multiple findings for the same pathology"""
        if not findings_group:
            return {}
        
        # Use the finding with highest confidence as base
        base_finding = max(findings_group, key=lambda f: f.get("confidence", 0))
        
        # Combine evidence from all findings
        all_evidence = []
        all_measurements = {}
        max_confidence = 0
        
        for finding in findings_group:
            if finding.get("evidence"):
                all_evidence.append(finding["evidence"])
            if finding.get("measurements"):
                all_measurements.update(finding["measurements"])
            max_confidence = max(max_confidence, finding.get("confidence", 0))
        
        # Create merged finding
        merged = base_finding.copy()
        merged["confidence"] = max_confidence
        merged["evidence"] = " | ".join(all_evidence)
        merged["measurements"] = all_measurements if all_measurements else None
        
        return merged 
    
    def _execute_vcot_comprehensive_location_analysis(self, state: MultiAgentState, phrase: str, bbox: List[float], confidence: float) -> Optional[Dict]:
        """Execute V-CoT for comprehensive location analysis of all FindingLocation attributes"""
        try:
            if not self.vcot_module:
                return None
            
            print(f"    📍 V-CoT comprehensive location analysis for {phrase}")
            
            # Create evidence list with bounding box information
            from ..reasoning.visual_cot import VisualEvidence, VisualEvidenceType
            evidence_list = [
                VisualEvidence(
                    evidence_type=VisualEvidenceType.BOUNDING_BOX,
                    tool_name="grounding_tool",
                    confidence=confidence,
                    data={"bbox": bbox},
                    description=f"Grounded {phrase} at bounding box coordinates"
                )
            ]
            
            # V-CoT with comprehensive location analysis
            visual_cot_result = self.vcot_module.generate(
                image_path=state["image_path"],
                task=f"Analyze the precise anatomical location of {phrase}. "
                      f"Determine: 1) Anatomical side (left/right/bilateral/midline), "
                      f"2) Lung zone (upper/middle/lower/perihilar/peripheral/apical), "
                      f"3) Specific lobe if identifiable (RUL/RML/RLL/LUL/LLL), "
                      f"4) Position details (peripheral/central/hilar/pleural/subpleural). "
                      f"Provide clinical anatomical description.",
                target=f"anatomical location and regional distribution of {phrase}",
                evidence_list=evidence_list,
                roi_bbox=bbox,
                measurements={}
            )
            
            # Extract structured location from V-CoT result
            location_analysis = self._extract_location_from_vcot(visual_cot_result)
            
            return {
                "visual_cot": visual_cot_result,
                "location_analysis": location_analysis,
                "bbox": bbox
            }
            
        except Exception as e:
            print(f"Error in V-CoT comprehensive location analysis: {e}")
            return None
    
    def _execute_vcot_comprehensive_extent_analysis(self, state: MultiAgentState, phrase: str, bbox: List[float], confidence: float) -> Optional[Dict]:
        """Execute V-CoT for comprehensive extent analysis of all FindingExtent attributes"""
        try:
            if not self.vcot_module:
                return None
            
            print(f"    📏 V-CoT comprehensive extent analysis for {phrase}")
            
            # Create evidence list with bounding box information
            from ..reasoning.visual_cot import VisualEvidence, VisualEvidenceType
            evidence_list = [
                VisualEvidence(
                    evidence_type=VisualEvidenceType.BOUNDING_BOX,
                    tool_name="grounding_tool",
                    confidence=confidence,
                    data={"bbox": bbox},
                    description=f"Grounded {phrase} at bounding box coordinates"
                )
            ]
            
            # V-CoT with comprehensive extent analysis
            visual_cot_result = self.vcot_module.generate(
                image_path=state["image_path"],
                task=f"Analyze the extent and distribution pattern of {phrase}. "
                      f"Determine: 1) Distribution pattern (focal/multifocal/lobar/segmental/diffuse), "
                      f"2) Size category (small/moderate/large) with clinical context, "
                      f"3) Percentage of affected lung area (0-100%), "
                      f"4) Involvement pattern (limited/extensive/basal-predominant/upper-lobe/diffuse). "
                      f"Provide clinical extent assessment.",
                target=f"extent, distribution, and involvement pattern of {phrase}",
                evidence_list=evidence_list,
                roi_bbox=bbox,
                measurements={}
            )
            
            # Extract structured extent from V-CoT result
            extent_analysis = self._extract_extent_from_vcot(visual_cot_result)
            
            return {
                "visual_cot": visual_cot_result,
                "extent_analysis": extent_analysis,
                "bbox": bbox
            }
            
        except Exception as e:
            print(f"Error in V-CoT comprehensive extent analysis: {e}")
            return None
    
    def _extract_location_from_vcot(self, vcot_result) -> Optional[Dict]:
        """Extract structured location information from V-CoT analysis"""
        try:
            if hasattr(vcot_result, 'direct_visual_assessment'):
                assessment = vcot_result.direct_visual_assessment
            elif hasattr(vcot_result, 'full_reasoning'):
                assessment = vcot_result.full_reasoning
            else:
                assessment = str(vcot_result)
            
            assessment_lower = assessment.lower()
            
            # Extract side
            side = "unknown"
            if "left" in assessment_lower and "right" in assessment_lower:
                side = "bilateral"
            elif "left" in assessment_lower:
                side = "left"
            elif "right" in assessment_lower:
                side = "right"
            elif "midline" in assessment_lower or "central" in assessment_lower:
                side = "midline"
            
            # Extract zone
            zone = None
            zone_keywords = {
                "upper": ["upper", "apex", "apical"],
                "middle": ["middle", "mid"],
                "lower": ["lower", "base", "basal"],
                "perihilar": ["perihilar", "hilar", "hilum"],
                "peripheral": ["peripheral", "outer", "pleural"],
                "apical": ["apical", "apex"]
            }
            
            for zone_name, keywords in zone_keywords.items():
                if any(keyword in assessment_lower for keyword in keywords):
                    zone = zone_name
                    break
            
            # Extract lobe
            lobe = None
            lobe_keywords = {
                "RUL": ["right upper lobe", "rul"],
                "RML": ["right middle lobe", "rml"],
                "RLL": ["right lower lobe", "rll"],
                "LUL": ["left upper lobe", "lul"],
                "LLL": ["left lower lobe", "lll"]
            }
            
            for lobe_name, keywords in lobe_keywords.items():
                if any(keyword in assessment_lower for keyword in keywords):
                    lobe = lobe_name
                    break
            
            # Extract position
            position = None
            position_keywords = {
                "peripheral": ["peripheral", "outer", "pleural", "subpleural"],
                "central": ["central", "inner", "medial"],
                "hilar": ["hilar", "hilum", "perihilar"],
                "pleural": ["pleural", "pleural-based"],
                "subpleural": ["subpleural", "sub-pleural"]
            }
            
            for pos_name, keywords in position_keywords.items():
                if any(keyword in assessment_lower for keyword in keywords):
                    position = pos_name
                    break
            
            return {
                "side": side,
                "zone": zone,
                "lobe": lobe,
                "position": position,
                "confidence": getattr(vcot_result, 'final_confidence', 0.5),
                "assessment_text": assessment
            }
            
        except Exception as e:
            print(f"Error extracting location from V-CoT: {e}")
            return None
    
    def _extract_extent_from_vcot(self, vcot_result) -> Optional[Dict]:
        """Extract structured extent information from V-CoT analysis"""
        try:
            if hasattr(vcot_result, 'direct_visual_assessment'):
                assessment = vcot_result.direct_visual_assessment
            elif hasattr(vcot_result, 'full_reasoning'):
                assessment = vcot_result.full_reasoning
            else:
                assessment = str(vcot_result)
            
            assessment_lower = assessment.lower()
            
            # Extract distribution
            distribution = "unknown"
            distribution_keywords = {
                "focal": ["focal", "localized", "single"],
                "multifocal": ["multifocal", "multiple", "scattered"],
                "lobar": ["lobar", "entire lobe"],
                "segmental": ["segmental", "segment"],
                "diffuse": ["diffuse", "widespread", "extensive"]
            }
            
            for dist_name, keywords in distribution_keywords.items():
                if any(keyword in assessment_lower for keyword in keywords):
                    distribution = dist_name
                    break
            
            # Extract size
            size = None
            size_keywords = {
                "small": ["small", "minor", "limited", "minimal"],
                "moderate": ["moderate", "medium", "intermediate"],
                "large": ["large", "extensive", "significant", "major"]
            }
            
            for size_name, keywords in size_keywords.items():
                if any(keyword in assessment_lower for keyword in keywords):
                    size = size_name
                    break
            
            # Extract percentage
            percentage = None
            import re
            percentage_pattern = r'(\d+(?:\.\d+)?)\s*%'
            matches = re.findall(percentage_pattern, assessment)
            if matches:
                percentage = float(matches[0])
            
            # Extract involvement
            involvement = None
            involvement_keywords = {
                "limited": ["limited", "localized", "restricted"],
                "extensive": ["extensive", "widespread", "diffuse"],
                "basal-predominant": ["basal", "lower lobe", "base"],
                "upper-lobe": ["upper lobe", "apical", "upper"],
                "diffuse": ["diffuse", "bilateral", "throughout"]
            }
            
            for inv_name, keywords in involvement_keywords.items():
                if any(keyword in assessment_lower for keyword in keywords):
                    involvement = inv_name
                    break
            
            return {
                "distribution": distribution,
                "size": size,
                "percentage": percentage,
                "involvement": involvement,
                "confidence": getattr(vcot_result, 'final_confidence', 0.5),
                "assessment_text": assessment
            }
            
        except Exception as e:
            print(f"Error extracting extent from V-CoT: {e}")
            return None
    
    def _create_vcot_enhanced_finding_location(self, bbox: List[float], vcot_analysis: Optional[Dict] = None) -> FindingLocation:
        """Create FindingLocation with V-CoT enhancement when available"""
        # Start with basic geometric analysis
        basic_location = self._extract_location_from_bbox(bbox)
        
        # Enhance with V-CoT analysis if available
        if vcot_analysis and vcot_analysis.get("location_analysis"):
            vcot_loc = vcot_analysis["location_analysis"]
            
            return FindingLocation(
                side=vcot_loc.get("side", basic_location.side),
                zone=vcot_loc.get("zone", basic_location.zone),
                lobe=vcot_loc.get("lobe", basic_location.lobe),
                position=vcot_loc.get("position", basic_location.position)
            )
        
        return basic_location
    
    def _create_vcot_enhanced_finding_extent(self, bbox: List[float], vcot_analysis: Optional[Dict] = None) -> FindingExtent:
        """Create FindingExtent with V-CoT enhancement when available"""
        # Start with basic geometric analysis
        basic_extent = self._extract_extent_from_bbox(bbox)
        
        # Enhance with V-CoT analysis if available
        if vcot_analysis and vcot_analysis.get("extent_analysis"):
            vcot_ext = vcot_analysis["extent_analysis"]
            
            return FindingExtent(
                distribution=vcot_ext.get("distribution", basic_extent.distribution),
                size=vcot_ext.get("size", basic_extent.size),
                percentage=vcot_ext.get("percentage", basic_extent.percentage),
                involvement=vcot_ext.get("involvement", basic_extent.involvement)
            )
        
        return basic_extent
    
    def _enhance_findings_with_vcot_analysis(self, findings: List[Finding], location_analysis: Optional[Dict], extent_analysis: Optional[Dict], bboxes: List, task_id: str):
        """Enhance existing findings with V-CoT location and extent analysis"""
        if not findings or not bboxes:
            return
        
        # Find the most recent finding from this task
        for finding in reversed(findings):
            if isinstance(finding, dict) and finding.get("task_source") == task_id:
                
                # Enhance with V-CoT location analysis
                if location_analysis and location_analysis.get("location_analysis"):
                    vcot_loc = location_analysis["location_analysis"]
                    
                    enhanced_location = FindingLocation(
                        side=vcot_loc.get("side", finding["location_structured"].get("side", "unknown")),
                        zone=vcot_loc.get("zone", finding["location_structured"].get("zone")),
                        lobe=vcot_loc.get("lobe", finding["location_structured"].get("lobe")),
                        position=vcot_loc.get("position", finding["location_structured"].get("position"))
                    )
                    
                    finding["location_structured"] = enhanced_location.dict()
                    finding["vcot_location_confidence"] = vcot_loc.get("confidence", 0.5)
                    
                    # Add to evidence
                    finding["evidence"] += f" | V-CoT Location: {vcot_loc.get('side', 'unknown')} {vcot_loc.get('zone', '')} {vcot_loc.get('lobe', '')}"
                
                # Enhance with V-CoT extent analysis
                if extent_analysis and extent_analysis.get("extent_analysis"):
                    vcot_ext = extent_analysis["extent_analysis"]
                    
                    enhanced_extent = FindingExtent(
                        distribution=vcot_ext.get("distribution", finding["extent_structured"].get("distribution", "unknown")),
                        size=vcot_ext.get("size", finding["extent_structured"].get("size")),
                        percentage=vcot_ext.get("percentage", finding["extent_structured"].get("percentage")),
                        involvement=vcot_ext.get("involvement", finding["extent_structured"].get("involvement"))
                    )
                    
                    finding["extent_structured"] = enhanced_extent.dict()
                    finding["vcot_extent_confidence"] = vcot_ext.get("confidence", 0.5)
                    
                    # Add to evidence
                    finding["evidence"] += f" | V-CoT Extent: {vcot_ext.get('distribution', 'unknown')} {vcot_ext.get('size', '')} {vcot_ext.get('percentage', '')}%"
                
                # Mark as V-CoT enhanced
                finding["vcot_enhanced"] = True
                
                print(f"    ✅ Enhanced finding with V-CoT: {finding['pathology']}")
                break  # Only enhance the most recent finding from this task
    
    def _extract_confidence_value(self, conf: Any) -> float:
        """Safely extract confidence value from various formats"""
        if isinstance(conf, (int, float)):
            return float(conf)
        elif isinstance(conf, dict):
            return float(conf.get("value", 0))
        else:
            return 0.0