"""Airway specialist agent for tracheal and mediastinal analysis"""

from typing import List, Dict, Any, Optional, Union
from langchain_core.language_models import BaseLanguageModel
from langchain_core.prompts import ChatPromptTemplate
from pydantic import BaseModel, Field, ConfigDict
import json
from dataclasses import dataclass

from .base_abcde import ABCDEAgent
from ..orchestrator.state import MultiAgentState, AgentAnalysis, Finding
from ...tools import ChestXRayClassifierTool, ChestXRaySegmentationTool, XRayPhraseGroundingTool
from ..reasoning.visual_cot import BiasResistantVisualCoT, VisualEvidence, VisualEvidenceType

# '''
# Priority:
# High
# -- check_tracheal_position (Is trachea mid-line / deviated?)
# -- measure_tracheal_deviation
# -- detect_tracheal_pathology (pneumomediastinum, etc.)
# -- detect_pneumomediastinum

# Medium
# -- segment_tracheal_structures
# -- assess_tracheal_caliber
# -- assess_carina       (symmetry)
# -- measure_carina_angle
# -- check_main_bronchi
# -- detect_subcutaneous_emphysema
# -- visual_reasoning / cross_validate (verification)

# Low
# -- detect_bronchial_narrowing
# -- localize_carina, localize_abnormalities
# '''

@dataclass
class AirwayAgentConfig:
    """Configuration for AirwayAgent thresholds and parameters"""
    # Confidence thresholds
    pathology_report_threshold: float = 0.3
    high_confidence_threshold: float = 0.7
    
    # Measurement thresholds
    tracheal_deviation_threshold_mm: float = 5.0
    significant_deviation_mm: float = 10.0
    carina_angle_normal_max: float = 100.0
    
    # Tool availability strings (built once)
    tools_available_desc: str = ""


class AirwayTaskParameters(BaseModel):
    """Parameters for an airway task"""
    focus: Optional[str] = Field(default=None, description="Focus area for the task")
    phrase: Optional[str] = Field(default=None, description="Phrase to ground/localize")
    phrases: Optional[List[str]] = Field(default=None, description="Multiple phrases to ground")
    image_path: Optional[str] = Field(default=None, description="Path to the image")
    organs: Optional[List[str]] = Field(default=None, description="Organs to segment")
    
    model_config = ConfigDict(
        extra="forbid",
        populate_by_name=True  # Accept camelCase from external services
    )


class AirwaySubtask(BaseModel):
    """A single subtask in the airway analysis plan"""
    task_id: str = Field(description="Unique identifier for this subtask (e.g., 'check_tracheal_position', 'assess_carina', 'detect_mediastinal_masses')")
    description: str = Field(description="What this subtask accomplishes")
    tool: str = Field(description="Which tool to use: chest_xray_classifier, chest_xray_segmentation, or xray_phrase_grounding")
    parameters: AirwayTaskParameters = Field(default_factory=AirwayTaskParameters, description="Parameters for the tool")
    depends_on: List[str] = Field(default_factory=list, description="List of task_ids this task depends on")
    
    model_config = ConfigDict(
        extra="forbid",
        populate_by_name=True
    )


class AirwayPlan(BaseModel):
    """Dynamic plan for airway analysis"""
    subtasks: List[AirwaySubtask] = Field(description="Ordered list of subtasks to execute")
    reasoning: str = Field(description="Brief explanation of why this plan was chosen")
    
    model_config = ConfigDict(
        extra="forbid",
        populate_by_name=True
    )


class AirwayAgent(ABCDEAgent):
    """Specialist agent for airway and mediastinal findings with LangGraph-style flexible P&E mode"""
    
    def __init__(
        self, 
        llm: BaseLanguageModel,
        classification_tool: ChestXRayClassifierTool,
        segmentation_tool: ChestXRaySegmentationTool,
        grounding_tool: Optional[XRayPhraseGroundingTool] = None,
        vcot_module: Optional[Any] = None,
        config: Optional[AirwayAgentConfig] = None
    ):
        # Only include grounding tool if provided
        tools = [classification_tool, segmentation_tool]
        if grounding_tool:
            tools.append(grounding_tool)
            
        super().__init__(
            agent_name="AirwayAgent",
            llm=llm,
            tools=tools,
            mode="plan_execute",  # P&E mode with LLM-driven planning
            vcot_policy="on_low_conf"  # V-CoT on low confidence
        )
        self.vcot_module = vcot_module
        self.has_grounding = grounding_tool is not None
        self.config = config or AirwayAgentConfig()
        
        # Build tools description once
        self._build_tools_description()
        
        # Define subtask templates for the planner
        self.subtask_templates = self._define_subtask_templates()
        
        # Create structured planner
        self.planner = self._create_planner()
    
    def _build_tools_description(self):
        """Build tools description string once during init"""
        tools_desc = [
            "- chest_xray_classifier: Detects pathologies (pneumomediastinum, paratracheal masses, subcutaneous emphysema)",
            "- chest_xray_segmentation: Segments anatomical structures (e.g., Weasand, lungs) for position/measurement analysis"
        ]
        if self.has_grounding:
            tools_desc.append("- xray_phrase_grounding: AVAILABLE - Attempts to localize specific phrases/objects in the image")
        else:
            tools_desc.append("- xray_phrase_grounding: NOT AVAILABLE")
        
        self.config.tools_available_desc = "\n".join(tools_desc)
    
    def _define_subtask_templates(self) -> str:
        """Define available subtask templates for airway analysis"""
        templates = """
Available Airway Subtask Templates:

1. TRACHEAL ASSESSMENT:
   - check_tracheal_position: Assess if trachea is midline or deviated (use segmentation with "Weasand" - grounding not effective for trachea)
   - measure_tracheal_deviation: Quantify deviation from midline using segmentation
   - segment_tracheal_structures: Segment tracheal structures using "Weasand" organ
   - assess_tracheal_caliber: Evaluate tracheal narrowing or widening using segmentation
   - detect_tracheal_pathology: Detect tracheal pathologies using classification
   
2. CARINA AND BRONCHI:
   - assess_carina: Evaluate carina symmetry (use grounding: "carina")
   - measure_carina_angle: Measure carina angle (use grounding: "carina", "main bronchi")
   - check_main_bronchi: Assess main bronchi patency and symmetry (use grounding: "main bronchi")
   - detect_bronchial_narrowing: Look for luminal narrowing (use grounding for specific bronchi)
   
4. PNEUMOMEDIASTINUM:
   - detect_pneumomediastinum: Look for air in mediastinum
   - detect_subcutaneous_emphysema: Check for air in soft tissues
   
5. LOCALIZATION TASKS:
   - localize_carina: Identify carina location (use grounding)
   - localize_abnormalities: Find specific airway/mediastinal findings (use grounding)
   
6. VERIFICATION TASKS:
   - visual_reasoning: Apply V-CoT for uncertain findings
   - cross_validate: Compare findings across different tools

Remember: 
- IMPORTANT: Grounding tool is NOT effective for tracheal localization - use segmentation with "Weasand" for tracheal assessment
- NOTE: Mediastinal width assessment belongs to CardiacAgent per ABCDEF
- NOTE: Hilar vessel assessment belongs to CardiacAgent per ABCDEF C: Circulation  
- NOTE: Tubes and foreign devices belong to Everything_else_agent
- The system will automatically optimize organ selection based on the task
- Quantitative measurements provide objective assessment when possible"""
        
        return templates
    
# """
# △ 临床相关性中等。<br/>对肿瘤分期或感染评估有用，但对典型「Airway 急症」并非最高优先；不少机构把这部分放在 Mediastinum/Lymph node agent。
# 3. PARATRACHEAL ASSESSMENT:
#    - detect_paratracheal_masses: Identify paratracheal masses or lymphadenopathy
#    - assess_paratracheal_regions: Check paratracheal soft tissue abnormalities
#    - evaluate_paratracheal_lymph_nodes: Assess paratracheal lymphadenopathy
#    - assess_posterior_tracheal_stripe: Evaluate retro-tracheal space thickening
# """
    
    def _create_planner(self):
        """Create the LLM-based planner with structured output"""
        
        planner_prompt = ChatPromptTemplate.from_messages([
            ("system", """You are an airway and mediastinal imaging specialist planning an analysis workflow.
Given a query about airway/mediastinal findings, create a detailed plan using available tools.

{subtask_templates}

Tools available:
{tools_available}

IMPORTANT ORGAN MAPPING:
- Segmentation tool does NOT support "Trachea" directly
- Available organs: Left/Right Hilus Pulmonis, Mediastinum, Left/Right Lung, Heart, Aorta, Weasand, Spine
- For tracheal assessment: Use "Weasand" as closest approximation OR use grounding to locate "trachea" directly
- For airway structures: Prefer grounding tool over segmentation for accuracy

TOOL SELECTION GUIDELINES:
- chest_xray_classifier: Use for detecting pathologies (pneumomediastinum, masses, abnormalities)
- chest_xray_segmentation: Use for organ measurements when exact organ exists (Weasand for trachea approximation)
- xray_phrase_grounding: Use for non-tracheal airway structures ("carina", "main bronchi", "bronchus") - NOT effective for "trachea"

TASK TYPE GUIDANCE (flexible, not mandatory):
- TRACHEAL POSITION/LOCATION queries (e.g., "Is the trachea midline?", "Where is the trachea?"):
  → Use chest_xray_segmentation with "Weasand" organ (grounding not effective for tracheal localization)
  → Classification is NOT suitable for position assessment
- NON-TRACHEAL POSITION queries (e.g., "Where is the carina?", "Locate main bronchi"):
  → Consider xray_phrase_grounding for direct localization if structure is likely visible
  → Accept that some structures may not be localizable in certain images
- PATHOLOGY queries (e.g., "Is there pneumomediastinum?", "Any masses?"):
  → Use chest_xray_classifier for pathology detection
  → Optionally use grounding for localization if pathology is detected
- MEASUREMENT queries (e.g., "Measure tracheal deviation", "Carina angle"):
  → Use segmentation for quantitative measurements when structures are segmentable
  → Consider whether measurement is feasible given image quality and structure visibility

MEDICAL BEST PRACTICES:
- For tracheal position assessment, grounding is the primary method
- For tracheal deviation, always quantify the deviation from midline
- For paratracheal assessment, consider masses, lymphadenopathy, and stripe thickening
- For masses/lymphadenopathy, describe location, size, and characteristics
- Always check both tracheal position AND paratracheal structures comprehensively
- Carina assessment should include angle measurement when possible
- Consider pneumomediastinum in trauma or post-procedure cases
- NOTE: Mediastinal width belongs to CardiacAgent per ABCDEF - DO NOT assess it here
- NOTE: Hilar vessel assessment belongs to CardiacAgent per ABCDEF C: Circulation - DO NOT assess it here
- NOTE: Tubes and foreign devices belong to Everything_else_agent - DO NOT assess them here

Create a plan that:
1. Addresses the specific query requirements intelligently
2. Only calls tools when they can meaningfully contribute to answering the query
3. Considers whether the requested analysis is feasible given available tools and image characteristics
4. Accepts that some queries may not require tool usage or may not be answerable
5. Uses clinical reasoning to determine the most appropriate approach
6. Is efficient and avoids unnecessary or redundant tool calls

IMPORTANT: 
- Empty tool results may be clinically accurate (e.g., structure not visible/localizable)
- Not every query requires tool usage - use clinical judgment
- Tools should add value, not be called just because they're available"""),
            ("human", "Query: {query}\n\nCreate a plan to analyze the airway and mediastinal findings.")
        ])
        
        return planner_prompt | self.llm.with_structured_output(AirwayPlan)
    
    def get_react_prompt_template(self) -> str:
        """Not used for P&E mode"""
        return ""
    
    def create_plan(self, state: MultiAgentState) -> List[Dict[str, Any]]:
        """Create dynamic plan using LLM with structured output"""
        query = state.get("query", "")
        
        # If in comparison mode, modify query to avoid comparison within agent
        comparison_mode = state.get("comparison_mode")
        if comparison_mode:
            # Simplify query for single image analysis
            if "trachea" in query.lower():
                query = "Assess tracheal position and deviation"
            elif "airway" in query.lower():
                query = "Perform airway assessment with position analysis"
            else:
                query = "Perform airway and mediastinal assessment"
        
        try:
            # Use LLM to generate structured plan
            plan_response = self.planner.invoke({
                "query": query,
                "subtask_templates": self.subtask_templates,
                "tools_available": self.config.tools_available_desc
            })
            
            # Convert structured plan to execution format
            execution_plan = []
            
            for subtask in plan_response.subtasks:
                # Convert parameters to dict for execution
                params_dict = subtask.parameters.dict(exclude_none=True)
                
                execution_plan.append({
                    "task_id": subtask.task_id,
                    "description": subtask.description,
                    "tool": subtask.tool,
                    "parameters": params_dict,
                    "depends_on": subtask.depends_on
                })
            
            return execution_plan
            
        except Exception as e:
            print(f"Error in LLM planning for airway analysis, falling back: {e}")
            return self._get_fallback_plan(query)
    
    def _get_fallback_plan(self, query: str) -> List[Dict[str, Any]]:
        """Simple fallback plan if LLM planning fails - prefers minimal tool usage"""
        plan = []
        query_lower = query.lower()
        
        # For tracheal position queries, use segmentation (not grounding)
        if any(keyword in query_lower for keyword in ["trachea", "midline", "tracheal position"]):
            plan.append({
                "task_id": "assess_tracheal_position",
                "description": "Assess tracheal position using segmentation",
                "tool": "chest_xray_segmentation",
                "parameters": {"organs": ["Weasand"]},
                "depends_on": []
            })
        
        # For non-tracheal position queries, try grounding if available
        elif any(keyword in query_lower for keyword in ["carina", "bronchi", "position", "where", "located"]):
            if self.has_grounding:
                plan.append({
                    "task_id": "assess_airway_position",
                    "description": "Assess airway position using grounding",
                    "tool": "xray_phrase_grounding",
                    "parameters": {"phrase": "carina"},
                    "depends_on": []
                })
            else:
                plan.append({
                    "task_id": "assess_airway_position",
                    "description": "Assess airway position using segmentation",
                    "tool": "chest_xray_segmentation",
                    "parameters": {"organs": ["Left Hilus Pulmonis", "Right Hilus Pulmonis"]},
                    "depends_on": []
                })
        
        # For pathology queries, use classification
        elif any(keyword in query_lower for keyword in ["pneumomediastinum", "mass", "abnormal", "pathology"]):
            plan.append({
                "task_id": "assess_pathologies",
                "description": "Assess for airway/mediastinal pathologies",
                "tool": "chest_xray_classifier",
                "parameters": {},
                "depends_on": []
            })
        
        # If no specific query type detected, create minimal assessment plan
        else:
            plan.append({
                "task_id": "basic_airway_assessment",
                "description": "Basic airway assessment",
                "tool": "chest_xray_classifier",
                "parameters": {},
                "depends_on": []
            })
        
        return plan
    
    def analyze(self, state: MultiAgentState) -> MultiAgentState:
        """Execute the dynamically generated plan"""
        plan = self.create_plan(state)
        findings = []
        executed_plan = []
        measurements = {}
        task_results = {}
        
        # Execute plan with dependency handling
        for task in plan:
            task_id = task["task_id"]
            
            # Check dependencies
            deps_met = all(dep in task_results for dep in task.get("depends_on", []))
            if not deps_met:
                print(f"Skipping {task_id} - dependencies not met")
                continue
            
            # Execute task based on tool type
            if task["tool"] == "chest_xray_classifier":
                result = self._execute_classification_task(state, task, task_results)
            elif task["tool"] == "chest_xray_segmentation":
                result = self._execute_segmentation_task(state, task, task_results)
            elif task["tool"] == "xray_phrase_grounding":
                result = self._execute_grounding_task(state, task, task_results)
            else:
                result = {"success": False, "error": f"Unknown tool: {task['tool']}"}
            
            # Store result and process into findings
            task_results[task_id] = result
            executed_plan.append({
                "task_id": task_id,
                "description": task["description"],
                "result": result
            })
            
            self._process_task_results(state, task, result, findings, measurements)
        
        state["airway_analysis"] = AgentAnalysis(
            agent_name="AirwayAgent",
            findings=findings,
            plan_executed=executed_plan,
            react_steps=[],  # P&E mode doesn't use react steps
            visual_cot_triggered=any(f.get("visual_cot") for f in findings if isinstance(f, dict)),
            confidence_level=self._assess_confidence(findings),
            needs_human_review=self._needs_review(findings, measurements)
        )
        
        return state
    
    def _execute_classification_task(self, state: MultiAgentState, task: Dict, task_results: Dict) -> Dict:
        """Execute classification task"""
        try:
            tool = self.tools["chest_xray_classifier"]
            params = {"image_path": state["image_path"]}
            
            # Add focus if specified
            if "focus" in task.get("parameters", {}):
                params["focus"] = task["parameters"]["focus"]
            
            print(f"  Calling classifier with params: {params}")
            result = tool.invoke(params)
            
            # Handle tuple return from classification tool
            if isinstance(result, tuple):
                classification, metadata = result
                print(f"  Classification tool returned tuple, extracting classification results")
            else:
                classification = result
                metadata = {}
            
            # Convert numpy types to Python types for JSON serialization
            if isinstance(classification, dict):
                classification_clean = {}
                for k, v in classification.items():
                    if hasattr(v, 'item'):  # numpy scalar
                        classification_clean[k] = float(v.item())
                    else:
                        classification_clean[k] = float(v) if isinstance(v, (int, float)) else v
                classification = classification_clean
            
            print(f"  Classification results: {classification}")
            return {"success": True, "result": classification, "metadata": metadata, "tool": "classification"}
        except Exception as e:
            print(f"Error in classification task: {e}")
            import traceback
            traceback.print_exc()
            return {"success": False, "error": str(e)}
    
    def _execute_segmentation_task(self, state: MultiAgentState, task: Dict, task_results: Dict) -> Dict:
        """Execute segmentation task"""
        try:
            tool = self.tools["chest_xray_segmentation"]
            
            # Get organs from parameters or use optimal selection
            params = task.get("parameters", {})
            if "organs" in params and params["organs"]:
                organs = params["organs"]
            else:
                organs = self._get_optimal_organs_for_task(task["task_id"], task["description"])
            
            tool_params = {
                "image_path": state["image_path"],
                "organs": organs
            }
            
            print(f"  Calling segmentation with params: {tool_params}")
            result = tool.invoke(tool_params)
            
            # Handle tuple return from segmentation tool
            if isinstance(result, tuple):
                segmentation_data, metadata = result
                print(f"  Segmentation tool returned tuple, extracting segmentation data")
            else:
                segmentation_data = result
                metadata = {}
            
            print(f"  Segmentation result keys: {list(segmentation_data.keys()) if isinstance(segmentation_data, dict) else type(segmentation_data)}")
            return {"success": True, "result": segmentation_data, "metadata": metadata, "tool": "segmentation"}
        except Exception as e:
            print(f"Error in segmentation task: {e}")
            import traceback
            traceback.print_exc()
            return {"success": False, "error": str(e)}
    
    def _execute_grounding_task(self, state: MultiAgentState, task: Dict, task_results: Dict) -> Dict:
        """Execute grounding task with fallback phrases"""
        if not self.has_grounding:
            print(f"  Grounding tool not available for {task['task_id']}")
            return {"success": False, "error": "Grounding tool not available"}
        
        try:
            tool = self.tools["xray_phrase_grounding"]
            
            # Extract phrase(s) from parameters
            params = task.get("parameters", {})
            phrase = params.get("phrase")
            phrases = params.get("phrases", [])
            
            # Handle multiple phrases if specified by the planner
            if phrases:
                # Try multiple phrases as requested by the planner
                for test_phrase in phrases:
                    tool_params = {
                        "image_path": state["image_path"],
                        "phrase": test_phrase
                    }
                    
                    print(f"  Calling grounding with phrase: '{test_phrase}'")
                    result = tool.invoke(tool_params)
                    
                    # Check if grounding found anything
                    if isinstance(result, dict) and "predictions" in result:
                        num_predictions = len(result["predictions"]) if result["predictions"] else 0
                        print(f"  Grounding found {num_predictions} predictions for '{test_phrase}'")
                        
                        # If we found predictions, return this result
                        if num_predictions > 0:
                            return {"success": True, "result": result, "tool": "grounding", "phrase_used": test_phrase}
                
                # If no phrases worked, return the last result
                phrases_tried = ", ".join(phrases)
                return {"success": True, "result": result, "tool": "grounding", "phrase_used": f"tried: {phrases_tried}"}
            
            else:
                # Single phrase or default
                if not phrase:
                    # Simple default based on task
                    if "trachea" in task["task_id"].lower():
                        phrase = "trachea"
                    elif "carina" in task["task_id"].lower():
                        phrase = "carina"
                    elif "mediastin" in task["task_id"].lower():
                        phrase = "mediastinum"
                    else:
                        phrase = "airway"
                
                tool_params = {
                    "image_path": state["image_path"],
                    "phrase": phrase
                }
                
                print(f"  Calling grounding with phrase: '{phrase}'")
                result = tool.invoke(tool_params)
                
                # Check if grounding found anything
                if isinstance(result, dict) and "predictions" in result:
                    num_predictions = len(result["predictions"]) if result["predictions"] else 0
                    print(f"  Grounding found {num_predictions} predictions for '{phrase}'")
                
                return {"success": True, "result": result, "tool": "grounding", "phrase_used": phrase}
                
        except Exception as e:
            print(f"  Error in grounding task: {e}")
            return {"success": False, "error": str(e)}
    
    def _trigger_vcot(self, state: MultiAgentState, confidence: float, pathology: str, 
                     location: Optional[Any] = None, measurements: Optional[Dict] = None,
                     tool_name: str = "airway_tool", mask_data: Optional[Any] = None,
                     existing_visualization: Optional[str] = None,
                     evidence_list: Optional[List[VisualEvidence]] = None) -> Optional[Dict]:
        """
        Unified V-CoT trigger method using bias-resistant visual reasoning.
        
        This method implements a two-step process:
        1. Pure visual analysis without tool bias
        2. Tool evidence validation against visual observations
        """
        if not self.vcot_module or not self.should_trigger_vcot(confidence):
            return None
        
        try:
            # Use the new bias-resistant V-CoT if available
            if isinstance(self.vcot_module, BiasResistantVisualCoT):
                # Use provided evidence_list or create one
                if evidence_list is None:
                    evidence_list = []
                    
                    # Add segmentation evidence if mask data is provided
                    if mask_data is not None:
                        evidence_list.append(VisualEvidence(
                            evidence_type=VisualEvidenceType.SEGMENTATION_MASK,
                            tool_name=tool_name,
                            confidence=confidence,
                            data=mask_data,
                            description=f"Tool detected {pathology} with segmentation mask",
                            visualization_path=existing_visualization
                        ))
                    
                    # Add bounding box evidence if location is provided
                    if location and hasattr(location, '__iter__') and len(location) >= 4:
                        evidence_list.append(VisualEvidence(
                            evidence_type=VisualEvidenceType.BOUNDING_BOX,
                            tool_name=tool_name,
                            confidence=confidence,
                            data=location,
                            description=f"Tool localized {pathology} at bounding box coordinates",
                            visualization_path=existing_visualization
                        ))
                    
                    # Add measurement evidence if measurements are provided
                    if measurements:
                        evidence_list.append(VisualEvidence(
                            evidence_type=VisualEvidenceType.MEASUREMENT,
                            tool_name=tool_name,
                            confidence=confidence,
                            data=measurements,
                            description=f"Tool measured: {measurements}",
                            visualization_path=existing_visualization
                        ))
                    
                    # Add classification evidence 
                    evidence_list.append(VisualEvidence(
                        evidence_type=VisualEvidenceType.CLASSIFICATION_RESULT,
                        tool_name=tool_name,
                        confidence=confidence,
                        data={"pathology": pathology, "confidence": confidence},
                        description=f"Tool classified {pathology} with confidence {confidence:.2f}",
                        visualization_path=existing_visualization
                    ))
                
                # Determine target based on pathology
                target_mapping = {
                    "tracheal_deviation": "trachea and its position relative to midline",
                    "tracheal_position_normal": "trachea and its midline position",
                    "hilar_asymmetry": "hilar regions and their symmetry",
                    "pneumomediastinum": "mediastinal air collections",
                    "subcutaneous_emphysema": "subcutaneous air in soft tissues",
                    "carina_splaying": "carina and bronchial angle",
                    "tracheal_segmentation_verification": "tracheal segmentation mask accuracy",
                    "tracheal_localization_verification": "tracheal bounding box location accuracy",
                }
                
                target = target_mapping.get(pathology, f"airway structures related to {pathology}")
                
                # Extract ROI if location provided
                roi_bbox = None
                if location and hasattr(location, '__iter__') and len(location) >= 4:
                    roi_bbox = location
                
                # Use the new bias-resistant V-CoT
                result = self.vcot_module.generate(
                    image_path=state["image_path"],
                    task=f"Is the trachea midline?" if "tracheal" in pathology else f"Verify {pathology} finding in airway assessment",
                    target=target,
                    evidence_list=evidence_list,
                    roi_bbox=roi_bbox,
                    measurements=measurements or {}
                )
                
                return result
                
            else:
                # Fallback to old V-CoT interface for backward compatibility
                roi_bbox = None
                if location and hasattr(location, '__iter__') and len(location) >= 4:
                    roi_bbox = location
                
                result = self.vcot_module.generate(
                    image_path=state["image_path"],
                    roi_bbox=roi_bbox,
                    measurements=measurements or {},
                    task=f"Verify {pathology} finding",
                    confidence=confidence
                )
                
                return {"final_assessment": result}
                
        except Exception as e:
            print(f"Error in V-CoT: {e}")
            return None
    
    def _process_task_results(self, state: MultiAgentState, task: Dict, result: Dict, findings: List[Finding], 
                            measurements: Dict):
        """Process task results into findings"""
        if not result.get("success"):
            return
        
        tool_result = result.get("result", {})
        
        if result.get("tool") == "classification":
            # Process classification results for airway-relevant pathologies
            # Map to actual pathologies that exist in the classification model output
            # Note: Removed Mediastinal Widening as it belongs to CardiacAgent
            # Note: Removed Hilar Enlargement as it belongs to CardiacAgent per ABCDEF C: Circulation
            # Note: Removed Tubes/Foreign Devices as they belong to Everything_else_agent
            
            # Map airway-relevant pathologies to actual model outputs
            airway_pathology_mapping = {
                # Mediastinal abnormalities
                "Enlarged Cardiomediastinum": "enlarged_cardiomediastinum",  # Includes pneumomediastinum-like findings
                "Pneumothorax": "pneumothorax",  # Can affect airway/tracheal position
                "Emphysema": "emphysema",  # Can be related to subcutaneous emphysema
                
                # Mass/nodule that could be paratracheal
                "Mass": "paratracheal_mass",  # Could be paratracheal mass
                "Nodule": "paratracheal_nodule",  # Could be paratracheal nodule
                
                # Other airway-relevant findings
                "Atelectasis": "atelectasis",  # Can affect airway position
                "Consolidation": "consolidation",  # Can affect airway position
            }
            
            for model_pathology, airway_pathology in airway_pathology_mapping.items():
                confidence = tool_result.get(model_pathology, 0)
                if confidence > self.config.pathology_report_threshold:
                    
                    # Classification results already provide confidence scores
                    # No need for V-CoT verification since there's no visual output to verify
                    
                    findings.append(Finding(
                        pathology=airway_pathology,
                        confidence=confidence,
                        location=None,  # Will be filled by grounding if available
                        measurements=None,
                        visual_cot=None,  # No V-CoT for classification results
                        evidence=f"Classification confidence for {model_pathology}: {confidence:.3f}"
                    ))
        
        elif result.get("tool") == "segmentation":
            # Extract airway-relevant measurements from segmentation
            if "result" in result and isinstance(result["result"], dict):
                seg_result = result["result"]
                if "metrics" in seg_result:
                    metrics = seg_result["metrics"]
                    measurements.update(metrics)
                    
                    # Analyze tracheal position using Weasand as approximation
                    if "Weasand" in metrics:
                        weasand_metrics = metrics["Weasand"]
                        tool_confidence = weasand_metrics.get("confidence_score", 0.5)
                        
                        # Extract position from segmentation metrics
                        relative_pos = weasand_metrics.get("relative_position", {})
                        left_position = relative_pos.get("left", 0.5)
                        
                        # Get existing visualization path to reuse
                        existing_viz_path = seg_result.get("segmentation_image_path")
                        
                        # First, verify the segmentation mask if confidence is low
                        mask_visual_cot_result = None
                        final_confidence = tool_confidence
                        alternative_assessment = None
                        
                        if tool_confidence < self.config.high_confidence_threshold:
                            # Create evidence for V-CoT with clear tool conclusion
                            evidence_list = []
                            
                            # Add segmentation evidence with clear interpretation
                            tool_conclusion = "midline" if abs(left_position - 0.5) <= 0.05 else "deviated"
                            evidence_list.append(VisualEvidence(
                                evidence_type=VisualEvidenceType.SEGMENTATION_MASK,
                                tool_name="segmentation_tool",
                                confidence=tool_confidence,
                                data={"position": left_position, "interpretation": tool_conclusion},
                                description=f"Segmentation tool concluded: Trachea is {tool_conclusion} (position: {left_position:.3f}, confidence: {tool_confidence:.3f})",
                                visualization_path=existing_viz_path
                            ))
                            
                            visual_cot_result = self._trigger_vcot(
                                state, tool_confidence, "tracheal_segmentation_verification",
                                tool_name="segmentation_tool",
                                mask_data=weasand_metrics.get("mask_data"),
                                existing_visualization=existing_viz_path,
                                evidence_list=evidence_list
                            )
                            
                            if visual_cot_result:
                                mask_visual_cot_result = visual_cot_result
                                final_confidence = visual_cot_result.final_confidence
                                alternative_assessment = visual_cot_result.alternative_assessment
                        
                        # Now create findings based on V-CoT agreement
                        if mask_visual_cot_result and mask_visual_cot_result.tool_agreement == "disagrees":
                            # V-CoT disagrees with tool - use V-CoT's direct assessment
                            direct_assessment = mask_visual_cot_result.direct_visual_assessment
                            
                            # Determine pathology based on V-CoT's direct assessment
                            if direct_assessment and any(word in direct_assessment.lower() for word in ["deviat", "shift", "displaced"]):
                                pathology = "tracheal_deviation"
                            else:
                                pathology = "tracheal_position_normal"
                            
                            findings.append(Finding(
                                pathology=pathology,
                                confidence=final_confidence,
                                location=None,
                                measurements={
                                    "tool_position": left_position,
                                    "tool_confidence": tool_confidence,
                                    "tool_conclusion": tool_conclusion,
                                    "vcot_disagreement": True,
                                    "vcot_direct_assessment": direct_assessment
                                },
                                visual_cot=mask_visual_cot_result.full_reasoning,
                                evidence=f"V-CoT independent assessment: {direct_assessment}. Disagrees with tool conclusion of '{tool_conclusion}' (position: {left_position:.3f})"
                            ))
                        else:
                            # V-CoT agrees or is uncertain - use tool measurements with adjusted confidence
                            if abs(left_position - 0.5) > 0.05:  # Threshold for significant deviation
                                deviation_direction = "right" if left_position > 0.55 else "left"
                                deviation_magnitude = abs(left_position - 0.5)
                                
                                findings.append(Finding(
                                    pathology="tracheal_deviation",
                                    confidence=final_confidence,  # Use V-CoT adjusted confidence
                                    location=None,
                                    measurements={
                                        "relative_position": left_position, 
                                        "deviation_direction": deviation_direction,
                                        "tool_confidence": tool_confidence,
                                        "final_confidence": final_confidence,
                                        "deviation_magnitude": deviation_magnitude
                                    },
                                    visual_cot=mask_visual_cot_result.full_reasoning if mask_visual_cot_result else None,
                                    evidence=f"Tracheal deviation {deviation_direction} detected using Weasand approximation (position: {left_position:.3f}, tool_confidence: {tool_confidence:.3f}, final_confidence: {final_confidence:.3f})"
                                ))
                            else:
                                # Trachea is midline - measurements calculated from same mask
                                position_certainty = 1.0 - abs(left_position - 0.5) / 0.05
                                
                                findings.append(Finding(
                                    pathology="tracheal_position_normal",
                                    confidence=final_confidence,  # Use V-CoT adjusted confidence
                                    location=None,
                                    measurements={
                                        "relative_position": left_position, 
                                        "position": "midline",
                                        "tool_confidence": tool_confidence,
                                        "final_confidence": final_confidence,
                                        "position_certainty": position_certainty
                                    },
                                    visual_cot=mask_visual_cot_result.full_reasoning if mask_visual_cot_result else None,
                                    evidence=f"Trachea is midline using Weasand approximation (position: {left_position:.3f}, tool_confidence: {tool_confidence:.3f}, final_confidence: {final_confidence:.3f})"
                                ))
                    
                    # Analyze hilar symmetry
                    if "Left Hilus Pulmonis" in metrics and "Right Hilus Pulmonis" in metrics:
                        left_hilus = metrics["Left Hilus Pulmonis"]
                        right_hilus = metrics["Right Hilus Pulmonis"]
                        
                        # Compare hilar sizes
                        left_area = left_hilus.get("area_pixels", 0)
                        right_area = right_hilus.get("area_pixels", 0)
                        
                        if left_area > 0 and right_area > 0:
                            size_ratio = max(left_area, right_area) / min(left_area, right_area)
                            
                            if size_ratio > 1.5:  # Threshold for asymmetry
                                larger_side = "left" if left_area > right_area else "right"
                                confidence = min(0.8, (size_ratio - 1.0) / 2.0)
                                
                                # Size ratio is a mathematical calculation from segmentation masks
                                # Uses the mask verification from above, no separate V-CoT needed
                                
                                findings.append(Finding(
                                    pathology="hilar_asymmetry",
                                    confidence=confidence,
                                    location=None,
                                    measurements={"size_ratio": size_ratio, "larger_side": larger_side},
                                    visual_cot=None,  # Uses mask verification, not measurement verification
                                    evidence=f"Hilar asymmetry detected - {larger_side} hilus larger (ratio: {size_ratio:.1f})"
                                ))
                    
                    # Check for any enhanced measurements from segmentation tool
                    # (These would be added by the segmentation tool if it had airway-specific algorithms)
                    if "TrachealDeviation" in metrics:
                        deviation_data = metrics["TrachealDeviation"]
                        deviation = deviation_data.get("value_mm", 0)
                        if deviation_data.get("significant", False):
                            confidence = min(0.9, abs(deviation) / 20)
                            
                            # Enhanced measurement - no separate V-CoT needed (uses mask verification from above)
                            
                            findings.append(Finding(
                                pathology="tracheal_deviation",
                                confidence=confidence,
                                location=None,
                                measurements={"deviation_mm": deviation},
                                visual_cot=None,  # Uses mask verification from above, not measurement verification
                                evidence=f"Tracheal deviation: {deviation:.1f}mm {deviation_data.get('direction', '')} from midline"
                            ))
                    
                    if "CarinaAngle" in metrics:
                        angle_data = metrics["CarinaAngle"]
                        angle = angle_data.get("value_degrees", 0)
                        if angle_data.get("abnormal", False):
                            confidence = min(0.9, (angle - 100) / 40)
                            
                            # Enhanced measurement - no separate V-CoT needed (calculated from segmentation)
                            
                            findings.append(Finding(
                                pathology="carina_splaying",
                                confidence=confidence,
                                location=None,
                                measurements={"angle_degrees": angle},
                                visual_cot=None,  # Uses segmentation verification, not measurement verification
                                evidence=f"Carina angle: {angle:.1f}° (normal < {self.config.carina_angle_normal_max}°)"
                            ))
        
        elif result.get("tool") == "grounding":
            # Process grounding results for airway structures
            if "result" in result and isinstance(result["result"], dict):
                grounding_result = result["result"]
                
                # Handle direct tracheal grounding
                if "predictions" in grounding_result:
                    # Check if any predictions were found
                    if grounding_result["predictions"]:
                        for pred in grounding_result["predictions"]:
                            phrase = pred.get("phrase", "").lower()
                            bbox_data = pred.get("bounding_boxes", {}).get("image_coordinates", [])
                            confidence = pred.get("confidence", 0.5)
                            
                            if bbox_data and bbox_data[0]:
                                bbox = bbox_data[0]
                                
                                # Analyze tracheal position from grounding
                                if "trachea" in phrase:
                                    # Calculate deviation from image center
                                    image_center_x = state.get("image_width", 512) / 2  # Approximate
                                    trachea_center_x = (bbox[1] + bbox[3]) / 2  # (min_x + max_x) / 2
                                    
                                    deviation_pixels = abs(trachea_center_x - image_center_x)
                                    # Rough conversion to mm (assuming ~0.2mm/pixel)
                                    deviation_mm = deviation_pixels * 0.2
                                    
                                    # Always report tracheal position
                                    if deviation_mm <= 5.0:  # Midline threshold
                                        findings.append(Finding(
                                            pathology="tracheal_position_normal",
                                            confidence=confidence,
                                            location=bbox,
                                            measurements={"deviation_mm": deviation_mm, "position": "midline"},
                                            visual_cot=None,
                                                                                    evidence=f"Trachea is midline (deviation: {deviation_mm:.1f}mm from center, grounded with '{result.get('phrase_used', 'unknown')}')"
                                    ))
                                    else:  # Deviated
                                        direction = "right" if trachea_center_x > image_center_x else "left"
                                        
                                        # V-CoT should verify the bounding box location, not the measurement calculation
                                        existing_viz_path = grounding_result.get("visualization_path")
                                        visual_cot_result = self._trigger_vcot(
                                            state, confidence, "tracheal_localization_verification",
                                            location=bbox,
                                            tool_name="grounding_tool",
                                            existing_visualization=existing_viz_path
                                        )
                                        
                                        # Handle structured V-CoT result
                                        visual_cot = None
                                        final_confidence = confidence
                                        if visual_cot_result:
                                            visual_cot = visual_cot_result.full_reasoning
                                            final_confidence = visual_cot_result.final_confidence
                                            
                                            # If V-CoT disagrees with grounding result
                                            if visual_cot_result.tool_agreement == "disagrees":
                                                findings.append(Finding(
                                                    pathology="tracheal_localization_uncertain",
                                                    confidence=final_confidence,
                                                    location=bbox,
                                                    measurements={"deviation_mm": deviation_mm, "direction": direction, "vcot_disagreement": True},
                                                    visual_cot=visual_cot,
                                                    evidence=f"Grounding tool located trachea but V-CoT assessment disagrees: {visual_cot_result.alternative_assessment or 'Visual analysis contradicts bounding box location'}"
                                                ))
                                                continue  # Skip normal finding creation
                                        
                                        findings.append(Finding(
                                            pathology="tracheal_deviation",
                                            confidence=final_confidence,
                                            location=bbox,
                                            measurements={"deviation_mm": deviation_mm, "direction": direction, "tool_confidence": confidence, "final_confidence": final_confidence},
                                            visual_cot=visual_cot,
                                            evidence=f"Tracheal deviation {direction}: {deviation_mm:.1f}mm from midline (grounded with '{result.get('phrase_used', 'unknown')}', final_confidence: {final_confidence:.3f})"
                                        ))
                                
                                # Analyze carina findings
                                elif "carina" in phrase:
                                    # Store carina location for angle calculations
                                    measurements[f"carina_location"] = bbox
                                    
                                    findings.append(Finding(
                                        pathology="carina_identified",
                                        confidence=confidence,
                                        location=bbox,
                                        measurements=None,
                                        visual_cot=None,
                                        evidence=f"Carina located at coordinates {bbox} (grounded)"
                                    ))
                                
                                # Update location for existing findings
                                for finding in findings:
                                    if isinstance(finding, dict) and phrase in finding.get("pathology", ""):
                                        finding["location"] = bbox
                    else:
                        # No grounding predictions found - this is a valid medical result
                        # The absence of findings may indicate the structure is not clearly visible or localizable
                        phrase_used = result.get("phrase_used", "unknown")
                        if "trachea" in task.get("task_id", "").lower():
                            findings.append(Finding(
                                pathology="trachea_not_localizable",
                                confidence=0.7,  # High confidence that it's not visible/localizable
                                location=None,
                                measurements=None,
                                visual_cot=None,
                                evidence=f"Trachea could not be localized in this image using phrase '{phrase_used}' - may not be clearly visible"
                            ))
    
    def _needs_review(self, findings: List[Finding], measurements: Dict) -> bool:
        """Determine if human review is needed"""
        # Review needed for significant airway abnormalities
        for finding in findings:
            if isinstance(finding, dict):
                pathology = finding.get("pathology", "")
                confidence = self._extract_confidence_value(finding.get("confidence", 0))
                
                # High confidence critical findings
                if pathology in ["tracheal_deviation", "pneumomediastinum", "subcutaneous_emphysema"]:
                    if confidence > self.config.high_confidence_threshold:
                        return True
        
        # Review for concerning measurements
        if measurements.get("tracheal_deviation", 0) > self.config.significant_deviation_mm:
            return True
        if measurements.get("carina_angle", 0) > self.config.carina_angle_normal_max + 20:
            return True
        
        return False
    
    def _assess_confidence(self, findings: List[Finding]) -> str:
        """Assess overall confidence level"""
        if not findings:
            return "high"
        
        confidences = [self._extract_confidence_value(f.get("confidence", 0)) for f in findings if isinstance(f, dict)]
        if not confidences:
            return "high"
        
        avg_confidence = sum(confidences) / len(confidences)
        
        if avg_confidence >= self.config.high_confidence_threshold:
            return "high"
        elif avg_confidence >= 0.4:
            return "medium"
        else:
            return "low"
    
    def _get_optimal_organs_for_task(self, task_id: str, task_description: str) -> List[str]:
        """Get optimal organ list for segmentation based on task"""
        task_lower = task_id.lower() + " " + task_description.lower()
        
        # Use Weasand as closest approximation to trachea when segmentation is needed
        organs = []
        
        # For tracheal/airway assessment - use Weasand as closest approximation AND lungs for midline calculation
        if any(keyword in task_lower for keyword in ["trachea", "airway", "midline", "deviation"]):
            organs.append("Weasand")  # Closest available to trachea
            organs.extend(["Left Lung", "Right Lung"])  # Required for tracheal deviation calculation
        
        # For bronchi assessment - use hilus pulmonis 
        if any(keyword in task_lower for keyword in ["bronchi", "carina"]):
            organs.extend(["Left Hilus Pulmonis", "Right Hilus Pulmonis"])
            if "Left Lung" not in organs:
                organs.extend(["Left Lung", "Right Lung"])
        
        # Add aorta and mediastinum for paratracheal assessment
        if any(keyword in task_lower for keyword in ["paratracheal", "mediastinal"]):
            organs.extend(["Aorta", "Mediastinum"])
        
        # For comprehensive assessment
        if any(keyword in task_lower for keyword in ["comprehensive", "full"]):
            organs = ["Weasand", "Left Hilus Pulmonis", "Right Hilus Pulmonis", 
                      "Mediastinum", "Left Lung", "Right Lung", "Aorta"]
        
        # Fallback if no organs selected
        if not organs:
            organs = ["Weasand", "Left Lung", "Right Lung"]
        
        return list(set(organs))  # Remove duplicates
    
    def _extract_confidence_value(self, conf: Any) -> float:
        """Safely extract confidence value from various formats"""
        if isinstance(conf, (int, float)):
            return float(conf)
        elif isinstance(conf, dict):
            return float(conf.get("value", 0))
        else:
            return 0.0 