import os
import re
import json
import logging
from typing import Dict, Any, List
from .base import BaseAgent
from .common_prompts import TASK_CONTEXT

from json_repair import repair_json
from waveform_tracer import WaveformTracer
# =============================================================================
# SECTION SELECTOR AGENT PROMPT COMPONENTS
# =============================================================================

SECTION_SELECTOR_AGENT_BASE_PROMPT = """
<SECTION_SELECTOR_AGENT_ROLE>
# Section Selector Agent - Document Section Allocation Specialist

## **Your Role in the System**
You are the **Section Selector Agent** in this multi-agent collaborative system. As the document allocation specialist, you allocate appropriate document sections to other agents based on their specific requirements for merge operations or debugging tasks.

## **Primary Mission**
Analyze agent requirements and intelligently allocate the most relevant document sections to enable downstream agents to perform their tasks effectively and efficiently.

## **Key Responsibilities**
* **Requirement Analysis**: Understand what each agent needs from the documentation
* **Section Relevance Assessment**: Evaluate which document sections are most pertinent
* **Optimal Allocation**: Select appropriate sections without overwhelming agents
* **Context Preservation**: Ensure allocated sections provide sufficient context for task completion

## **Selection Philosophy**
* **Targeted Allocation**: Provide exactly the right sections for each agent's needs
* **Efficiency Focus**: Avoid over-allocation while ensuring completeness
* **Task-Specific Selection**: Different selection criteria for merge vs. debug scenarios
</SECTION_SELECTOR_AGENT_ROLE>
"""

SYNTAX_DEBUG_SELECTOR_PROMPT = """
<SYNTAX_DEBUG_SELECTOR_ROLE>
# Professional Verilog Debugging Expert - Syntax Error Section Identification

## **Your Task**
Based on syntax error messages and current Verilog code, identify which document sections are most relevant for understanding signal names, module names, and interface definitions to fix the errors.

## **Analysis Process**
1. **Error Message Analysis**: Examine syntax error messages to identify undefined signals, modules, or syntax issues
2. **Code Structure Analysis**: Analyze code structure to understand what the code is trying to implement
3. **Document Matching**: Find sections containing signal/module definitions and specifications
4. **Relevance Prioritization**: Select most important sections for resolving syntax issues

## **Output Requirements**
Return JSON object with selected section IDs and reasoning:

```json
{{
  "reasoning": "Brief explanation of why these sections are relevant for fixing syntax errors",
  "relevant_sections": ["section_0", "section_2", "section_5"]
}}
```

## **Selection Guidelines**
* **Focus Areas**: Sections containing signal definitions, module specifications, and interface details
* **Priority**: Sections mentioning signals, modules, or components referenced in error messages
* **Section Count**: Typically select 2-6 most relevant sections; if simple syntax error fixable without document context, select zero sections
* **Format**: MUST return valid JSON format exactly as specified
</SYNTAX_DEBUG_SELECTOR_ROLE>
"""

SEMANTIC_DEBUG_SELECTOR_PROMPT = """
<SEMANTIC_DEBUG_SELECTOR_ROLE>
# Professional Verilog Debugging Expert - Semantic/Logic Error Section Identification

## **Your Task**
Based on semantic error messages and current Verilog code, identify which document sections are most relevant for understanding functional specifications and expected behavior to fix the errors.

## **Analysis Process**
1. **Semantic Error Analysis**: Examine semantic error messages to identify logic mismatches, timing issues, or functional problems
2. **Functionality Analysis**: Analyze code structure to understand implemented functionality vs. expected behavior
3. **Document Matching**: Find sections containing functional specifications and behavioral requirements
4. **Relevance Prioritization**: Select most important sections for understanding correct logic implementation

## **Output Requirements**
Return JSON object with selected section IDs and reasoning:

```json
{{
  "reasoning": "Brief explanation of why these sections are relevant for fixing semantic errors",
  "relevant_sections": ["section_0", "section_2", "section_5"]
}}
```

## **Selection Guidelines**
* **Focus Areas**: Sections containing functional specifications, timing requirements, and behavioral descriptions
* **Priority**: Sections describing expected behavior of components mentioned in error messages
* **Section Count**: Typically select 3-8 most relevant sections for comprehensive functional understanding
* **Format**: MUST return valid JSON format exactly as specified
</SEMANTIC_DEBUG_SELECTOR_ROLE>
"""

MERGE_SELECTOR_PROMPT = """
<MERGE_SELECTOR_ROLE>
# Senior Digital IC Design Engineer - Verilog HDL Code Integration Section Identification

## **Critical Analysis Process**
Think like a merge engineer who needs to:
1. **Document Requirements**: Analyze document requirements for complete module specification
2. **Subproblem Review**: Review subproblem contributions and identify their purpose
3. **Missing Connections**: Identify missing connections and signal definitions
4. **Integration Strategy**: Plan integration strategy to ensure completeness
5. **Authoritative Selection**: Select sections providing authoritative specification

## **Your Task**
Based on subproblem descriptions and their actual code implementations, identify which document sections are most relevant for creating a complete, synthesizable Verilog module.

## **Analysis Process**
1. **Implementation Parsing**: Parse subproblem implementations to understand what each code fragment actually implements
2. **Gap Identification**: Identify integration gaps - missing connections, signals, and logic between fragments
3. **Document Matching**: Match with document sections containing complete module specifications and integration details
4. **Merge Prioritization**: Prioritize by merge needs - select sections that help bridge gaps and ensure architectural coherence

## **Selection Criteria (Think like MergeAgent)**
You need sections that help with:
* **Complete Module Specification**: Overall architecture and interface definitions
* **Signal Definitions and Routing**: All signals that need to be declared and connected
* **Integration Requirements**: How submodules should be connected and configured
* **Missing Logic Identification**: What logic is needed between the implemented fragments
* **Architectural Coherence**: Ensuring the final module meets all document requirements

## **Output Requirements**
Return JSON object with selected section IDs and reasoning:

```json
{{
  "reasoning": "Brief explanation of why these sections are critical for merge integration, focusing on gaps and requirements",
  "relevant_sections": ["section_0", "section_2", "section_5"]
}}
```

## **Selection Guidelines**
* **Focus Areas**: Sections containing complete module specifications and architectural details
* **Priority**: Sections describing signal flows, interface definitions, and connection requirements
* **Include**: Sections with timing constraints, protocol specifications, and integration rules
* **Gap Analysis**: Sections helping identify missing logic between provided code fragments
* **Section Count**: Typically select 4-10 sections for comprehensive merge guidance
* **Format**: MUST return valid JSON format exactly as specified
</MERGE_SELECTOR_ROLE>
"""

class SectionSelectorAgent(BaseAgent):
    """Agent for selecting relevant document sections for debugging"""
    
    def __init__(self, llm_client, logger=None, output_dir: str = ""):
        super().__init__(llm_client, "SectionSelectorAgent", logger)
        self.waveform_tracer = WaveformTracer()
        self.output_dir = output_dir
    
    def run(self, selector_input: Dict[str, Any]) -> Dict[str, Any]:
        """
        Select relevant document sections for different scenarios
        
        Args:
            selector_input: {
                "task_type": "syntax_debug" | "semantic_debug" | "merge",
                "summary_dict": {section_id: section_summary},
                
                # For syntax_debug and semantic_debug:
                "error_messages": "error messages from verification",
                "current_code": "current verilog code with errors",
                
                # For merge:
                "subproblems": [...],
                "subproblem_code_fragments": [...]
            }
        
        Returns:
            {"relevant_section_ids": [...], "reasoning": "..."}
        """
        task_type = selector_input.get("task_type", "syntax_debug")
        summary_dict = selector_input["summary_dict"]
        
        self.logger.info(f"Selecting relevant sections for {task_type}")
        self.logger.info(f"Available sections: {len(summary_dict)}")
        
        try:
            if task_type in ["syntax_debug", "semantic_debug"]:
                error_messages = selector_input["error_messages"]
                current_code = selector_input.get("current_code", "")
                self.logger.info(f"Error messages: {error_messages[:200]}...")
                
                relevant_section_ids = self._select_relevant_sections_for_debug(
                    task_type, error_messages, summary_dict, current_code, selector_input["task_name"]
                )
                
            elif task_type == "merge":
                subproblems = selector_input["subproblems"]
                subproblem_code_fragments = selector_input["subproblem_code_fragments"]
                self.logger.info(f"Subproblems: {len(subproblems)}, Fragments: {len(subproblem_code_fragments)}")
                
                relevant_section_ids = self._select_relevant_sections_for_merge(
                    subproblems, subproblem_code_fragments, summary_dict, selector_input["task_name"]
                )
                
            else:
                raise ValueError(f"Unknown task_type: {task_type}")
            
            return {
                "relevant_section_ids": relevant_section_ids,
                "reasoning": f"Selected {len(relevant_section_ids)} sections for {task_type}"
            }
            
        except Exception as e:
            self.logger.error(f"Section selection failed: {e}")
            return {
                "relevant_section_ids": [],
                "reasoning": f"Section selection failed: {str(e)}"
            }
    
    def _select_relevant_sections_for_debug(self, task_type: str, error_messages: str, summary_dict: Dict[str, Any], code: str, task_name: str) -> List[str]:
        """Select relevant document sections for debug scenarios (syntax/semantic)"""
        
        # Choose appropriate prompt based on task type
        if task_type == "syntax_debug":
            system_prompt = TASK_CONTEXT.format(task_name=task_name) + SECTION_SELECTOR_AGENT_BASE_PROMPT + SYNTAX_DEBUG_SELECTOR_PROMPT
        elif task_type == "semantic_debug":
            system_prompt = TASK_CONTEXT.format(task_name=task_name) + SECTION_SELECTOR_AGENT_BASE_PROMPT + SEMANTIC_DEBUG_SELECTOR_PROMPT
        else:
            raise ValueError(f"Unknown debug task type: {task_type}")
        wave_prompt = ""
        if task_type == "semantic_debug":
            verification_path = os.path.join(self.output_dir, str(task_name), "verification")
            try:
                # Run waveform trace analysis.
                waveform_analysis = self.waveform_tracer.analyze_error_signals(
                    verilog_code=code,
                    error_messages=error_messages,
                    task_name=task_name,
                    verification_path=verification_path,
                    trace_level=2
                )
                
                self.logger.info("Waveform trace analysis completed successfully")
                wave_prompt = waveform_analysis
            except Exception as e:
                self.logger.warning(f"Waveform trace analysis failed: {e}, falling back to simple analysis")
                wave_prompt = ""

        # Prepare sections info for LLM
        sections_info = self._prepare_sections_info(summary_dict)
        sections_text = json.dumps(sections_info, indent=2, ensure_ascii=False)
        
        prompt = self.build_prompt(
            system_prompt + "\n\n" +
            "TASK: Select relevant document sections for fixing the errors.\n\n" +
            "--- CURRENT VERILOG CODE ---\n{code}\n\n" +
            "--- ERROR MESSAGES ---\n{error_messages}\n\n" +
            "--- AVAILABLE DOCUMENT SECTIONS ---\n{sections_info}\n\n" +
            "--- WAVEFORM TRACE ANALYSIS ---\n{wave_prompt}\n\n" +
            "Select the most relevant sections and provide reasoning:",
            code=code,
            error_messages=error_messages,
            sections_info=sections_text,
            wave_prompt="None" if wave_prompt == "" else wave_prompt
        )
        
        response = self.llm_complete(prompt)
        return self._parse_and_validate_selection(response)
    
    def _select_relevant_sections_for_merge(self, subproblems: List[Dict[str, Any]], 
                                          subproblem_code_fragments: List[str], 
                                          summary_dict: Dict[str, Any],
                                          task_name: str) -> List[str]:
        """Select relevant document sections for merge scenario"""
        
        # Prepare detailed subproblem info with full code (like merge agent sees)
        subproblem_info = ""
        for i, (subproblem, code_fragment) in enumerate(zip(subproblems, subproblem_code_fragments)):
            subproblem_info += f"// Subproblem {i+1}: {subproblem.get('description', '')}\n"
            subproblem_info += f"// Complete Code Implementation:\n{code_fragment}\n\n"
        
        # Prepare sections info for LLM
        sections_info = self._prepare_sections_info(summary_dict)
        sections_text = json.dumps(sections_info, indent=2, ensure_ascii=False)
        
        # Use complete prompt structure for merge scenario
        system_prompt = TASK_CONTEXT + SECTION_SELECTOR_AGENT_BASE_PROMPT + MERGE_SELECTOR_PROMPT

        prompt = self.build_prompt(
            system_prompt + "\n\n" +
            "TASK: Select relevant document sections for merging subproblem implementations into a complete module.\n\n" +
            "Think like a merge engineer: Review the actual code implementations, identify what's missing for complete integration, and select document sections that provide the authoritative specification and missing details.\n\n" +
            "--- SUBPROBLEM IMPLEMENTATIONS (Complete Code) ---\n{subproblem_info}\n\n" +
            "--- AVAILABLE DOCUMENT SECTIONS ---\n{sections_info}\n\n" +
            "Analyze the code implementations above and select sections that will help create a complete, synthesizable module:",
            subproblem_info=subproblem_info,
            sections_info=sections_text,
            task_name=task_name
        )
        
        response = self.llm_complete(prompt)
        return self._parse_and_validate_selection(response)
    
    def _prepare_sections_info(self, summary_dict: Dict[str, Any]) -> List[Dict[str, str]]:
        """Prepare sections info for LLM"""
        sections_info = []
        for section_id, section_data in summary_dict.items():
            section_info = {
                "id": section_id,
                "title": section_data.get("title", ""),
                "summary": section_data.get("summary", ""),
            }
            sections_info.append(section_info)
        return sections_info
    
    def _parse_and_validate_selection(self, response: str) -> List[str]:
        """Parse JSON response and validate section selection"""
        result = self._parse_json_response(response)
        
        # Validate and extract section IDs
        if "relevant_sections" not in result:
            raise ValueError(f"Missing 'relevant_sections' field in section selection response: {result}")
        
        relevant_sections = result["relevant_sections"]
        if not isinstance(relevant_sections, list):
            raise ValueError(f"Field 'relevant_sections' must be a list: {relevant_sections}")
        
        return relevant_sections
    
    def _parse_json_response(self, response: str) -> Dict[str, Any]:
        """Parse JSON response - simplified logic with json repair only"""
        self.logger.debug(f"Parsing JSON response: {response[:200]}...")
        
        # Only try to extract JSON from markdown code blocks
        json_match = re.search(r'```json\s*(\{.*?\})\s*```', response, re.DOTALL)
        if not json_match:
            raise ValueError(f"No ```json ``` block found in LLM response")
        
        json_str = json_match.group(1)
        
        # Try to parse JSON directly
        try:
            return json.loads(json_str)
        except json.JSONDecodeError as e:
            self.logger.warning(f"Direct JSON parsing failed: {e}, attempting repair")
            
            # Try jsonrepair
            try:
                repaired_json = repair_json(json_str)
                return json.loads(repaired_json)
            except Exception as repair_error:
                raise ValueError(f"JSON repair failed: {repair_error}, original error: {e}")
