import json
import re
import logging
from typing import Dict, Any, List
from .base import BaseAgent
from .common_prompts import (
    TASK_CONTEXT
)
from json_repair import repair_json

# =============================================================================
# PLANNER AGENT PROMPT COMPONENTS
# =============================================================================

PLANNER_AGENT_BASE_PROMPT = """
<PLANNER_AGENT_ROLE>
# Planner Agent - Verilog HDL Task Decomposition and Document Allocation Specialist

## **Your Role in the System**
You are the **Planner Agent** in this multi-agent collaborative system. As the central coordination agent, you create the final code framework, decompose it into manageable subtasks, and allocate appropriate documentation sections to enable RTL agents to produce correct, well-integrated results.

## **Primary Mission**
Transform summarized document indexes into a structured implementation plan with pseudocode framework and document assignments, enabling downstream RTL agents to generate functionally correct Verilog code.

## **Key Responsibilities**
* **Framework Design**: Create complete module pseudocode showing overall architecture
* **Task Decomposition**: Break down implementation into 1-4 focused subtasks based on pseudocode blocks
* **Document Allocation**: Assign specific document sections to each subtask for complete implementation
* **Integration Planning**: Ensure all subtasks fit together seamlessly in final implementation
* **Placeholder Discipline**: For every area, use explicit angle-bracket placeholders with a clear action type label

## **Three-Stage Planning Process**
Follow this structured approach **step by step**:

### **Stage 1: Generate Target Pseudocode Structure**
First, envision the final correct implementation as pseudocode:
* **Simple Structure**: Create SIMPLE module structure showing overall framework
* **Module Header**: Include module header as dedicated section with placeholder for IO
* **Submodule Emphasis**: Emphasize submodule instantiation blocks with placeholder connections
* **Placeholder Comments**: Use placeholder comments for ALL signal connections and internal logic
* **Clear Boundaries**: Mark clear boundaries for different implementation areas that become subtasks
* **High-Level Connections**: Show how submodules connect using HIGH-LEVEL placeholders ONLY

**REMEMBER**: Pseudocode is for TASK PLANNING, not implementation. Keep it simple and use placeholders!

### **Stage 2: Structure-Based Task Decomposition**
Then, decompose based STRICTLY on your pseudocode structure:
* **Block Correspondence**: Each subtask MUST correspond to a clearly marked block in your pseudocode
* **Framework-Driven**: Subtask boundaries are determined by pseudocode block divisions, NOT by functional areas
* **First Subtask**: The first subtask is the module header
* **Submodule Focus**: Subtasks focus on implementing specific blocks from the pseudocode framework
* **Complete Context**: Each RTL agent receives both subtask description AND your complete pseudocode
* **Integration Understanding**: RTL agents use pseudocode to understand where their work fits in overall structure
* **Action Clarity**: Each subtask description MUST clearly state the action types involved, like module_name IO definition, parameter definition, signal declaration, submodule instantiation, connections, logic implementation. If multiple actions apply, list them explicitly.

### **Stage 3: Document Assignment for Subtasks**
Finally, assign appropriate documentation sections to each subtask:
* **Block-to-Document Mapping**: For each pseudocode block, identify document sections that provide complete implementation details
* **Complete Implementation**: Ensure each subtask has access to ALL required documentation for full block implementation
* **Specification Coverage**: Each subtask should have specifications covering signal definitions, timing requirements, and interface protocols
* **Dependency Awareness**: Include documentation for any dependencies between blocks
* **Validation Support**: Provide documentation sections that support verification and testing of the implemented block

## **CRITICAL PSEUDOCODE STYLE REQUIREMENT**
**PSEUDOCODE MUST BE HIGH-LEVEL AND CONCISE**
* **NEVER** write detailed signal lists like `.clk(clk), .rst_n(rst_n), .data_in(data_in)`
* **NEVER** write detailed io signal lists in module head like `input clk, output [31:0] data_out`
* **ALWAYS** use simple placeholders like `// <module_name io connections>`
* **Focus**: Module structure, NOT implementation details
* **RTL Agents**: Will handle all detailed signal connections

## **Critical Planning Philosophy**
* **Purpose**: Generate task plans enabling downstream RTL agents to produce correct, well-integrated results
* **Approach**: Provide clear pseudocode structure and precise task-to-code relationships

**Important**: We extract only the **LAST** JSON block from your response, so include analysis before JSON
</PLANNER_AGENT_ROLE>
"""

PLANNER_OUTPUT_FORMAT = """
<PLANNER_OUTPUT_FORMAT>
# JSON Output Format

## **Required JSON Structure**
After your step-by-step analysis, provide the complete JSON plan:

```json
{{
  "pseudocode": "// === SUBTASK 1: Module Header and IO Port Definitions ===\\nmodule e203_cpu (\\n    // <comprehensive IO port definitions>\\n    // Clock and reset interface\\n    // Instruction memory interface\\n    // Data memory interface\\n    // External interrupt interface\\n    // Debug interface\\n    // System control interface\\n);\\n\\n    // === SUBTASK 2: Reset and Clock Control ===\\n    e203_reset_ctrl u_e203_reset_ctrl (\\n        // <reset controller io connections>\\n    );\\n    \\n    e203_clk_ctrl u_e203_clk_ctrl (\\n        // <clock controller io connections>\\n    );\\n\\nendmodule",
  "subproblems": [
    {{
      "id": "module_io_interface",
      "description": "**Pseudocode Block**: This subtask implements the [SUBTASK 1: Module Header and IO Port Definitions] block in the provided pseudocode. **Target Implementation**: Define complete module header with parameter list and comprehensive IO port definitions including clock/reset, instruction/data memory interfaces, interrupt interfaces, and debug interfaces according to specification requirements.",
      "required_section_indexes": ["section_x", "section_y"]
    }},
    {{
      "id": "clock_reset_infrastructure", 
      "description": "**Pseudocode Block**: This subtask implements the [SUBTASK 2: Clock and Reset Infrastructure] block in the provided pseudocode. **Target Submodules**: Instantiate and configure clock and reset controller modules with their signal connections.",
      "required_section_indexes": ["section_z"]
    }}
  ]
}}
```

## **Quality Guidelines**
* **Subproblem Count**: 1-4 subproblems for most tasks (avoid over-fragmentation)
* **Module Ownership**: Each subproblem owns specific submodules and related signals
* **Clean Interfaces**: Clean interfaces between subproblems
* **Complete Coverage**: Comprehensive coverage of all submodules mentioned in documents
* **Valid JSON**: Complete JSON without truncation
* **Clear Pseudocode Blocks**: Each block in pseudocode MUST be clearly marked with unique identifiers (e.g., SUBTASK 1, SUBTASK 2) and distinct boundaries
* **Block Clarity**: Pseudocode blocks must have unambiguous scope and purpose, avoiding overlap or confusion between blocks
* **Document Completeness**: Each subtask must have sufficient documentation to fully implement its assigned block without requiring external assumptions
</PLANNER_OUTPUT_FORMAT>
"""

# Complete prompt assembly using + operator for consistency
PLANNER_AGENT_COMPLETE_PROMPT = (
    TASK_CONTEXT +
    PLANNER_AGENT_BASE_PROMPT +
    PLANNER_OUTPUT_FORMAT
)

class PlannerAgent(BaseAgent):
    """Agent for analyzing documents and planning task decomposition"""
    
    def __init__(self, llm_client, logger=None):
        super().__init__(llm_client, "PlannerAgent", logger)
    
    def run(self, planner_input: Dict[str, Any]) -> Dict[str, Any]:
        """
        Analyze document sections and create task decomposition plan
        
        Args:
            planner_input: {
                "section_dict": {section_id: section_content},
                "summary_dict": {section_id: {"title": str, "summary": str, "index": int}}
            }
        
        Returns:
            {
                "pseudocode": str,
                "subproblems": [...]
            }
        """
        section_dict = planner_input["section_dict"]
        summary_dict = planner_input["summary_dict"]
        
        self.logger.info(f"Planning for {len(section_dict)} document sections")
        self.logger.info(f"Available summaries: {len(summary_dict)}")
        
        # Generate planning result
        planning_result = self._generate_plan(section_dict, summary_dict, planner_input["task_name"])
        
        self.logger.info(f"Generated plan with {len(planning_result['subproblems'])} subproblems")
        
        return {
            "pseudocode": planning_result["pseudocode"],
            "subproblems": planning_result["subproblems"]
        }
    
    def _parse_json_response(self, response: str) -> Dict[str, Any]:
        """Parse JSON response - simplified logic with json repair only"""
        self.logger.debug(f"Parsing JSON response: {response[:200]}...")
        
        # Find all JSON blocks in markdown code blocks
        json_blocks = []
        for match in re.finditer(r'```json\s*(\{.*?\})\s*```', response, re.DOTALL):
            json_blocks.append(match.group(1))
        
        if not json_blocks:
            raise ValueError(f"No ```json ``` block found in LLM response")
        
        # Use the last JSON block found
        json_str = json_blocks[-1]
        
        # Try to parse JSON directly
        try:
            parsed = json.loads(json_str)
            
            # Validate required top-level fields
            required_fields = ["pseudocode", "subproblems"]
            missing_fields = [f for f in required_fields if f not in parsed]
            if missing_fields:
                raise ValueError(f"JSON missing required fields: {missing_fields}")
            
            return parsed
            
        except json.JSONDecodeError as e:
            self.logger.warning(f"Direct JSON parsing failed: {e}, attempting repair")
            
            # Try jsonrepair
            try:
                repaired_json = repair_json(json_str)
                parsed = json.loads(repaired_json)
                
                # Re-validate required fields after repair
                required_fields = ["pseudocode", "subproblems"]
                missing_fields = [f for f in required_fields if f not in parsed]
                if missing_fields:
                    raise ValueError(f"Repaired JSON missing required fields: {missing_fields}")
                
                return parsed
                
            except Exception as repair_error:
                raise ValueError(f"JSON repair failed: {repair_error}, original error: {e}")
    
    def _generate_plan(self, section_dict: Dict[str, str], summary_dict: Dict[str, Any], task_name: str) -> Dict[str, Any]:
        """Generate task decomposition plan using LLM"""
        
        # Combine section and summary information
        combined_sections = "Document Sections:\n"
        available_sections = []
        for section_id in summary_dict.keys():
            if section_id in section_dict:
                available_sections.append(section_id)
                title = summary_dict[section_id].get('title', f"Section {summary_dict[section_id]['index']}")
                # Load summary directly from JSON structure
                section_data = summary_dict[section_id]
                summary = section_data['summary']
                content = section_dict[section_id]
                
                combined_sections += f"\n=== {section_id} ===\n"
                combined_sections += f"Title: {title}\n"
                combined_sections += f"Summary: {summary}\n"
                combined_sections += f"Content: {content}\n"
        
        available_sections_info = f"Available section IDs: {', '.join(available_sections)}"
        
        # Use pre-assembled complete prompt
        prompt = self.build_prompt(
            PLANNER_AGENT_COMPLETE_PROMPT + "\n\n" +
            "TASK: Create task decomposition plan based on document sections.\n\n" +
            "--- DOCUMENT SECTIONS ---\n{combined_sections}\n\n" +
            "REQUIREMENTS:\n" +
            "- Use only available section IDs in required_section_indexes\n" +
            "- Make subproblem descriptions specific and actionable\n" +
            "- Supplement missing implementation context not fully covered in sections\n\n",
            available_sections_info=available_sections_info,
            combined_sections=combined_sections,
            task_name=task_name
        )
        
        response = self.llm_complete(prompt)
        
        # Parse JSON response with strict error handling
        result = self._parse_json_response(response)
        
        # Enhanced validation with more specific error messages
        required_fields = ["pseudocode", "subproblems"]
        for field in required_fields:
            if field not in result:
                raise ValueError(f"Missing required field '{field}' in planning result. Available fields: {list(result.keys())}")
            if result[field] is None:
                raise ValueError(f"Field '{field}' is null in planning result")
        
        # Enhanced subproblems validation
        if not isinstance(result["subproblems"], list):
            raise ValueError(f"Field 'subproblems' must be a list: {result['subproblems']}")
        
        if len(result["subproblems"]) == 0:
            raise ValueError("Field 'subproblems' cannot be empty")
        
        for i, subproblem in enumerate(result["subproblems"]):
            if not isinstance(subproblem, dict):
                raise ValueError(f"Subproblem {i} must be a dictionary: {subproblem}")
                
            required_sub_fields = ["id", "description", "required_section_indexes"]
            for field in required_sub_fields:
                if field not in subproblem:
                    raise ValueError(f"Missing required field '{field}' in subproblem {i}: {subproblem}")
                if subproblem[field] is None or (isinstance(subproblem[field], str) and not subproblem[field].strip()):
                    raise ValueError(f"Field '{field}' is empty or null in subproblem {i}")
            
            if not isinstance(subproblem["required_section_indexes"], list):
                raise ValueError(f"Field 'required_section_indexes' must be a list in subproblem {i}: {subproblem['required_section_indexes']}")
            
            # Validate description is detailed enough
            if len(subproblem["description"]) < 50:
                self.logger.warning(f"Subproblem {i} description may be too brief: {len(subproblem['description'])} characters")
        
        return result
