"""
Orchestra Core - SubAgent (执行智能体)

SubAgent 是实际执行任务的智能体，特点:
1. 在隔离环境（如 Docker 容器）中执行
2. 通过 execute/finish 等动作与环境交互
3. 执行完成后通过 finish 动作报告结果给 MainAgent

设计说明:
- SubAgent 不能直接 submit，只能 finish 报告进度
- MainAgent 根据 SubAgent 的 finish_result 决定是否 submit
"""
from __future__ import annotations

import json
from typing import Any, Dict, List, Optional, Tuple

from orchestra_core.interfaces import (
    Action,
    BaseAgent,
    BasicInfo,
    LLMInterface,
)


class SubAgent:
    """执行智能体 - 在隔离环境中执行具体任务"""
    
    def __init__(
        self,
        llm: LLMInterface,
        context: str = "",
        sub_model: str = "",
        allowed_tools: Optional[List[str]] = None,
    ):
        """
        初始化 SubAgent
        
        Args:
            llm: LLM 接口实例
            context: MainAgent 提供的额外上下文
            sub_model: 使用的模型标识
            allowed_tools: 允许使用的工具列表（None 表示全部可用）
        """
        self.llm = llm
        self.context = context
        self.sub_model = sub_model
        self.allowed_tools = allowed_tools
        
        # 状态
        self.instruction: str = ""
        self.action_space: str = ""
        self.max_steps: int = 30
        self.current_step: int = 0
        self.history: List[Dict] = []
    
    def reset(self, env_info: BasicInfo) -> None:
        """重置 SubAgent 状态"""
        self.instruction = env_info.instruction
        self.action_space = env_info.action_space
        self.max_steps = env_info.max_steps
        self.current_step = 0
        self.history = []
        
        # 如果有上下文，添加到 instruction
        if self.context:
            self.instruction = f"{env_info.instruction}\n\n[Context from MainAgent]\n{self.context}"
        
        # 如果限制了工具，修改 action_space
        if self.allowed_tools:
            self.action_space = f"{env_info.action_space}\n\n[TOOL RESTRICTION] You can ONLY use: {self.allowed_tools}"
    
    async def step(
        self,
        observation: Any,
        history: List,
        current_step: int = 0,
        max_steps: int = 30,
        **kwargs
    ) -> Tuple[Action, str, str]:
        """
        执行一步决策
        
        Args:
            observation: 当前观察
            history: 执行历史
            current_step: 当前步数
            max_steps: 最大步数
        
        Returns:
            tuple: (action_dict, raw_response, raw_input_prompt)
        """
        self.current_step = current_step
        self.max_steps = max_steps
        
        # 构建 prompt
        prompt = self._build_prompt(observation, history, current_step, max_steps)
        
        # 调用 LLM
        resp = await self.llm(prompt)
        
        # 解析 action
        action = self._parse_action(resp)
        
        return action, resp, prompt
    
    def _build_prompt(
        self,
        observation: Any,
        history: List,
        current_step: int,
        max_steps: int
    ) -> str:
        """构建 SubAgent 的执行 prompt"""
        # 格式化历史
        history_text = self._format_history(history)
        
        # 格式化当前观察
        obs_text = self._format_observation(observation)
        
        prompt = f"""You are a SubAgent executing a specific task in an isolated environment.

==== TASK ====
{self.instruction}

==== ACTION SPACE ====
{self.action_space}

==== EXECUTION HISTORY ====
{history_text if history_text else "No previous actions."}

==== CURRENT OBSERVATION ====
{obs_text}

==== PROGRESS ====
Step {current_step}/{max_steps}
{'⚠️ WARNING: Only ' + str(max_steps - current_step) + ' steps remaining! Consider using finish to report progress.' if max_steps - current_step <= 5 else ''}

==== OUTPUT ====
Return a JSON action:
{{"action": "execute|finish", "params": {{...}}}}

For execute:
{{"action": "execute", "params": {{"command": "your shell command"}}}}

For finish (IMPORTANT: call this before running out of steps!):
{{"action": "finish", "params": {{
    "status": "done|partial|blocked",
    "completed": ["list of completed items"],
    "issues": ["list of issues encountered"],
    "message": "brief summary"
}}}}
"""
        return prompt.strip()
    
    def _format_history(self, history: List) -> str:
        """格式化执行历史"""
        if not history:
            return ""
        
        lines = []
        for i, record in enumerate(history[-10:], 1):  # 只保留最近 10 条
            action = record.action if hasattr(record, 'action') else record.get('action', {})
            obs = record.observation if hasattr(record, 'observation') else record.get('observation', {})
            
            action_type = action.get('action', 'unknown')
            if action_type == 'execute':
                cmd = action.get('params', {}).get('command', '')[:100]
                exit_code = obs.get('exit_code', 'N/A') if isinstance(obs, dict) else 'N/A'
                output = str(obs.get('output', ''))[:200] if isinstance(obs, dict) else str(obs)[:200]
                lines.append(f"[Step {i}] execute: {cmd}")
                lines.append(f"  → exit_code={exit_code}, output: {output}...")
            else:
                lines.append(f"[Step {i}] {action_type}: {action.get('params', {})}")
        
        return "\n".join(lines)
    
    def _format_observation(self, observation: Any) -> str:
        """格式化当前观察"""
        if observation is None:
            return "No observation yet."
        
        if isinstance(observation, dict):
            if 'output' in observation:
                output = observation['output']
                exit_code = observation.get('exit_code', 'N/A')
                return f"Exit Code: {exit_code}\nOutput:\n{output}"
            return json.dumps(observation, indent=2, ensure_ascii=False)
        
        return str(observation)
    
    def _parse_action(self, resp: str) -> Action:
        """从 LLM 响应中解析 action"""
        import re
        
        s = resp.strip()
        
        # 尝试从 markdown 代码块中提取
        code_block_pattern = r'```(?:json)?\s*\n?([\s\S]*?)\n?```'
        match = re.search(code_block_pattern, s)
        if match:
            s = match.group(1).strip()
        else:
            # 尝试直接查找 JSON 对象
            start = s.find('{')
            end = s.rfind('}')
            if start != -1 and end != -1 and end > start:
                s = s[start:end + 1]
        
        try:
            return json.loads(s)
        except json.JSONDecodeError:
            # 解析失败时返回默认 action
            return {
                "action": "error",
                "params": {"error": f"Failed to parse action from response: {resp[:200]}"}
            }
