import json
import time
from typing import List, Tuple, Optional, Dict, Any, Literal
from pydantic import BaseModel, Field
from core.base_agent import BaseAgent
from core.environment import WorkEnvironment
from core.history_manager import HistoryManager

class Subtask(BaseModel):
    context: str = Field(..., description="The context for this subtask")
    tools: Dict[str, Any] = Field(default_factory=dict, description="Tool configurations")

class Dispatch_list(BaseModel):
    dispatch_list: List[Subtask] = Field(..., description="The list of subtasks")

class OrganizerResponse(BaseModel):
    dispatch_list: List[Subtask] = Field(..., description="The list of subtasks")
    scratchpad: str = Field(..., description="Summary of task progress")
    finish_msg: Optional[str] = Field(None, description="Final answer if the task is complete, otherwise null")


class Organizer(BaseAgent):

    PROMPT_START = """
    You are an Organizer. You are going to analyze the user query and available tools. 
    Decompose the user query into exclusively tool-based sub-tasks, assigning a single tool to each. 
    Dispatch only the subtasks that are ready to run given the current context. Defer any subtasks that depend on future tool outputs.
    If the current context provides sufficient information to satisfy the Objective or if the required actions are not supported by the available tools, DO NOT dispatch new tasks.
    For every sub-task, provide the shortest complete context necessary for execution to ensure atomicity and sub-task isolation.
    
    User Query: {query}
    Tools: {tools}
    
    Output a list of subtasks to be dispatched immediately. 
    Return JSON:
    {{
        "dispatch_list":[
                            {{
                                "context": "...",
                                "tools": "{{"name":..., "arguments": ...}}"
                            }},
                            {{...}}
                        ]
    }}
    """

    PROMPT_PLAN_AND_DISPATCH = """
    You are the Organizer.
    Available Toolset: {tools}
    Current Objective: {objective}
    Previous Scratchpad: {scratchpad}
    New Observations: {observation}
    Active Executors (Running): {active}

    **Directives:**
    1. **Update State:** Digest the observation result in last return. If tasks failed or revealed new info, update your plan immediately.
    2. **Check Concurrency:** Cross-reference the active and scratchpad. NEVER dispatch tasks that are already running. Do not retry.
    3. **Prune & Converge:** If the path is wrong, abandon pending tasks. Dispatch ONLY the next atomic step(s).
    4. **Dispatch Decision:** Dispatch only minimal, ready-to-run, new and necessary subtasks; return `[]` (0 tasks) if the objective is met, is blocked by dependencies, or requires unsupported tools.
    
    **Action:**
    Determine the next steps. Update the `scratchpad` to reflect the *current* situational summary (e.g., "Step A done, Step B failed, retrying B with new params").
    - If objective met: `dispatch_list`=[], set `finish_msg` to your final response to the objective.
    - If working: `dispatch_list`=[new_tasks], set `finish_msg`="".

    Return JSON:
    {{
        "dispatch_list": [
                            {{
                                "context": "...",
                                "tools": "{{"name":..., "arguments": ...}}"
                            }},
                            {{...}}
                        ],
        "scratchpad": "Updated concise summary of progress and next immediate focus.",
        "finish_msg": "" or "final response"
    }}
    """

    thinking_mode: bool = False
    dispatch_list: List[str] = []
    use_tester: bool = False

    def __init__(self, history_manager: HistoryManager, **kwargs):
        super().__init__(**kwargs)
        self.history_manager = history_manager

    def force_to_string(self, value):
        if isinstance(value, (dict, list)):
            return json.dumps(value, ensure_ascii=False)
        return str(value)    

    async def start(self, initial_message: str, tools: List[Dict], dataset_id: str, env: Optional[WorkEnvironment] = None) -> Tuple[WorkEnvironment, List[str]]:
        if env is None:
            env = WorkEnvironment()
            env.objective.append(initial_message)
            env.scratchpads.append('')
            env.tools = tools
        else:
            if not env.scratchpads:
                env.scratchpads.append('')

        if len(env.objective) > 1:
            # scratchpad[-1] as context
            combined_query = (
                f"Previous Context:\n{env.scratchpads[-1]}\n\n"
                f"Current User Query: {env.objective[-1]}"
            )
        else:
            combined_query = env.objective[-1]


        prompt = self.PROMPT_START.format(query=combined_query, tools=json.dumps(tools, ensure_ascii=False))
        messages = [{"role": "user", "content": prompt}]
        
        reasoning_content, content = await self.call(messages, Dispatch_list)

        initial_tasks_data = json.loads(content)
        dispatch_list = [str(t) for t in initial_tasks_data['dispatch_list']]

        env.dispatch_list_history.append(dispatch_list)
        env.thinking_history.append(reasoning_content or '')

        
        return env, dispatch_list

    def update_env(self, current_env: WorkEnvironment, executor_return: Dict) -> WorkEnvironment:
        current_env.unregister_executor(executor_return)
        return current_env

    async def plan_and_dispatch(self, current_env: WorkEnvironment, dataset_id: str, step: int, turn_index: int = 0) -> Tuple[str, List[str], Optional[str]]:
        # current_env.debug_print_executors()
        
        scratchpad = current_env.scratchpads[-1]
        executor_return_as_observation = json.dumps(current_env.task_history[-1], ensure_ascii=False) if current_env.task_history else ""
        active_str = json.dumps(current_env.active_registry, ensure_ascii=False)
        
        prompt = self.PROMPT_PLAN_AND_DISPATCH.format(
            tools=current_env.tools,
            objective=current_env.objective[-1],
            scratchpad=scratchpad,
            active=active_str,
            observation=executor_return_as_observation,
        )
        messages = [{"role": "user", "content": prompt}]
        
        reasoning_content, content = await self.call(messages, OrganizerResponse)
        current_env.thinking_history.append(reasoning_content or '')
        
        response = json.loads(content)
        current_env.scratchpads.append(response['scratchpad'])

        dispatch_list = response['dispatch_list']
        dispatch_list = [self.force_to_string(ctx) for ctx in dispatch_list]
        current_env.dispatch_list_history.append(dispatch_list)

        finish_msg = response['finish_msg']

        for context in dispatch_list:
            current_env.register_executor(context)
            
        to_write = (finish_msg != "")
        self.history_manager.save(
            current_env, dataset_id, step, finish_msg, turn_index=turn_index,
            to_write=to_write
        )
        
        return reasoning_content, dispatch_list, finish_msg

