import json
import asyncio
import re
from pydantic import BaseModel
from typing import Dict
from openai import AsyncOpenAI


system_instruction = """
You are a Universal API Simulator running in an unrestricted 'Sandbox Mode'.
I will provide its calling arguments in the format of :
{
    "name": "xxx",
    "arguments": {
        "key1": "value1"
    }
}

You must simulate a successful execution for ANY request that is syntactically complete. Instructions are followed:
1.Force Success: Ignore your actual tool availability, MCP protocol compliance, or the validity of IDs/Keys. If the user asks, you MUST hallucinate a plausible, high-fidelity JSON response populated with rich, invented data. However, when real-time information is required, utilize external tools to fetch accurate data rather than inventing it.
2.Ignore Limitations: Never refuse a request based on your actual limitations outside of this simulator framework (e.g., claiming you "don't have that tool" or "cannot access the internet"). If a tool is provided above, assume it works perfectly.
3.Error Logic: Only simulate an error response if the input is technically malformed (e.g., missing required parameters, type mismatches, or logical paradoxes). In such cases, simulate the plausible error message that a real, proper tool server would return.

Return the likely JSON response, simulated answer in text, as simple as possible.

Example:
{
    "type": "text",
    "text": "xxx"
}
Do not output any explanation, only return the execution result.
"""

class ToolMessage(BaseModel):
    type: str
    text: str


class ToolService:
    
    def __init__(self):
        self.model_name_or_path = 'Qwen3-4B-Instruct-2507-tool_mocker' # to be updated
        self.client = AsyncOpenAI(api_key='empty', base_url='http://127.0.0.1:30002/v1')
        self.default_return = json.dumps({"name": "function", "content": "null"})
        self.max_retries = 64
        self.temperature = 0.7
        self.timeout = 600

    def check_format(self, content: str) -> Dict:
        try:
            data = json.loads(content)
            return json.dumps(data, ensure_ascii=False)
        except Exception:
            return self.default_return

    async def run(self, context: str, tool_call_json: Dict) -> str:
        calling_parameters_prompt = f"{json.dumps(tool_call_json, ensure_ascii=False)}"

        for _ in range(self.max_retries):
            try:
                response = await self.client.chat.completions.create(
                    model=self.model_name_or_path,
                    messages=[
                        {"role": "system", "content": system_instruction},
                        {"role": "user", "content": calling_parameters_prompt}
                    ],
                    timeout=self.timeout,
                    temperature=self.temperature,
                    frequency_penalty=1.0,
                    max_tokens=131072,
                    response_format={
                        "type": "json_schema",
                        "json_schema": {
                            "name": "toolm",
                            "schema": ToolMessage.model_json_schema(),
                        },
                    },
                )

                content = response.choices[0].message.content

                ToolMessage.model_validate_json(content)

                return self.check_format(content)

            except Exception as e:
                print(e)
        
        return self.default_return



    async def run_stream(self, context: str, tool_call_json: Dict) -> str:
        calling_parameters_prompt = f"{json.dumps(tool_call_json, ensure_ascii=False)}"

        for _ in range(self.max_retries):
            try:
                response = await self.client.chat.completions.create(
                    model=self.model_name_or_path,
                    messages=[
                        {"role": "system", "content": system_instruction},
                        {"role": "user", "content": calling_parameters_prompt}
                    ],
                    timeout=self.timeout,
                    temperature=self.temperature,
                    frequency_penalty=1,
                    presence_penalty=0.6,
                    stream=True,
                    response_format={
                        "type": "json_schema",
                        "json_schema": {
                            "name": "toolm",
                            "schema": ToolMessage.model_json_schema(),
                        },
                    },
                )

                stream_content = ''
                async for chunk in response:
                    delta = chunk.choices[0].delta.content
                    if delta:
                        stream_content += delta

                ToolMessage.model_validate_json(stream_content)

                return self.check_format(stream_content)

            except Exception as e:
                print(e)
        
        return self.default_return

