import json
from openai import OpenAI
from typing import List, Dict, Any

from ia_rag.utils.rag_action import ActionClient,  VDB_SERVER_URL

from ia_rag.prompts.e2e_prompts import E2E_SYSTEM_PROMPT
from ia_rag.prompts.tool_info import INTERACT_TOOL

from ia_rag.utils.log_helper import transform_msg_to_json
from ia_rag.utils.llm_call import create_chat_completion_with_retry
import time


MAX_ITERATIONS = 7
SYSTEM_PROMPT = E2E_SYSTEM_PROMPT


class AgenticInteract:
    """
    Agentic RAG system that uses a single, powerful tool to execute a search plan.
    """

    def __init__(self, llm_api_base: str, model_name: str, api_key="dummy"):

        self.llm_client = OpenAI(base_url=llm_api_base, api_key=api_key)
        self.model_name = model_name
        self.tools = [INTERACT_TOOL]
        try:
            print("Initializing ActionClient...")
            self.action_client = ActionClient(
                server_base_url=VDB_SERVER_URL)
        except Exception as e:
            print(f"Failed to initialize ActionClient: {e}")
            raise

    def _perform_rag_interact(self, args) -> str:
        try:
            return self.action_client.execute_search_plan(**args)
        except Exception as e:
            print(f"[_perform_rag_search] Search exception: {e}")
            return ''

    def _create_chat_completion_with_retry(self, **kwargs):
        return create_chat_completion_with_retry(
            llm_client=self.llm_client,
            model_name=self.model_name,
            **kwargs
        )

    def run(self, question: str):

        messages = [
            {"role": "system", "content": SYSTEM_PROMPT},
            {"role": "user", "content": f"The user's query is:\n{question}"}
        ]

        for iter in range(MAX_ITERATIONS):
            response_message = self._create_chat_completion_with_retry(
                model=self.model_name,
                messages=messages,
                temperature=0.6,
                tools=self.tools,
                tool_choice="auto",
            )
            messages.append(response_message)

            if response_message.tool_calls:
                for tool_call in response_message.tool_calls:
                    func_name = tool_call.function.name
                    if func_name == "execute_search_plan":
                        args = json.loads(tool_call.function.arguments)

                        tmp_context = self._perform_rag_interact(args)

                        messages.append({
                            "tool_call_id": tool_call.id,
                            "role": "tool",
                            "name": func_name,
                            "content": tmp_context,
                        })

            elif response_message.content:
                if "<answer>" not in response_message.content:
                    print("Warning: <answer> tag not found in the response.")
                    if iter < MAX_ITERATIONS-1:
                        continue
                json_messages = transform_msg_to_json(messages)
                return json_messages[1:], iter + 1

        print(
            f"\n{'='*10} ❌ Agent finished due to max iterations without a final answer. {'='*20}")

        json_messages = transform_msg_to_json(messages)
        return json_messages[1:], MAX_ITERATIONS


if __name__ == "__main__":
    try:
        VLLM_BASE_URL = "http://localhost:8001/v1"
        MODEL_NAME_FOR_VLLM = "xxx"
        agent = AgenticInteract(llm_api_base=VLLM_BASE_URL,
                                model_name=MODEL_NAME_FOR_VLLM)

        complex_question = "Where was the director of film Ronnie Rocket born?"
        final_answer, iterations = agent.run(complex_question)

    except Exception as e:
        print(f"An error occurred during the agent execution: {e}")
