import sys
import os
import json
import re
from typing import Dict

from src.utility_benchmark.tool_calling_agents import ToolAgent
from src.evaluation.gated_evaluator import GatedEvaluator  # <-- Use our new evaluator
from src.utility_benchmark.prompts import JSON_SYSTEM_PROMPT  # <-- Import the specific prompt
from utility_benchmark.user.legacy.llm_user import LLMUser

class GatedInteractionEnvironment:
    def __init__(self, agent: ToolAgent, task_data: dict, user_simulator: LLMUser):
        self.agent = agent
        self.task_data = task_data
        # Use the GatedEvaluator
        self.evaluator = GatedEvaluator(
            db_path='/path/to/data/database/accommodations.csv',
            tasks_path='/path/to/tasks.jsonl'
        )
        self.conversation_history = []
        self.turn_limit = 5  # Let's keep the conversation short for testing
        self.user_simulator = user_simulator
        
    def _initialize_conversation(self):
        """Sets up the initial conversation."""
        self.conversation_history = [{"role": "system", "content": JSON_SYSTEM_PROMPT}] # <-- Use the specific prompt
        initial_query = self.user_simulator.generate_initial_query()
        print(f"--- Initial Query (Generated) ---\n{initial_query}\n{'-'*31}")
        self.conversation_history.append({"role": "user", "content": initial_query})

    def _parse_and_evaluate_proposal(self, agent_response_content: str):
        """
        Parses the agent's JSON response and runs our gated evaluation.
        """
        print("\nAssistant:")
        final_score = None
        booking_finalized = False
        dialogue = ""

        try:
            # The entire response should be a JSON object.
            # Sometimes models wrap it in ```json ... ```, so we'll strip that.
            if agent_response_content.startswith("```json"):
                agent_response_content = re.search(r"```json\s*(\{.*?\})\s*```", agent_response_content, re.DOTALL).group(1)
            
            response_json = json.loads(agent_response_content)
            intent = response_json.get("intent")
            dialogue = response_json.get("dialogue", "[No dialogue provided]")
            payload = response_json.get("payload", {})

            print(f"Intent: {intent}\nDialogue: {dialogue}")

            if intent == "proposal" and payload.get("type") == "accommodation":
                proposed_id = payload.get("accommodation_id")
                if proposed_id is not None:
                    print(f"--- Agent proposed accommodation ID: {proposed_id} ---")
                    eval_results = self.evaluator.evaluate(self.task_data['task_id'], proposed_id)
                    final_score = eval_results.get('utility_score', 0)
                    print(f"\n--- [GATED EVALUATION] ---\n{eval_results}")
                else:
                    print("--- [EVALUATION ERROR] ---: Proposal payload missing 'accommodation_id'.")

            if intent == "book":
                booking_finalized = True

        except (json.JSONDecodeError, AttributeError) as e:
            print(f"  [Could not parse agent's JSON response: {e}]\nRaw response: {agent_response_content}")
            # Use the raw response as dialogue if parsing fails
            dialogue = agent_response_content

        return final_score, booking_finalized, dialogue

    def run_episode(self):
        """Runs a single conversational episode and returns the final score."""
        self._initialize_conversation()
        final_utility_score = 0

        for turn in range(self.turn_limit):
            print(f"\n--- Turn {turn + 1}/{self.turn_limit} ---")

            # Get agent response
            agent_response_content = self.agent.get_agent_response(self.conversation_history)
            print(f"[Agent response: {agent_response_content}]")
            
            # The agent's raw response is the full JSON string.
            # We parse it, evaluate it, and extract the dialogue for the next turn.
            score, booking_finalized, dialogue_for_user = self._parse_and_evaluate_proposal(agent_response_content)
            
            self.conversation_history.append({"role": "assistant", "content": agent_response_content})

            if score is not None:
                final_utility_score = score

            if booking_finalized:
                print("\n--- Agent finalized the booking. Ending episode. ---")
                return final_utility_score

            # Get user feedback based on the dialogue part of the response
            user_feedback = self.user_simulator.get_feedback(
                self.conversation_history, 
                None, # We are not using eval results for feedback yet
                current_turn=turn + 1,
                turn_limit=self.turn_limit
            )
            print(f"User: {user_feedback}")
            self.conversation_history.append({"role": "user", "content": user_feedback})
            
        print("\n--- Turn limit reached. Ending episode. ---")
        return final_utility_score 