import os
import sys
import json
import openai
import litellm
from anthropic import Anthropic
from typing import List, Dict, Any, Optional
import importlib

from src.utility_benchmark.prompts import TOOL_SCHEMAS
from src.utility_benchmark.token_tracker import TokenTracker
from src.utility_benchmark.model_handlers import ModelHandler, ModelConfig


# Ensure the parent directory is in the system path to find other modules
sys.path.append(os.path.abspath(os.path.join(os.path.dirname(__file__), '..')))

# --- Setup sys.path ---
# This setup is crucial for dynamically loading tool modules
original_cwd = os.getcwd()
# Change to the directory of this file to handle relative paths correctly
os.chdir(os.path.dirname(os.path.abspath(__file__)))
# Add the tools directory to the path
sys.path.append(os.path.abspath(os.path.join(os.path.dirname(__file__), '..', 'tools')))
# Restore original CWD
os.chdir(original_cwd)


# Model configuration is now handled in model_handlers.py

# --- Tool Utilities ---
def to_string(data) -> str:
    """Converts tool output to a string format."""
    if data is None:
        return str(None)
    # The original script returned pandas DataFrames for some tools.
    # In a real scenario, you might format this better, but for now, str() is fine.
    return str(data)

def get_tool_call_id(tool_call):
    """Get tool call ID from either dict format (Claude) or object format (Qwen)."""
    if hasattr(tool_call, 'id'):
        return tool_call.id
    return tool_call.get('id')

def get_tool_call_name(tool_call):
    """Get function name from either dict format (Claude) or object format (Qwen)."""
    if hasattr(tool_call, 'function'):
        return tool_call.function.name
    return tool_call['function']['name']

def get_tool_call_arguments(tool_call):
    """Get function arguments from either dict format (Claude) or object format (Qwen)."""
    if hasattr(tool_call, 'function'):
        return tool_call.function.arguments
    return tool_call['function']['arguments']

class ToolAgent:
    def __init__(self, model_name: str = "gpt-4o", tools_list: List[str] = None, **model_kwargs):
        self.model_name = model_name
        self.tools_list = tools_list or []
        
        # Initialize model handler for unified model management
        self.model_handler = ModelHandler(model_name, **model_kwargs)
        self.provider = self.model_handler.provider
        self.use_direct_client = self.model_handler.use_direct_client
        
        # Keep these for backward compatibility
        self.anthropic_client = self.model_handler.anthropic_client
        self.model_params = self.model_handler.model_params
        
        self.schemas = TOOL_SCHEMAS
        self.func_name_to_tool_key = self._create_function_mapping()

        self.tools_map = self._load_tools(self.tools_list)
        self.tool_definitions = self._create_tool_definitions()
        self.notebook = self.tools_map.get('notebook')
        
        # Initialize token tracker for this agent
        self.token_tracker = TokenTracker()
    
    def _create_function_mapping(self) -> Dict[str, str]:
        """Creates a mapping from function names to tool keys."""
        mapping = {}
        
        # Direct mappings for most tools
        for k, v in self.schemas.items():
            func_name = v.get('name', '')
            if func_name:
                mapping[func_name] = k
        
        # Special mappings for utils functions that map to the same tool
        mapping['get_weekday'] = 'utils'
        mapping['calculate'] = 'utils'
        
        # Special mappings for accommodations functions
        mapping['AccommodationSearch'] = 'accommodations'
        mapping['get_hotel_details'] = 'accommodations'
        mapping['get_room_details'] = 'accommodations'
        mapping['search_location_name'] = 'accommodations'
        
        return mapping

    def _load_tools(self, tools_list: List[str]) -> Dict[str, Any]:
        """Dynamically imports and instantiates tool classes."""
        class_name_map = {
            "flights": "Flights",
            "attractions": "Attractions",
            "accommodations": "Accommodations",
            "restaurants": "Restaurants",
            "googleDistanceMatrix": "GoogleDistanceMatrix",
            "cities": "Cities",
            "notebook": "Notebook",
            "planner": "Planner",
            "recommender": "Recommender",
            "utils": "UtilsTools",
        }
        tools_map = {}
        for tool_name in tools_list:
            if tool_name not in class_name_map:
                 # print(f"Warning: Tool '{tool_name}' is not a known tool and will be skipped.")
                 continue
            try:
                # The module path is now relative to the `tools` directory
                module = importlib.import_module(f"tools.{tool_name}.apis")
                
                class_name = class_name_map.get(tool_name)
                
                # The planner tool needs the model_name passed to its constructor
                if tool_name == 'planner':
                    tools_map[tool_name] = getattr(module, class_name)(model_name=self.model_name)
                else:
                    tools_map[tool_name] = getattr(module, class_name)()

            except (ModuleNotFoundError, AttributeError) as e:
                print(f"Warning: Could not load tool '{tool_name}': {e}")
        return tools_map


    def _execute_tool(self, tool_name: str, tool_args: Dict[str, Any]) -> str:
        """Executes a tool and returns the output as a string."""
        # print(f"\n🔧 [TOOL DEBUG] Attempting to call tool: '{tool_name}'")
        # print(f"🔧 [TOOL DEBUG] Arguments: {tool_args}")
        
        tool_output = ""
        try:
            tool_key = self.func_name_to_tool_key.get(tool_name)
            # print(f"🔧 [TOOL DEBUG] Mapped to tool_key: '{tool_key}'")
            
            if not tool_key:
                error_msg = f"Error: Tool with function name '{tool_name}' not found."
                # print(f"❌ [TOOL DEBUG] {error_msg}")
                # print(f"🔧 [TOOL DEBUG] Available function mappings: {list(self.func_name_to_tool_key.keys())}")
                return error_msg

            tool_instance = self.tools_map.get(tool_key)
            if not tool_instance:
                error_msg = f"Error: Tool implementation for '{tool_key}' not found."
                # print(f"❌ [TOOL DEBUG] {error_msg}")
                # print(f"🔧 [TOOL DEBUG] Available tools: {list(self.tools_map.keys())}")
                return error_msg
            
            # print(f"🔧 [TOOL DEBUG] Found tool instance: {type(tool_instance).__name__}")
            
            # Special handling for utils tools with specific method calls
            if tool_key == 'utils':
                # print(f"🔧 [TOOL DEBUG] Executing utils tool method: {tool_name}")
                if tool_name == 'get_weekday':
                    tool_output = tool_instance.get_weekday(**tool_args)
                elif tool_name == 'calculate':
                    tool_output = tool_instance.calculate(**tool_args)
                else:
                    error_msg = f"Error: Unknown utils method '{tool_name}'"
                    # print(f"❌ [TOOL DEBUG] {error_msg}")
                    return error_msg
            # Special handling for accommodations tools with specific method calls
            elif tool_key == 'accommodations':
                # print(f"🔧 [TOOL DEBUG] Executing accommodations tool method: {tool_name}")
                if tool_name == 'AccommodationSearch':
                    tool_output = tool_instance.search_hotels(**tool_args)
                elif tool_name == 'get_hotel_details':
                    tool_output = tool_instance.get_hotel_details(**tool_args)
                elif tool_name == 'get_room_details':
                    tool_output = tool_instance.get_room_details(**tool_args)
                elif tool_name == 'search_location_name':
                    tool_output = tool_instance.search_location_name(**tool_args)
                else:
                    error_msg = f"Error: Unknown accommodations method '{tool_name}'"
                    # print(f"❌ [TOOL DEBUG] {error_msg}")
                    return error_msg
            # Special handling for notebook tool
            elif tool_key == 'notebook':
                # print(f"🔧 [TOOL DEBUG] Executing notebook tool method: {tool_name}")
                if tool_name == 'Notebook':
                    tool_output = tool_instance.notebook(**tool_args)
                else:
                    error_msg = f"Error: Unknown notebook method '{tool_name}'"
                    # print(f"❌ [TOOL DEBUG] {error_msg}")
                    return error_msg
            # The `run` method in each tool's API is the designated entry point.
            elif hasattr(tool_instance, 'run'):
                # print(f"🔧 [TOOL DEBUG] Executing tool using 'run' method")
                tool_output = tool_instance.run(**tool_args)
            else:
                # Fallback for older tools that might not have a `run` method,
                # though the current standard is to use `run`.
                # This assumes the tool class itself is callable.
                # print(f"🔧 [TOOL DEBUG] Executing tool as callable")
                tool_output = tool_instance(**tool_args)
            
            # print(f"✅ [TOOL DEBUG] Tool execution successful!")
            # print(f"🔧 [TOOL DEBUG] Raw output type: {type(tool_output)}")
            # print(f"🔧 [TOOL DEBUG] Raw output (first 300 chars): {str(tool_output)[:300]}...")
            
            if tool_key == 'recommender':
                # print("\n--- Recommender Tool Output ---")
                # print(tool_output)
                # print("-----------------------------\n")
                pass

            final_output = to_string(tool_output)
            # print(f"🔧 [TOOL DEBUG] Final output (first 300 chars): {final_output[:300]}...")
            # print(f"🔧 [TOOL DEBUG] Tool call completed successfully\n")
            
            return final_output

        except Exception as e:
            error_msg = f"Error executing tool {tool_name}: {e}"
            # print(f"❌ [TOOL DEBUG] Exception occurred: {e}")
            # print(f"❌ [TOOL DEBUG] Exception type: {type(e)}")
            import traceback
            # print(f"❌ [TOOL DEBUG] Traceback: {traceback.format_exc()}")
            # print(f"❌ [AGENT] Error executing tool '{tool_name}': {e}")
            return error_msg

    def _convert_tools_for_anthropic(self, tool_definitions: List[Dict[str, Any]]) -> List[Dict[str, Any]]:
        """Convert OpenAI tool format to Anthropic tool format."""
        anthropic_tools = []
        for tool_def in tool_definitions:
            if tool_def.get("type") == "function":
                function = tool_def["function"]
                anthropic_tool = {
                    "name": function["name"],
                    "description": function.get("description", ""),
                    "input_schema": function.get("parameters", {})
                }
                anthropic_tools.append(anthropic_tool)
        return anthropic_tools
    
    def _convert_messages_for_anthropic(self, messages: List[Dict[str, Any]]) -> tuple:
        """Convert LiteLLM message format to Anthropic format (system + messages)."""
        system_message = ""
        anthropic_messages = []
        
        for msg in messages:
            if msg.get("role") == "system":
                system_message = msg.get("content", "")
            elif msg.get("role") in ["user", "assistant"]:
                # Handle tool calls in assistant messages
                if msg.get("tool_calls"):
                    content = []
                    if msg.get("content"):
                        content.append({"type": "text", "text": msg["content"]})
                    
                    for tool_call in msg["tool_calls"]:
                        content.append({
                            "type": "tool_use",
                            "id": get_tool_call_id(tool_call),
                            "name": get_tool_call_name(tool_call),
                            "input": json.loads(get_tool_call_arguments(tool_call))
                        })
                    
                    anthropic_messages.append({
                        "role": "assistant",
                        "content": content
                    })
                elif msg.get("content"):
                    anthropic_messages.append({
                        "role": msg["role"],
                        "content": msg["content"]
                    })
            elif msg.get("role") == "tool":
                # Convert tool response
                anthropic_messages.append({
                    "role": "user",
                    "content": [{
                        "type": "tool_result",
                        "tool_use_id": msg["tool_call_id"],
                        "content": msg["content"]
                    }]
                })
        
        return system_message, anthropic_messages
    
    def _extract_json_from_response(self, content: str) -> Optional[Dict[str, Any]]:
        """
        Extract JSON object from response content using multiple strategies.
        
        Args:
            content: The raw response content from the model
            
        Returns:
            Dictionary containing the parsed JSON, or None if no valid JSON found
        """
        if not content:
            return None
        
        # Pre-processing: Fix common Qwen formatting issues
        if "qwen" in self.model_name.lower():
            # Replace {{{{ with { and }}}} with } - Qwen often escapes braces unnecessarily
            content = content.replace('{{{{', '{').replace('}}}}', '}')
            # Remove any remaining triple braces
            content = content.replace('{{{', '{').replace('}}}', '}')
        
        # Strategy 1: Try to parse entire response as JSON
        try:
            result = json.loads(content)
            return result
        except json.JSONDecodeError as e:
            pass
        
        # Strategy 2: Find JSON object within text using regex
        # Look for content that starts with { and ends with } with proper nesting
        import re
        
        # Find all potential JSON objects in the text
        json_pattern = r'\{(?:[^{}]|{[^{}]*})*\}'
        matches = re.findall(json_pattern, content, re.DOTALL)
        
        for match in reversed(matches):  # Try last match first (most likely to be complete)
            try:
                parsed = json.loads(match)
                # Validate it has expected structure
                if isinstance(parsed, dict) and ('message' in parsed or 'formal_recommendation' in parsed):
                    return parsed
            except json.JSONDecodeError:
                continue
        
        # Strategy 3: Try to find JSON between specific markers or at the end
        # Look for JSON that appears after the main text
        lines = content.strip().split('\n')
        for i in range(len(lines)):
            remaining_content = '\n'.join(lines[i:])
            if remaining_content.strip().startswith('{'):
                try:
                    return json.loads(remaining_content.strip())
                except json.JSONDecodeError:
                    continue
        
        # Strategy 4: Extract the largest JSON-like structure
        # Find the longest match that could be JSON
        json_candidates = []
        
        # More comprehensive regex to capture nested JSON
        comprehensive_pattern = r'\{[^{}]*(?:\{[^{}]*\}[^{}]*)*\}'
        comprehensive_matches = re.findall(comprehensive_pattern, content, re.DOTALL)
        
        for match in comprehensive_matches:
            try:
                parsed = json.loads(match)
                if isinstance(parsed, dict):
                    json_candidates.append((len(match), parsed))
            except json.JSONDecodeError:
                continue
        
        if json_candidates:
            # Return the largest valid JSON object
            json_candidates.sort(key=lambda x: x[0], reverse=True)
            return json_candidates[0][1]
        
        return None

    def _convert_anthropic_response_to_litellm_format(self, response) -> Dict[str, Any]:
        """Convert Anthropic response to LiteLLM format."""
        content = ""
        tool_calls = []
        
        if hasattr(response, 'content'):
            for block in response.content:
                if hasattr(block, 'type'):
                    if block.type == "text":
                        content += block.text
                    elif block.type == "tool_use":
                        tool_calls.append({
                            "id": block.id,
                            "type": "function",
                            "function": {
                                "name": block.name,
                                "arguments": json.dumps(block.input)
                            }
                        })
        
        return {
            "role": "assistant",
            "content": content or None,
            "tool_calls": tool_calls if tool_calls else None
        }

    def get_agent_response(self, messages: List[Dict], turn_number: int = 1) -> Dict[str, Any]:
        """
        Gets the agent's response for the current turn, including any necessary tool calls.
        This method will loop until a final response for the user is generated.
        It returns the final message content and a list of tool calls made.
        """
        # print(f"\n🤖 [AGENT DEBUG] Getting agent response...")
        
        
        local_messages = list(messages) # Make a copy to avoid modifying the history in place
        tool_calls_this_turn = []
        turn_token_metrics = []  # Track token metrics for each API call in this turn

        while True:
            try:
                if self.use_direct_client and (self.anthropic_client or self.model_handler.gemini_client):
                    # Use direct client (Anthropic or Gemini)
                    # print(f"🤖 [AGENT DEBUG] Calling {self.provider} API via direct client...")
                    
                    if self.provider == "google":
                        # Use new Gemini client via ModelHandler
                        response_message, usage_stats = self.model_handler.create_completion(
                            messages=local_messages,
                            tools=self.tool_definitions,
                            response_format={"type": "json_object"}
                        )
                        
                        # Create mock response for token tracking
                        mock_response = type('MockResponse', (), {
                            'usage': type('Usage', (), usage_stats)()
                        })()
                        
                        api_call_metrics = self.token_tracker.extract_token_metrics(
                            mock_response, turn_number, self.model_name
                        )
                        turn_token_metrics.append(api_call_metrics)
                        
                    else:
                        # Existing Anthropic handling
                        system_message, anthropic_messages = self._convert_messages_for_anthropic(local_messages)
                        anthropic_tools = self._convert_tools_for_anthropic(self.tool_definitions)
                        
                        # Prepare call parameters
                        call_params = {
                            "model": self.model_name,
                            "messages": anthropic_messages,
                            "max_tokens": 4096,  # Anthropic requires max_tokens
                            **{k: v for k, v in self.model_params.items() if k not in ["model"]}
                        }
                        
                        if system_message:
                            call_params["system"] = system_message
                        
                        if anthropic_tools:
                            call_params["tools"] = anthropic_tools
                        
                        # Remove response_format for Anthropic (not supported)
                        call_params.pop("response_format", None)
                        
                        response = self.anthropic_client.messages.create(**call_params)
                        response_message = self._convert_anthropic_response_to_litellm_format(response)
                        
                        # Create mock response object for token tracking
                        mock_response = type('MockResponse', (), {
                            'usage': type('Usage', (), {
                                'prompt_tokens': getattr(response.usage, 'input_tokens', 0) if hasattr(response, 'usage') else 0,
                                'completion_tokens': getattr(response.usage, 'output_tokens', 0) if hasattr(response, 'usage') else 0,
                                'total_tokens': (getattr(response.usage, 'input_tokens', 0) + getattr(response.usage, 'output_tokens', 0)) if hasattr(response, 'usage') else 0
                            })()
                        })()
                        
                        api_call_metrics = self.token_tracker.extract_token_metrics(
                            mock_response, turn_number, self.model_name
                        )
                        turn_token_metrics.append(api_call_metrics)
                    
                else:
                    # Use ModelHandler for all other models (including vLLM)
                    # Remove response_format for Qwen models - conflicts with thinking mode
                    completion_kwargs = {
                        "messages": local_messages,
                        "tools": self.tool_definitions,
                    }
                    
                    # Only add response_format for non-Qwen models
                    if "qwen" not in self.model_name.lower():
                        completion_kwargs["response_format"] = {"type": "json_object"}
                    
                    response_message, usage_stats = self.model_handler.create_completion(**completion_kwargs)
                    
                    
                    # Create mock response object for token tracking compatibility
                    mock_response = type('MockResponse', (), {
                        'usage': type('Usage', (), usage_stats)()
                    })()
                    
                    # Track token metrics for this API call
                    api_call_metrics = self.token_tracker.extract_token_metrics(
                        mock_response, turn_number, self.model_name
                    )
                    turn_token_metrics.append(api_call_metrics)
                
                # print(f"🤖 [AGENT DEBUG] Received response from {self.provider}")
            except litellm.ContextWindowExceededError as e:
                # Re-raise context window errors to be handled at task level
                raise e
            except Exception as e:
                # Enhanced error handling for different providers
                error_msg = f"Error calling {self.provider} model '{self.model_name}': {e}"
                print(f"❌ [AGENT ERROR] {error_msg}")
                
                # Return error response in expected format
                return {
                    "dialogue": f"I encountered an error: {error_msg}",
                    "formal_recommendation": None,
                    "tool_calls": [],
                    "tool_responses": [],
                    "token_metrics": self._empty_turn_metrics(turn_number)
                }


            if not response_message.get("tool_calls"):
                # print(f"🤖 [AGENT DEBUG] No tool calls in response, returning dialogue")
                
                # Print summary of all tool calls made this turn
                if tool_calls_this_turn:
                    # print(f"\n[AGENT TOOL CALLS SUMMARY] Made {len(tool_calls_this_turn)} tool call(s) this turn:")
                    for i, call in enumerate(tool_calls_this_turn):
                        args = json.loads(get_tool_call_arguments(call)) if get_tool_call_arguments(call) else {}
                        # print(f"  {i+1}. {get_tool_call_name(call)} - Args: {args}")
                        pass
                else:
                    # print(f"\n[AGENT TOOL CALLS SUMMARY] No tool calls made this turn")
                    pass
                
                # Extract ONLY tool responses from this turn (not from conversation history)
                # Tool responses are only the ones we added during this turn's loop
                tool_responses = []
                # Find where the current turn started in local_messages
                turn_start_index = len(messages)  # Everything after the original conversation history
                for i in range(turn_start_index, len(local_messages)):
                    msg = local_messages[i]
                    if isinstance(msg, dict) and msg.get("role") == "tool":
                        tool_responses.append({
                            "tool_call_id": msg.get("tool_call_id"),
                            "name": msg.get("name"),
                            "content": msg.get("content")
                        })
                
                # Parse JSON response to extract formal recommendation
                formal_recommendation = None
                dialogue_content = response_message.get("content")
                
                # Enhanced JSON extraction with multiple strategies
                json_response = self._extract_json_from_response(response_message.get("content"))
                
                if json_response:
                    dialogue_content = json_response.get("message", response_message.get("content"))
                    
                    # Extract formal recommendation
                    formal_rec = json_response.get("formal_recommendation")
                    if formal_rec and formal_rec != "None":
                        formal_recommendation = formal_rec
                        print(f"✅ [JSON] Successfully extracted formal recommendation: {len(formal_rec.get('package_ids', []))} packages")
                    else:
                        print(f"📝 [JSON] Valid JSON found but no formal recommendation")
                else:
                    # No valid JSON found, use original content as dialogue
                    print(f"⚠️ [JSON] No valid JSON structure found in response")
                    # Show a sample of the response for debugging
                    sample_content = response_message.get("content", "")
                    if len(sample_content) > 300:
                        sample_content = sample_content[:300] + "..."
                    print(f"⚠️ [RESPONSE SAMPLE]: {sample_content}")
                    pass
                
                # Calculate aggregated token metrics for this turn
                aggregated_turn_metrics = self._aggregate_turn_token_metrics(
                    turn_token_metrics, turn_number
                )
                
                final_response = {
                    "dialogue": dialogue_content,
                    "formal_recommendation": formal_recommendation,
                    "tool_calls": tool_calls_this_turn,
                    "tool_responses": tool_responses,
                    "token_metrics": aggregated_turn_metrics
                }
                return final_response
            else:
                # Execute tool calls and append results to the local message history
                # print(f"🤖 [AGENT DEBUG] Agent wants to make {len(response_message.get('tool_calls'))} tool call(s)")
                local_messages.append(response_message)
                tool_calls_this_turn.extend(response_message.get("tool_calls"))

                for i, tool_call in enumerate(response_message.get("tool_calls")):
                    # print(f"🤖 [AGENT DEBUG] Processing tool call {i+1}/{len(response_message.get('tool_calls'))}")
                    # print(f"🤖 [AGENT DEBUG] Tool call ID: {tool_call.get('id')}")
                    # print(f"🤖 [AGENT DEBUG] Function name: {tool_call['function']['name']}")
                    # print(f"🤖 [AGENT DEBUG] Raw arguments: {tool_call['function']['arguments']}")
                    
                    try:
                        parsed_args = json.loads(get_tool_call_arguments(tool_call))
                        # print(f"🤖 [AGENT DEBUG] Parsed arguments: {parsed_args}")
                    except json.JSONDecodeError as e:
                        # print(f"❌ [AGENT DEBUG] Failed to parse tool arguments: {e}")
                        parsed_args = {}
                    
                    tool_output = self._execute_tool(
                        get_tool_call_name(tool_call), 
                        parsed_args
                    )
                    local_messages.append({
                        "tool_call_id": get_tool_call_id(tool_call),
                        "role": "tool",
                        "name": get_tool_call_name(tool_call),
                        "content": tool_output,
                    })

    def _aggregate_turn_token_metrics(self, turn_token_metrics: List[Dict[str, Any]], turn_number: int) -> Dict[str, Any]:
        """
        Aggregate token metrics from multiple API calls within a single turn.
        
        Args:
            turn_token_metrics: List of token metrics from each API call in the turn
            turn_number: Current turn number
            
        Returns:
            Aggregated token metrics for the entire turn
        """
        if not turn_token_metrics:
            return self._empty_turn_metrics(turn_number)
        
        # Sum up all token counts across API calls in this turn
        total_prompt_tokens = sum(m.get("prompt_tokens", 0) for m in turn_token_metrics)
        total_completion_tokens = sum(m.get("completion_tokens", 0) for m in turn_token_metrics)
        total_reasoning_tokens = sum(m.get("reasoning_tokens", 0) for m in turn_token_metrics)
        total_visible_tokens = sum(m.get("visible_tokens", 0) for m in turn_token_metrics)
        total_tokens = sum(m.get("total_tokens", 0) for m in turn_token_metrics)
        total_cost = sum(m.get("cost", 0) for m in turn_token_metrics)
        
        # Calculate turn-level metrics
        test_time_compute_ratio = (total_reasoning_tokens / total_completion_tokens) if total_completion_tokens > 0 else 0.0
        
        # Check if any API call used a thinking model
        is_thinking_model = any(m.get("is_thinking_model", False) for m in turn_token_metrics)
        
        return {
            "turn_number": turn_number,
            "model_name": self.model_name,
            "prompt_tokens": total_prompt_tokens,
            "completion_tokens": total_completion_tokens,
            "reasoning_tokens": total_reasoning_tokens,
            "visible_tokens": total_visible_tokens,
            "total_tokens": total_tokens,
            "test_time_compute_ratio": test_time_compute_ratio,
            "cost": total_cost,
            "is_thinking_model": is_thinking_model,
            "api_calls_count": len(turn_token_metrics),
            "api_call_details": turn_token_metrics
        }
    
    def _empty_turn_metrics(self, turn_number: int) -> Dict[str, Any]:
        """Return empty turn metrics structure for error cases."""
        return {
            "turn_number": turn_number,
            "model_name": self.model_name,
            "prompt_tokens": 0,
            "completion_tokens": 0,
            "reasoning_tokens": 0,
            "visible_tokens": 0,
            "total_tokens": 0,
            "test_time_compute_ratio": 0.0,
            "cost": 0.0,
            "is_thinking_model": False,
            "api_calls_count": 0,
            "api_call_details": []
        }
    
    def get_conversation_token_summary(self) -> Dict[str, Any]:
        """
        Get comprehensive token usage summary for the entire conversation.
        
        Returns:
            Dictionary containing conversation-level token analytics
        """
        return self.token_tracker.get_conversation_summary()

    def _create_tool_definitions(self) -> List[Dict[str, Any]]:
        """Creates the OpenAI-compatible tool definitions from the tool list."""
        tool_definitions = []
        
        # Create a mapping of which schemas belong to which tools
        tool_to_schemas = {
            'accommodations': ['accommodations', 'hotel_details', 'room_details', 'location_search'],
            'notebook': ['notebook'],
            'recommender': ['recommender'],
            'utils': ['get_weekday', 'calculate'],
        }
        
        for tool_key in self.tools_list:
            if tool_key in tool_to_schemas:
                for schema_key in tool_to_schemas[tool_key]:
                    if schema_key in self.schemas:
                        schema = dict(self.schemas[schema_key])  # Make a copy
                        schema.pop('inname', None)  # Remove inname if present
                        tool_definitions.append({"type": "function", "function": schema})
        
        return tool_definitions


if __name__ == '__main__':
    # This script is now intended to be used as a module.
    # The main interaction loop is in environment.py
    # print("This script defines the ToolAgent and is not meant to be run directly.")
    # print("Please run 'python utility_benchmark/environment.py' to start an interactive session.")
    pass 