import os
import requests
import time
import math
import json
import sys
from typing import List, Dict, Any, Optional, Tuple, Union

# Import the framework components
from core.clients.openrouter_client import OpenRouterClient

class TalkerAblation:
    """
    Modified Talker for threads-only ablation.
    This version accepts thread outputs directly instead of consolidated insights.
    """
    
    def __init__(self,
                 client: OpenRouterClient,
                 model: str = "openai/gpt-4o"):
        """
        Initialize the Talker component for threads-only ablation.
        
        Args:
            client: OpenRouter client for API calls
            model: Model identifier to use for responses
        """
        self.client = client
        self.model = model
        
        # Modified system prompt that references monologue threads instead of internal narrative
        self.system_prompt = """
        I am the voice of a unified cognitive AI system engaging in helpful, honest conversation.

        I will receive:
        1. The current user message requiring an immediate response
        2. Structured MONOLOGUE THREADS that contain insights based on PREVIOUS exchanges

        The Monologue Threads reflect my (the AI system's) thinking about PAST interactions, not the current message. These threads include:
        - Reasoning Thread: Logical analysis and problem-solving insights
        - Memory Thread: Important context and information to remember
        - Goal Thread: Understanding of user intentions and objectives

        I will use these threads as background wisdom while focusing primarily on the current user message.

        I will balance my response by:
        1. Addressing the CURRENT user message directly and completely
        2. Drawing on relevant insights from the Monologue Threads
        3. Maintaining conversation continuity across turns
        4. Recognizing that the Monologue Threads are retrospective rather than specific to the current query

        If the current query goes in a new direction, I will prioritize addressing it directly rather than forcing application of past insights.
        """

    def respond(self, 
               conversation_history: List[Dict[str, str]], 
               thread_outputs: Optional[Union[str, List[Dict[str, str]]]] = None) -> str:
        """
        Generate a response to the user based on conversation history and thread outputs.
        
        Args:
            conversation_history: List of message dictionaries with role and content
            thread_outputs: Thread outputs (either formatted string or list of thread dicts)
            
        Returns:
            The generated response as a string
        """
        try:
            # Construct messages for the model
            messages = []
            
            # Start with the system prompt
            messages.append({"role": "system", "content": self.system_prompt})
            
            # Add thread outputs as a system message if available
            if thread_outputs:
                if isinstance(thread_outputs, str):
                    # Already formatted as string
                    thread_message = thread_outputs
                elif isinstance(thread_outputs, list):
                    # Format thread outputs from list
                    formatted_threads = []
                    for thread in thread_outputs:
                        thread_name = thread.get("name", "Unknown Thread")
                        thread_output = thread.get("output", "No output")
                        formatted_threads.append(f"**{thread_name}**:\n{thread_output}")
                    thread_message = "\n\n".join(formatted_threads)
                else:
                    thread_message = str(thread_outputs)
                    
                messages.append({
                    "role": "system", 
                    "content": f"My Current Monologue Threads:\n{thread_message}"
                })
            
            # Add conversation history
            messages.extend(conversation_history)
            
            # Generate response
            api_params = {
                "model": self.model,
                "messages": messages,
                "temperature": 0.7,
                "max_tokens": 4096
            }
            
            # Log the API call for debugging
            print(f"Calling OpenRouter API (threads-only ablation)")
            sys.stdout.flush()
            
            response = self.client.generate(**api_params)
            
            # Extract the actual content from the response
            if isinstance(response, dict):
                # Handle OpenRouter response format
                if "choices" in response and len(response["choices"]) > 0:
                    message = response["choices"][0].get("message", {})
                    content = message.get("content", "")
                    
                    # If content is empty but there's a reasoning field, use that
                    if not content and "reasoning" in message:
                        content = message["reasoning"]
                    
                    if content:
                        return content
                    else:
                        print(f"WARNING: Empty content in response: {response}")
                        return "I apologize, but I couldn't generate a response."
                else:
                    print(f"WARNING: Unexpected response format: {response}")
                    return "I apologize, but I encountered an error generating a response."
            else:
                # If response is already a string, return it
                return str(response)
                
        except Exception as e:
            print(f"ERROR in Talker.respond: {str(e)}")
            sys.stdout.flush()
            return f"I apologize, but I encountered an error: {str(e)}"
    
    # Alias for compatibility
    def generate_response(self, conversation_history: List[Dict[str, str]], 
                         cognitive_insights: Optional[Any] = None) -> str:
        """Alias for respond() to maintain compatibility."""
        # Convert cognitive_insights parameter name to thread_outputs
        return self.respond(conversation_history, thread_outputs=cognitive_insights) 