"""
API Clients for Non-Agentic Model Evaluation

Provides unified interface for different AI provider APIs with multi-turn conversation support:
- OpenAI Responses API (context via previous_response_id)
- Grok/xAI API (context via previous_response_id)
- Gemini API (context via thought signatures)
- DeepSeek via Fireworks API

Each client maintains conversation context and handles provider-specific details.
"""

import os
import logging
import asyncio
from abc import ABC, abstractmethod
from typing import Dict, Any, List, Optional, Tuple
from dataclasses import dataclass

logger = logging.getLogger(__name__)


@dataclass
class APIResponse:
    """
    Standardized response from any API provider.

    Attributes:
        content: The text response from the model
        context: Provider-specific context for next turn (response_id, signatures, etc.)
        raw_response: Full raw response object for debugging
        error: Error message if request failed
    """
    content: str
    context: Optional[Dict[str, Any]] = None
    raw_response: Optional[Any] = None
    error: Optional[str] = None


class BaseAPIClient(ABC):
    """
    Abstract base class for all API clients.

    Provides common interface for multi-turn conversations with different providers.
    """

    def __init__(self, model_name: str, api_key: str, model_args: Dict[str, Any],
                 reasoning_args: Dict[str, Any]):
        """
        Initialize API client.

        Args:
            model_name: Model identifier (e.g., "gpt-5-preview")
            api_key: API key for authentication
            model_args: Client initialization parameters
            reasoning_args: Evaluation parameters (reasoning_effort, tools, etc.)
        """
        self.model_name = model_name
        self.api_key = api_key
        self.model_args = model_args
        self.reasoning_args = reasoning_args
        self.conversation_context = None  # Tracks context across turns

    @abstractmethod
    async def send_message(self, message: str, context: Optional[Dict[str, Any]] = None) -> APIResponse:
        """
        Send a message and get response.

        Args:
            message: User message to send
            context: Context from previous turn (optional)

        Returns:
            APIResponse with content and context for next turn
        """
        pass

    async def multi_turn_conversation(self, messages: List[str]) -> List[APIResponse]:
        """
        Conduct a multi-turn conversation.

        Args:
            messages: List of user messages to send sequentially

        Returns:
            List of responses, one per message
        """
        responses = []
        context = None

        for msg in messages:
            response = await self.send_message(msg, context)
            responses.append(response)

            if response.error:
                logger.error(f"Error in conversation: {response.error}")
                break

            # Update context for next turn
            context = response.context

        return responses


class OpenAIResponsesClient(BaseAPIClient):
    """
    OpenAI Responses API client with reasoning context preservation.

    Uses previous_response_id to maintain reasoning tokens across turns.
    Supports web_search and code_interpreter tools.
    """

    def __init__(self, model_name: str, api_key: str, model_args: Dict[str, Any],
                 reasoning_args: Dict[str, Any]):
        super().__init__(model_name, api_key, model_args, reasoning_args)

        # Import OpenAI client
        from openai import AsyncOpenAI
        import httpx

        # Configure with explicit timeout and retry settings
        # Using 3600s (1 hour) timeout for complex reasoning with tools
        # max_retries=4 to handle transient 500 errors
        self.client = AsyncOpenAI(
            api_key=api_key,
            timeout=httpx.Timeout(
                connect=10.0,
                read=3600.0,    # 1 hour for reasoning + tools
                write=3600.0,
                pool=3600.0
            ),
            max_retries=4  # Up from default of 2
        )

        # Extract tool configuration
        self.tools = reasoning_args.get('tools', [])
        self.reasoning_effort = reasoning_args.get('reasoning_effort', 'high')

    async def send_message(self, message: str, context: Optional[Dict[str, Any]] = None) -> APIResponse:
        """
        Send message via OpenAI Responses API.

        Args:
            message: User message
            context: Dict with 'previous_response_id' if continuing conversation

        Returns:
            APIResponse with response_id in context
        """
        try:
            # Build request parameters
            request_params = {
                'model': self.model_name,
                'input': message,  # Responses API uses 'input', not 'messages'
                'reasoning': {'effort': self.reasoning_effort},  # Nested structure
                **self.model_args  # Additional model-specific args
            }

            # Add tools if specified
            if self.tools:
                # Map tool configurations to API format
                tool_types = []
                for tool in self.tools:
                    tool_type = tool.get('type') if isinstance(tool, dict) else tool

                    if tool_type == 'web_search':
                        tool_types.append({'type': 'web_search'})
                    elif tool_type == 'code_interpreter':
                        # Code interpreter requires container parameter
                        tool_types.append({
                            'type': 'code_interpreter',
                            'container': {'type': 'auto'}
                        })

                if tool_types:
                    request_params['tools'] = tool_types

            # Add context from previous turn
            if context and 'previous_response_id' in context:
                request_params['previous_response_id'] = context['previous_response_id']
                logger.debug(f"Using previous_response_id: {context['previous_response_id']}")

            # Make API call
            logger.info(f"OpenAI Responses API call to {self.model_name}")
            response = await self.client.responses.create(**request_params)

            # Log request ID for debugging 500 errors
            if hasattr(response, 'id'):
                logger.info(f"OpenAI Request ID: {response.id}")

            # Extract content from response
            content = self._extract_content(response)

            # Build context for next turn
            next_context = {
                'previous_response_id': response.id
            }

            logger.info(f"OpenAI response complete, content length: {len(content)}")

            return APIResponse(
                content=content,
                context=next_context,
                raw_response=response
            )

        except Exception as e:
            # Enhanced error logging
            logger.error(f"OpenAI API error: {str(e)}")
            logger.error(f"Error type: {type(e).__name__}")
            logger.error(f"Model: {self.model_name}")
            logger.error(f"Tools: {self.tools}")
            logger.error(f"Reasoning effort: {self.reasoning_effort}")
            if hasattr(e, 'response'):
                logger.error(f"Response status: {getattr(e.response, 'status_code', 'N/A')}")
                logger.error(f"Response body: {getattr(e.response, 'text', 'N/A')[:500]}")
            return APIResponse(
                content="",
                error=f"OpenAI API error: {str(e)}"
            )

    def _extract_content(self, response) -> str:
        """
        Extract text content from OpenAI Responses API response.

        Args:
            response: OpenAI response object

        Returns:
            Text content
        """
        try:
            # Responses API provides output_text directly
            if hasattr(response, 'output_text'):
                return response.output_text

            # Fallback: Parse output array
            if hasattr(response, 'output') and response.output:
                for item in response.output:
                    if hasattr(item, 'type') and item.type == 'message':
                        # Message item has content list
                        if hasattr(item, 'content') and item.content:
                            for content_item in item.content:
                                if hasattr(content_item, 'text'):
                                    return content_item.text

            # Fallback to Chat Completions format
            if hasattr(response, 'choices') and response.choices:
                return response.choices[0].message.content

            return str(response)

        except Exception as e:
            logger.error(f"Error extracting content: {str(e)}")
            return str(response)


class GrokAPIClient(BaseAPIClient):
    """
    Grok/xAI API client with reasoning support.

    Uses OpenAI-compatible API with reasoning_effort parameter.
    May use Responses API if available for context preservation.
    """

    def __init__(self, model_name: str, api_key: str, model_args: Dict[str, Any],
                 reasoning_args: Dict[str, Any]):
        super().__init__(model_name, api_key, model_args, reasoning_args)

        # Import OpenAI client (xAI uses OpenAI-compatible API)
        from openai import AsyncOpenAI
        import httpx

        # Configure with explicit timeout and retry settings
        # Using 3600s (1 hour) timeout as recommended by xAI docs
        # max_retries=4 to handle transient errors
        self.client = AsyncOpenAI(
            api_key=api_key,
            base_url="https://api.x.ai/v1",
            timeout=httpx.Timeout(
                connect=10.0,
                read=3600.0,    # 1 hour as recommended by xAI
                write=3600.0,
                pool=3600.0
            ),
            max_retries=4
        )

        # Extract configuration
        self.tools = reasoning_args.get('tools', [])
        self.reasoning_effort = reasoning_args.get('reasoning_effort', 'high')

    async def send_message(self, message: str, context: Optional[Dict[str, Any]] = None) -> APIResponse:
        """
        Send message via Grok API.

        For grok-3-mini: Uses reasoning_effort parameter
        For grok-4: Native tool use and search integration

        Args:
            message: User message
            context: Dict with 'previous_response_id' if continuing conversation

        Returns:
            APIResponse
        """
        try:
            # Try Responses API first (if available)
            if hasattr(self.client, 'responses'):
                return await self._send_via_responses_api(message, context)
            else:
                return await self._send_via_chat_api(message, context)

        except Exception as e:
            # Enhanced error logging
            logger.error(f"Grok API error: {str(e)}")
            logger.error(f"Error type: {type(e).__name__}")
            logger.error(f"Model: {self.model_name}")
            if hasattr(e, 'response'):
                logger.error(f"Response status: {getattr(e.response, 'status_code', 'N/A')}")
                logger.error(f"Response body: {getattr(e.response, 'text', 'N/A')[:500]}")
            return APIResponse(
                content="",
                error=f"Grok API error: {str(e)}"
            )

    async def _send_via_responses_api(self, message: str, context: Optional[Dict[str, Any]] = None) -> APIResponse:
        """Send via Responses API (preferred for context preservation)."""
        request_params = {
            'model': self.model_name,
            'input': message,  # Responses API uses 'input', not 'messages'
            **self.model_args
        }

        # Note: Grok does not support reasoning_effort parameter in Responses API
        # The model has built-in reasoning capabilities

        # Add context
        if context and 'previous_response_id' in context:
            request_params['previous_response_id'] = context['previous_response_id']

        logger.info(f"Grok Responses API call to {self.model_name}")
        response = await self.client.responses.create(**request_params)

        # Log request ID for debugging
        if hasattr(response, 'id'):
            logger.info(f"Grok Request ID: {response.id}")

        content = self._extract_content_from_responses(response)

        logger.info(f"Grok response complete, content length: {len(content)}")

        return APIResponse(
            content=content,
            context={'previous_response_id': response.id},
            raw_response=response
        )

    async def _send_via_chat_api(self, message: str, context: Optional[Dict[str, Any]] = None) -> APIResponse:
        """Send via Chat Completions API (fallback)."""
        # Build message history from context
        messages = []
        if context and 'message_history' in context:
            messages = context['message_history']
        messages.append({'role': 'user', 'content': message})

        request_params = {
            'model': self.model_name,
            'messages': messages,
            **self.model_args
        }

        # Add reasoning_effort for grok-3-mini
        if 'grok-3-mini' in self.model_name:
            request_params['reasoning_effort'] = self.reasoning_effort

        logger.info(f"Grok Chat API call to {self.model_name}")
        response = await self.client.chat.completions.create(**request_params)

        content = response.choices[0].message.content

        # Update message history
        messages.append({'role': 'assistant', 'content': content})

        return APIResponse(
            content=content,
            context={'message_history': messages},
            raw_response=response
        )

    def _extract_content_from_responses(self, response) -> str:
        """Extract content from Responses API response."""
        try:
            # Use output_text directly (same as OpenAI)
            if hasattr(response, 'output_text'):
                return response.output_text

            # Fallback to parsing output array
            if hasattr(response, 'output') and response.output:
                for item in response.output:
                    if hasattr(item, 'content'):
                        return item.content
            return str(response)
        except:
            return str(response)


class GeminiAPIClient(BaseAPIClient):
    """
    Google Gemini API client with thinking mode and thought signatures.

    Uses google.genai SDK (not google.generativeai).
    Requires function declarations to enable thought signatures.
    Maintains context by passing full conversation history including all parts.
    """

    def __init__(self, model_name: str, api_key: str, model_args: Dict[str, Any],
                 reasoning_args: Dict[str, Any]):
        super().__init__(model_name, api_key, model_args, reasoning_args)

        # Import new Gemini SDK
        from google import genai
        from google.genai import types

        self.client = genai.Client(api_key=api_key)
        self.types = types

        # Dummy function declaration to enable thought signatures
        # (Required by Gemini API - must use function calling)
        self.tools = [
            types.Tool(
                function_declarations=[
                    types.FunctionDeclaration(
                        name='placeholder',
                        description='Placeholder function to enable thought signatures',
                        parameters={'type': 'object', 'properties': {}}
                    )
                ]
            )
        ]

        # Build generation config
        self.config = types.GenerateContentConfig(
            thinking_config=types.ThinkingConfig(
                include_thoughts=True
            ),
            tools=self.tools,
            **model_args
        )

    async def send_message(self, message: str, context: Optional[Dict[str, Any]] = None) -> APIResponse:
        """
        Send message via Gemini API with thought signatures.

        Args:
            message: User message
            context: Dict with 'conversation_history' containing full history

        Returns:
            APIResponse with conversation history in context
        """
        try:
            # Build conversation content
            conversation = []

            # Add previous conversation history (including thought signatures)
            if context and 'conversation_history' in context:
                conversation = context['conversation_history']

            # Add new user message
            conversation.append(
                self.types.Content(
                    role='user',
                    parts=[self.types.Part(text=message)]
                )
            )

            # Generate response
            logger.info(f"Gemini API call to {self.model_name}")
            response = await asyncio.to_thread(
                self.client.models.generate_content,
                model=self.model_name,
                contents=conversation,
                config=self.config
            )

            # Extract text content
            content = response.text if hasattr(response, 'text') else str(response)

            # Build context with full conversation including model response
            # IMPORTANT: Must include ALL parts (including thought signatures)
            next_history = conversation + [response.candidates[0].content]

            return APIResponse(
                content=content,
                context={'conversation_history': next_history},
                raw_response=response
            )

        except Exception as e:
            logger.error(f"Gemini API error: {str(e)}")
            return APIResponse(
                content="",
                error=f"Gemini API error: {str(e)}"
            )


class FireworksDeepSeekClient(BaseAPIClient):
    """
    DeepSeek via Fireworks AI API client.

    Uses OpenAI-compatible API. May support thinking mode and/or Responses API.
    """

    def __init__(self, model_name: str, api_key: str, model_args: Dict[str, Any],
                 reasoning_args: Dict[str, Any]):
        super().__init__(model_name, api_key, model_args, reasoning_args)

        # Import OpenAI client (Fireworks uses OpenAI-compatible API)
        from openai import AsyncOpenAI

        # Fireworks base URL (same as Inspect AI uses)
        self.client = AsyncOpenAI(
            api_key=api_key,
            base_url="https://api.fireworks.ai/inference/v1"
        )

        # Extract configuration
        self.enable_thinking = reasoning_args.get('enable_thinking', True)

    async def send_message(self, message: str, context: Optional[Dict[str, Any]] = None) -> APIResponse:
        """
        Send message via Fireworks/DeepSeek API.

        Args:
            message: User message
            context: Context from previous turn

        Returns:
            APIResponse
        """
        try:
            # Check if Responses API is supported
            if hasattr(self.client, 'responses'):
                return await self._send_via_responses_api(message, context)
            else:
                return await self._send_via_chat_api(message, context)

        except Exception as e:
            logger.error(f"Fireworks/DeepSeek API error: {str(e)}")
            return APIResponse(
                content="",
                error=f"Fireworks/DeepSeek API error: {str(e)}"
            )

    async def _send_via_responses_api(self, message: str, context: Optional[Dict[str, Any]] = None) -> APIResponse:
        """Send via Responses API if supported."""
        request_params = {
            'model': self.model_name,
            'input': message,  # Responses API uses 'input', not 'messages'
            'reasoning': {'effort': 'high'},  # DeepSeek supports reasoning
            **self.model_args
        }

        if context and 'previous_response_id' in context:
            request_params['previous_response_id'] = context['previous_response_id']

        logger.info(f"Fireworks Responses API call to {self.model_name}")
        response = await self.client.responses.create(**request_params)

        content = self._extract_content_from_responses(response)

        return APIResponse(
            content=content,
            context={'previous_response_id': response.id},
            raw_response=response
        )

    async def _send_via_chat_api(self, message: str, context: Optional[Dict[str, Any]] = None) -> APIResponse:
        """Send via Chat Completions API."""
        messages = []
        if context and 'message_history' in context:
            messages = context['message_history']
        messages.append({'role': 'user', 'content': message})

        request_params = {
            'model': self.model_name,
            'messages': messages,
            **self.model_args
        }

        logger.info(f"Fireworks Chat API call to {self.model_name}")
        response = await self.client.chat.completions.create(**request_params)

        content = response.choices[0].message.content
        messages.append({'role': 'assistant', 'content': content})

        return APIResponse(
            content=content,
            context={'message_history': messages},
            raw_response=response
        )

    def _extract_content_from_responses(self, response) -> str:
        """Extract content from Responses API response."""
        try:
            # Use output_text directly (same as OpenAI/Grok)
            if hasattr(response, 'output_text'):
                return response.output_text

            # Fallback to parsing output array
            if hasattr(response, 'output') and response.output:
                for item in response.output:
                    if hasattr(item, 'content'):
                        return item.content
            return str(response)
        except:
            return str(response)


def create_api_client(company_name: str, model_name: str, api_key: str,
                      model_args: Dict[str, Any], reasoning_args: Dict[str, Any]) -> BaseAPIClient:
    """
    Factory function to create appropriate API client based on company.

    Args:
        company_name: Company identifier (openai, xai, google, fireworks)
        model_name: Model identifier
        api_key: API key
        model_args: Client initialization parameters
        reasoning_args: Evaluation parameters

    Returns:
        Appropriate API client instance
    """
    company_lower = company_name.lower()

    if company_lower == 'openai':
        return OpenAIResponsesClient(model_name, api_key, model_args, reasoning_args)
    elif company_lower in ['xai', 'grok']:
        return GrokAPIClient(model_name, api_key, model_args, reasoning_args)
    elif company_lower in ['google', 'gemini']:
        return GeminiAPIClient(model_name, api_key, model_args, reasoning_args)
    elif company_lower == 'fireworks':
        return FireworksDeepSeekClient(model_name, api_key, model_args, reasoning_args)
    else:
        raise ValueError(f"Unsupported company: {company_name}")
