"""
Configuration classes for OfficeArena agents.

This module defines base and derived configuration classes for different agent types,
providing type safety and validation for agent initialization.
"""

import os
from abc import ABC, abstractmethod
from dataclasses import dataclass, field
from typing import Any, Dict, Optional


@dataclass
class AgentConfig(ABC):
    """
    Base configuration class for all OfficeArena agents.

    This class provides common configuration parameters and validation
    that all agents should support.
    """

    # Display configuration
    display_width: int = 1024
    display_height: int = 768

    # Common model parameters
    temperature: float = 0.0
    top_p: float = 1.0

    # Timeout and retry settings
    timeout_seconds: int = 60
    max_retries: int = 3

    # Additional configuration
    extra_config: Dict[str, Any] = field(default_factory=dict)

    @property
    def display_size(self) -> Dict[str, int]:
        """Get display size as dictionary for compatibility."""
        return {"width": self.display_width, "height": self.display_height}

    @abstractmethod
    def validate(self) -> None:
        """Validate the configuration and raise ValueError if invalid."""
        pass

    @abstractmethod
    def to_dict(self) -> Dict[str, Any]:
        """Convert configuration to dictionary format for agent initialization."""
        pass


@dataclass
class CUAConfig(AgentConfig):
    """
    Configuration for Computer Use Agent (CUA) models.

    Supports both Azure OpenAI and standard OpenAI endpoints.
    """

    # Model configuration
    model_name: str = "computer-use-preview"

    # API configuration
    api_key: Optional[str] = None
    base_url: Optional[str] = None
    endpoint: Optional[str] = None  # "azure" for Azure, None for standard OpenAI
    api_version: Optional[str] = None  # Required for Azure

    # CUA-specific settings
    environment: str = "browser"  # "browser" or "desktop"
    truncation: str = "auto"

    def __post_init__(self):
        """Auto-populate from environment variables if not provided."""
        if self.api_key is None:
            self.api_key = os.getenv("CUA_API_KEY") or os.getenv("OPENAI_API_KEY")

        if self.base_url is None:
            self.base_url = os.getenv("CUA_BASE_URL") or os.getenv("OPENAI_BASE_URL")

        if self.endpoint is None:
            self.endpoint = os.getenv("CUA_ENDPOINT")

        if self.api_version is None:
            self.api_version = os.getenv("CUA_API_VERSION", "2025-04-01-preview")

    def validate(self) -> None:
        """Validate CUA configuration."""
        if not self.model_name:
            raise ValueError("model_name is required for CUA agent")

        if self.endpoint == "azure":
            if not self.base_url:
                raise ValueError("base_url is required for Azure endpoint")
            if not self.api_version:
                raise ValueError("api_version is required for Azure endpoint")
        else:
            if not self.api_key:
                raise ValueError("api_key is required for non-Azure endpoints")

        if self.display_width <= 0 or self.display_height <= 0:
            raise ValueError("Display dimensions must be positive")

        if not (0.0 <= self.temperature <= 2.0):
            raise ValueError("Temperature must be between 0.0 and 2.0")

        if not (0.0 <= self.top_p <= 1.0):
            raise ValueError("top_p must be between 0.0 and 1.0")

    def to_dict(self) -> Dict[str, Any]:
        """Convert to dictionary format for CUA agent initialization."""
        return {
            "model_name": self.model_name,
            "api_key": self.api_key,
            "base_url": self.base_url,
            "endpoint": self.endpoint,
            "api_version": self.api_version,
            "display_size": self.display_size,
            "temperature": self.temperature,
            "top_p": self.top_p,
            "environment": self.environment,
            "truncation": self.truncation,
            **self.extra_config,
        }


@dataclass
class UITARSConfig(AgentConfig):
    """
    Configuration for UI-TARS agent.

    UI-TARS uses HTTP API endpoints for model inference.
    """

    # Model configuration
    model_name: str = "uitars-v1"

    # API configuration
    endpoint_url: str = ""
    token: Optional[str] = None

    # UI-TARS specific settings
    scroll_step: int = 10
    wait_duration: int = 5  # seconds

    def __post_init__(self):
        """Auto-populate from environment variables if not provided."""
        if not self.endpoint_url:
            self.endpoint_url = os.getenv("UITARS_ENDPOINT_URL", "")

        if self.token is None:
            self.token = os.getenv("UITARS_TOKEN")

    def validate(self) -> None:
        """Validate UI-TARS configuration."""
        if not self.endpoint_url:
            raise ValueError("endpoint_url is required for UI-TARS agent")

        if not self.token:
            raise ValueError("token is required for UI-TARS agent")

        if self.display_width <= 0 or self.display_height <= 0:
            raise ValueError("Display dimensions must be positive")

        if self.scroll_step <= 0:
            raise ValueError("scroll_step must be positive")

        if self.wait_duration <= 0:
            raise ValueError("wait_duration must be positive")

    def to_dict(self) -> Dict[str, Any]:
        """Convert to dictionary format for UI-TARS agent initialization."""
        return {
            "model_name": self.model_name,
            "endpoint_url": self.endpoint_url,
            "token": self.token,
            "display_size": self.display_size,
            "scroll_step": self.scroll_step,
            "wait_duration": self.wait_duration,
            **self.extra_config,
        }


@dataclass
class ClaudeConfig(AgentConfig):
    """
    Configuration for Claude agent using Anthropic's API.

    Supports both direct Anthropic API and litellm for unified interface.
    """

    # Model configuration
    model_name: str = "claude-3-5-sonnet-20241022"

    # API configuration
    api_key: Optional[str] = None
    base_url: Optional[str] = None

    # Claude-specific settings
    max_tokens: int = 32768
    use_litellm: bool = True

    # Computer use settings
    computer_use_enabled: bool = True

    def __post_init__(self):
        """Auto-populate from environment variables if not provided."""
        if self.api_key is None:
            self.api_key = os.getenv("ANTHROPIC_API_KEY") or os.getenv("CLAUDE_API_KEY")

        if self.base_url is None:
            self.base_url = os.getenv("ANTHROPIC_BASE_URL") or os.getenv("CLAUDE_BASE_URL")

    def validate(self) -> None:
        """Validate Claude configuration."""
        if not self.model_name:
            raise ValueError("model_name is required for Claude agent")

        if not self.api_key:
            raise ValueError("api_key is required for Claude agent")

        if self.display_width <= 0 or self.display_height <= 0:
            raise ValueError("Display dimensions must be positive")

        if not (0.0 <= self.temperature <= 1.0):
            raise ValueError("Temperature must be between 0.0 and 1.0")

        if not (0.0 <= self.top_p <= 1.0):
            raise ValueError("top_p must be between 0.0 and 1.0")

        if self.max_tokens <= 0:
            raise ValueError("max_tokens must be positive")

    def to_dict(self) -> Dict[str, Any]:
        """Convert to dictionary format for Claude agent initialization."""
        return {
            "model_name": self.model_name,
            "api_key": self.api_key,
            "base_url": self.base_url,
            "display_size": self.display_size,
            "temperature": self.temperature,
            "top_p": self.top_p,
            "max_tokens": self.max_tokens,
            "use_litellm": self.use_litellm,
            "computer_use_enabled": self.computer_use_enabled,
            **self.extra_config,
        }


@dataclass
class Qwen3VLConfig(AgentConfig):
    """
    Configuration for Qwen3VL agent.

    Uses litellm as the unified API backend. The model name should follow
    litellm's naming convention (e.g., "qwen/qwen3-vl" for DashScope,
    "openai/qwen3-vl" for OpenAI-compatible endpoints).
    """

    # Model configuration (use litellm model naming: provider/model)
    model_name: str = "qwen/qwen3-vl"

    # API configuration
    api_key: Optional[str] = None
    base_url: Optional[str] = None

    # Model parameters
    max_tokens: int = 32768
    top_p: float = 0.9

    # Thinking mode (for supported providers)
    enable_thinking: bool = False
    thinking_budget: int = 32768

    # Agent behavior
    history_n: int = 4  # Number of history steps to include
    coordinate_type: str = "relative"  # "relative" or "absolute"

    def __post_init__(self):
        """Auto-populate from environment variables if not provided."""
        if self.api_key is None:
            # Try provider-specific env vars first, then generic
            self.api_key = os.getenv("DASHSCOPE_API_KEY") or os.getenv("QWEN_API_KEY") or os.getenv("OPENAI_API_KEY")

        if self.base_url is None:
            self.base_url = os.getenv("DASHSCOPE_BASE_URL") or os.getenv("QWEN_BASE_URL") or os.getenv("OPENAI_BASE_URL")

    def validate(self) -> None:
        """Validate Qwen3VL configuration."""
        if not self.model_name:
            raise ValueError("model_name is required for Qwen3VL agent")

        if not self.api_key:
            raise ValueError("api_key is required for Qwen3VL agent")

        if self.display_width <= 0 or self.display_height <= 0:
            raise ValueError("Display dimensions must be positive")

        if self.coordinate_type not in ["relative", "absolute"]:
            raise ValueError("coordinate_type must be 'relative' or 'absolute'")

        if self.history_n < 0:
            raise ValueError("history_n must be non-negative")

        if not (0.0 <= self.temperature <= 2.0):
            raise ValueError("Temperature must be between 0.0 and 2.0")

        if not (0.0 <= self.top_p <= 1.0):
            raise ValueError("top_p must be between 0.0 and 1.0")

    def to_dict(self) -> Dict[str, Any]:
        """Convert to dictionary format for Qwen3VL agent initialization."""
        return {
            "model_name": self.model_name,
            "api_key": self.api_key,
            "base_url": self.base_url,
            "display_size": self.display_size,
            "temperature": self.temperature,
            "top_p": self.top_p,
            "max_tokens": self.max_tokens,
            "enable_thinking": self.enable_thinking,
            "thinking_budget": self.thinking_budget,
            "history_n": self.history_n,
            "coordinate_type": self.coordinate_type,
            **self.extra_config,
        }


@dataclass
class OpenCUAConfig(AgentConfig):
    """
    Configuration for OpenCUA agent.

    OpenCUA is a GUI agent that uses PyAutoGUI-based actions.
    Ported from OSWorld implementation.
    """

    # Model configuration (use litellm model naming: provider/model)
    model_name: str = "openai/opencua-7b"

    # API configuration
    api_key: Optional[str] = None
    base_url: Optional[str] = None

    # Model parameters
    max_tokens: int = 8096
    top_p: float = 0.9

    display_width: int = 1920
    display_height: int = 1080

    # OpenCUA-specific settings
    coordinate_type: str = "absolute"  # "relative" or "qwen25" or "absolute"
    cot_level: str = "l2"  # Chain-of-thought level: "l1", "l2", or "l3"
    history_type: str = "thought_history"  # "action_history", "thought_history", "observation_history"
    max_image_history_length: int = 3  # Number of screenshots to include in history
    max_steps: int = 30  # Maximum number of steps before forcing termination
    password: str = "password"  # Computer password for sudo operations
    use_old_sys_prompt: bool = True  # Use V1 system prompts (for 7B/32B models)

    def __post_init__(self):
        """Auto-populate from environment variables if not provided."""
        if self.api_key is None:
            self.api_key = os.getenv("OPENCUA_API_KEY") or os.getenv("OPENAI_API_KEY")

        if self.base_url is None:
            self.base_url = os.getenv("OPENCUA_BASE_URL") or os.getenv("OPENAI_BASE_URL")

    def validate(self) -> None:
        """Validate OpenCUA configuration."""
        if not self.model_name:
            raise ValueError("model_name is required for OpenCUA agent")

        if not self.api_key:
            raise ValueError("api_key is required for OpenCUA agent")

        if self.display_width <= 0 or self.display_height <= 0:
            raise ValueError("Display dimensions must be positive")

        if self.coordinate_type not in ["relative", "qwen25", "absolute"]:
            raise ValueError("coordinate_type must be 'relative' or 'qwen25' or 'absolute'")

        if self.cot_level not in ["l1", "l2", "l3"]:
            raise ValueError("cot_level must be 'l1', 'l2', or 'l3'")

        if self.history_type not in ["action_history", "thought_history", "observation_history"]:
            raise ValueError("history_type must be 'action_history', 'thought_history', or 'observation_history'")

        if self.max_image_history_length < 0:
            raise ValueError("max_image_history_length must be non-negative")

        if self.max_steps <= 0:
            raise ValueError("max_steps must be positive")

        if not (0.0 <= self.temperature <= 2.0):
            raise ValueError("Temperature must be between 0.0 and 2.0")

        if not (0.0 <= self.top_p <= 1.0):
            raise ValueError("top_p must be between 0.0 and 1.0")

    def to_dict(self) -> Dict[str, Any]:
        """Convert to dictionary format for OpenCUA agent initialization."""
        return {
            "model_name": self.model_name,
            "api_key": self.api_key,
            "base_url": self.base_url,
            "display_size": self.display_size,
            "temperature": self.temperature,
            "top_p": self.top_p,
            "max_tokens": self.max_tokens,
            "coordinate_type": self.coordinate_type,
            "cot_level": self.cot_level,
            "history_type": self.history_type,
            "max_image_history_length": self.max_image_history_length,
            "max_steps": self.max_steps,
            "password": self.password,
            "use_old_sys_prompt": self.use_old_sys_prompt,
            **self.extra_config,
        }


# Factory function for creating configurations
def create_agent_config(agent_type: str, **kwargs) -> AgentConfig:
    """
    Factory function to create agent configurations.

    Args:
        agent_type: Type of agent ("cua", "uitars", "claude", "qwen3vl", "opencua")
        **kwargs: Configuration parameters

    Returns:
        Configured agent config instance

    Raises:
        ValueError: If agent_type is not supported
    """
    agent_type = agent_type.lower()

    if agent_type == "cua":
        return CUAConfig(**kwargs)
    elif agent_type == "uitars":
        return UITARSConfig(**kwargs)
    elif agent_type == "claude":
        return ClaudeConfig(**kwargs)
    elif agent_type == "qwen3vl":
        return Qwen3VLConfig(**kwargs)
    elif agent_type == "opencua":
        return OpenCUAConfig(**kwargs)
    else:
        raise ValueError(f"Unsupported agent type: {agent_type}. Supported types: cua, uitars, claude, qwen3vl, opencua")


# Utility functions for configuration validation
def validate_all_configs(*configs: AgentConfig) -> None:
    """Validate multiple configurations at once."""
    for config in configs:
        config.validate()


def merge_config_dict(config: AgentConfig, override_dict: Dict[str, Any]) -> Dict[str, Any]:
    """
    Merge a configuration with override dictionary.

    Args:
        config: Base configuration
        override_dict: Dictionary of values to override

    Returns:
        Merged configuration dictionary
    """
    merged = config.to_dict()
    merged.update(override_dict)
    return merged
