#!/usr/bin/env python3
import os
from typing import Optional, TypeVar, Type
import anthropic
from pydantic import BaseModel
from tenacity import retry, stop_after_attempt, wait_exponential, retry_if_exception

T = TypeVar('T', bound=BaseModel)


class ClaudeLLM:
    def __init__(self, api_key: Optional[str] = None, model: str = 'claude-sonnet-4-20250514'):
        self.api_key = api_key or os.getenv('ANTHROPIC_API_KEY')
        if not self.api_key:
            raise ValueError(
                'Claude API key required. Set ANTHROPIC_API_KEY environment variable or pass api_key parameter'
            )
        self.client = anthropic.Anthropic(api_key=self.api_key)
        self.async_client = anthropic.AsyncAnthropic(api_key=self.api_key)
        self.model = model
        print(f'Claude initialized: {self.model}')

    def _is_rate_limit_error(self, error) -> bool:
        if hasattr(error, 'status_code') and error.status_code == 429:
            return True
        if hasattr(error, 'message'):
            error_msg = str(error.message).lower()
            return any(
                (phrase in error_msg for phrase in ['rate limit', 'quota', 'too many requests', 'limit exceeded'])
            )
        return False

    def _get_retry_decorator(self):
        return retry(
            retry=retry_if_exception(self._is_rate_limit_error),
            wait=wait_exponential(multiplier=1, min=10, max=120),
            stop=stop_after_attempt(6),
            reraise=True,
        )

    def chat(self, messages: list, max_tokens: int = 4000, temperature: float = 0.1) -> str:
        @self._get_retry_decorator()
        def _make_api_call():
            response = self.client.messages.create(
                model=self.model, max_tokens=max_tokens, temperature=temperature, messages=messages
            )
            return response.content[0].text

        return _make_api_call()

    def count_tokens(self, text: str) -> int:
        response = self.client.messages.count_tokens(model=self.model, messages=[{'role': 'user', 'content': text}])
        return response.input_tokens

    def chat_structured(
        self, messages: list, response_model: Type[T], max_tokens: int = 4000, temperature: float = 0.1
    ) -> T:
        schema = response_model.model_json_schema()
        tool_name = f'provide_{response_model.__name__.lower()}'
        tool = {
            'name': tool_name,
            'description': f'Provide response in {response_model.__name__} format',
            'input_schema': schema,
        }

        @self._get_retry_decorator()
        def _make_structured_api_call():
            response = self.client.messages.create(
                model=self.model,
                max_tokens=max_tokens,
                temperature=temperature,
                messages=messages,
                tools=[tool],
                tool_choice={'type': 'tool', 'name': tool_name},
            )
            if response.content and len(response.content) > 0:
                for content in response.content:
                    if hasattr(content, 'type') and content.type == 'tool_use':
                        if content.name == tool_name:
                            return response_model.model_validate(content.input)
            raise ValueError("No structured tool response found in Claude's response")

        return _make_structured_api_call()

    async def count_tokens_async(self, text: str) -> int:
        @self._get_retry_decorator()
        async def _make_async_token_call():
            response = await self.async_client.messages.count_tokens(
                model=self.model, messages=[{'role': 'user', 'content': text}]
            )
            return response.input_tokens

        return await _make_async_token_call()

    async def chat_structured_async(
        self, messages: list, response_model: Type[T], max_tokens: int = 4000, temperature: float = 0.1
    ) -> T:
        schema = response_model.model_json_schema()
        tool_name = f'provide_{response_model.__name__.lower()}'
        tool = {
            'name': tool_name,
            'description': f'Provide response in {response_model.__name__} format',
            'input_schema': schema,
        }

        @self._get_retry_decorator()
        async def _make_async_structured_call():
            response = await self.async_client.messages.create(
                model=self.model,
                max_tokens=max_tokens,
                temperature=temperature,
                messages=messages,
                tools=[tool],
                tool_choice={'type': 'tool', 'name': tool_name},
            )
            if response.content and len(response.content) > 0:
                for content in response.content:
                    if hasattr(content, 'type') and content.type == 'tool_use':
                        if content.name == tool_name:
                            return response_model.model_validate(content.input)
            raise ValueError("No structured tool response found in Claude's response")

        return await _make_async_structured_call()
