import os
import requests
import json
from typing import Dict, Any, Optional
import time

class LLMProxyClient:
    def __init__(self):
        """Initialize the LLM proxy client with proxy server details from environment variables."""
        self.proxy_host = os.environ.get('LLM_PROXY_HOST', 'chpclic1')
        self.proxy_port = os.environ.get('LLM_PROXY_PORT', '5000')
        self.proxy_url = f"http://{self.proxy_host}:{self.proxy_port}/llm_proxy"
        
    def make_request(self, 
                    url: str, 
                    headers: Dict[str, str], 
                    payload: Dict[str, Any],
                    max_retries: int = 3,
                    retry_delay: float = 1.0) -> Dict[str, Any]:
        """
        Make an LLM API request through the proxy server.
        
        Args:
            url: The target LLM API URL
            headers: HTTP headers for the request
            payload: The request payload
            max_retries: Maximum number of retry attempts
            retry_delay: Delay between retries in seconds
            
        Returns:
            Dict containing the API response
            
        Raises:
            requests.exceptions.RequestException: If the request fails after all retries
        """
        proxy_payload = {
            'url': url,
            'headers': headers,
            'payload': payload
        }
        
        for attempt in range(max_retries):
            try:
                response = requests.post(
                    self.proxy_url,
                    json=proxy_payload,
                    timeout=30  # 30 second timeout
                )
                response.raise_for_status()
                return response.json()
            except requests.exceptions.RequestException as e:
                if attempt == max_retries - 1:  # Last attempt
                    raise  # Re-raise the last exception
                time.sleep(retry_delay * (attempt + 1))  # Exponential backoff
                
    def chat_completion(self,
                       model: str,
                       messages: list,
                       temperature: float = 1.0,
                       max_tokens: Optional[int] = None) -> Dict[str, Any]:
        """
        Make a chat completion request to the LLM API through the proxy.
        
        Args:
            model: The LLM model to use
            messages: List of message dictionaries
            temperature: Sampling temperature
            max_tokens: Maximum number of tokens to generate
            
        Returns:
            Dict containing the chat completion response
        """
        url = "https://api.openai.com/v1/chat/completions"
        headers = {
            "Content-Type": "application/json",
            "Authorization": f"Bearer {os.environ.get('OPENAI_API_KEY')}"
        }
        
        payload = {
            "model": model,
            "messages": messages,
            "temperature": temperature
        }
        
        if max_tokens is not None:
            payload["max_tokens"] = max_tokens
            
        return self.make_request(url, headers, payload) 