# backends/gemini_backend.py

import os
from google import genai
from google.genai import types
from .base_backend import BaseBackend
from .throttle import global_throttle

class GeminiBackend(BaseBackend):
    """
    Gemini API backend using google.genai v2 SDK (Gemini 2.5).
    Defaults to gemini-2.5-flash-lite.
    """

    def __init__(self,
                 model_name: str = "gemini-2.5-flash-lite",
                 temperature: float = 0.7,
                 max_tokens: int = 1024,
                 system_instruction: str = None,
                 api_key: str = None,
                 token_tracker=None,
                 **kwargs):

        self.api_key = api_key or os.getenv("GEMINI_API_KEY")
        if not self.api_key:
            raise ValueError("Missing Gemini API key. Set `GEMINI_API_KEY` or pass `api_key`.")

        # Create client
        self.client = genai.Client(api_key=self.api_key)
        self.model_name = model_name
        self.temperature = temperature
        self.max_tokens = max_tokens
        self.system_instruction = system_instruction
        self.token_tracker = token_tracker

    def chat(self, system: str, user: str, agent_id: str = None, return_usage: bool = False) -> str | dict:
        # Build combined system + user if system provided here; 
        # or use system_instruction from initializer
        # Choosing to prefer explicit `self.system_instruction` first, then passed `system`
        sys_instr = self.system_instruction or system

        full_prompt = user  # contents in docs is just the user input

        # Build config if needed
        config_kwargs = {}
        if self.temperature is not None:
            config_kwargs["temperature"] = self.temperature
        if self.max_tokens is not None:
            config_kwargs["max_output_tokens"] = self.max_tokens
        if sys_instr is not None:
            config_kwargs["system_instruction"] = sys_instr

        # Use types.GenerateContentConfig if any config options are set
        config = None
        if config_kwargs:
            config = types.GenerateContentConfig(**config_kwargs)

        # Call generate_content
        global_throttle()
        if config is not None:
            response = self.client.models.generate_content(
                model=self.model_name,
                contents=full_prompt,
                config=config
            )
        else:
            response = self.client.models.generate_content(
                model=self.model_name,
                contents=full_prompt
            )

        # Token usage logging
        meta = response.usage_metadata
        input_tokens = getattr(meta, "prompt_token_count", 0)
        output_tokens = getattr(meta, "candidates_token_count", 0)

        if self.token_tracker:
            self.token_tracker.log(
                agent_id=agent_id or "unknown",
                input_tokens=input_tokens,
                output_tokens=output_tokens,
                cached_input_tokens=0  # Gemini does not expose this
            )
    
        # Prepare return values
        answer_text = response.text.strip()

        if return_usage:
            return {
                "answer_text": answer_text,
                "usage": {
                    "input_tokens": input_tokens,
                    "output_tokens": output_tokens,
                    "cached_input_tokens": 0,
                    "total_tokens": input_tokens + output_tokens
                }
            }

        return answer_text