import json
import os
import random
import time

import litellm

_PRINTED_MODEL_DEBUG = set()


def get_llm_output(
    message,
    model="gpt-4o",
    max_new_tokens=4096,
    temperature=0,
    json_object=False,
    system_prompt=None,
    **generation_kwargs
):
    """
    Use litellm to complete a prompt using the specified model.

    Args:
        message (str or list): The input message or a list of message dicts.
        model (str): The model to use for completion.
        max_new_tokens (int): Maximum number of tokens to generate.
        temperature (float): Sampling temperature.
        json_object (bool): Whether to output in JSON format.
        system_prompt (str): Optional system prompt.

    Returns:
        str: The completed text generated by the model.
    """
    # Convert message to litellm-compatible format if needed
    if isinstance(message, str):
        messages = [{"role": "user", "content": message}]
        if system_prompt:
            messages.insert(0, {"role": "system", "content": system_prompt})
    else:
        messages = message

    debug_llm = (os.getenv("TEXTRESNET_DEBUG_LLM") or "").strip().lower() in {"1", "true", "yes"}
    orig_model = model
    route_note = ""

    # Auto-route to OpenRouter if user provided OPENROUTER_API_KEY.
    #
    # Behavior:
    # - If model already starts with "openrouter/", keep as-is.
    # - If OPENROUTER_API_KEY is set and (OPENAI_API_KEY is NOT set OR TEXTRESNET_USE_OPENROUTER=1),
    #   rewrite common model strings to OpenRouter-compatible IDs.
    #
    # Examples:
    # - "openai/gpt-4o-mini" -> "openrouter/openai/gpt-4o-mini"
    # - "gpt-4o" -> "openrouter/openai/gpt-4o"
    # - "claude-3-haiku-20240307" -> "openrouter/anthropic/claude-3-haiku-20240307"
    if isinstance(model, str) and not model.startswith("openrouter/"):
        has_openrouter_key = bool(os.getenv("OPENROUTER_API_KEY"))
        force_openrouter = (os.getenv("TEXTRESNET_USE_OPENROUTER") or "").strip().lower() in {"1", "true", "yes"}
        has_openai_key = bool(os.getenv("OPENAI_API_KEY"))
        if has_openrouter_key and (force_openrouter or not has_openai_key):
            if model.startswith(("openai/", "anthropic/", "meta-llama/", "google/", "mistralai/", "qwen/")):
                model = f"openrouter/{model}"
                route_note = "auto_route(openrouter_key=1): openrouter/{provider_model}"
            elif model.startswith("gpt-"):
                model = f"openrouter/openai/{model}"
                route_note = "auto_route(openrouter_key=1): openrouter/openai/{gpt-*}"
            elif model.startswith("claude-"):
                model = f"openrouter/anthropic/{model}"
                route_note = "auto_route(openrouter_key=1): openrouter/anthropic/{claude-*}"
        elif has_openrouter_key and has_openai_key and not force_openrouter:
            route_note = (
                "auto_route_skipped: OPENAI_API_KEY present; set TEXTRESNET_USE_OPENROUTER=1 to force"
            )

    # Optional model prefix helper (useful for OpenRouter without changing configs).
    # Example:
    #   export TEXTRESNET_LITELLM_MODEL_PREFIX=openrouter
    #   model="gpt-4o" -> "openrouter/gpt-4o"
    #   model="openai/gpt-4o-mini" -> "openrouter/openai/gpt-4o-mini"
    if isinstance(model, str):
        prefix = os.getenv("TEXTRESNET_LITELLM_MODEL_PREFIX") or os.getenv("TEXTRESNET_MODEL_PREFIX")
        if prefix:
            prefix = prefix.strip()
            if prefix and not model.startswith(prefix.rstrip("/") + "/") and not model.startswith("openrouter/"):
                model = f"{prefix.rstrip('/')}/{model.lstrip('/')}"
                if not route_note:
                    route_note = f"prefix({prefix.rstrip('/')})"

    # Debug print (once per resolved model per process)
    if debug_llm:
        key = (str(orig_model), str(model), route_note)
        if key not in _PRINTED_MODEL_DEBUG:
            _PRINTED_MODEL_DEBUG.add(key)
            print(
                "[TEXTRESNET_LLM_DEBUG] "
                f"orig_model={orig_model!r} -> resolved_model={model!r} "
                f"route={route_note or 'none'} "
                f"OPENROUTER_API_KEY={'1' if os.getenv('OPENROUTER_API_KEY') else '0'} "
                f"OPENAI_API_KEY={'1' if os.getenv('OPENAI_API_KEY') else '0'} "
                f"TEXTRESNET_USE_OPENROUTER={os.getenv('TEXTRESNET_USE_OPENROUTER')!r}"
            )

    kwargs = {
        "model": model,
        "messages": messages,
        "max_tokens": max_new_tokens,
        "temperature": temperature,
    }
    kwargs.update(generation_kwargs)

    if json_object:
        kwargs["response_format"] = {"type": "json_object"}

    # Timeout + retries (helps with transient network/proxy errors like:
    # "peer closed connection without sending complete message body (incomplete chunked read)")
    def _env_int(name: str, default: int) -> int:
        try:
            return int(os.getenv(name, default))
        except Exception:
            return default

    def _env_float(name: str, default: float) -> float:
        try:
            return float(os.getenv(name, default))
        except Exception:
            return default

    max_retries = _env_int("TEXTRESNET_LLM_MAX_RETRIES", 3)
    base_sleep = _env_float("TEXTRESNET_LLM_RETRY_BASE_SECONDS", 1.0)
    timeout_s = _env_float("TEXTRESNET_LLM_TIMEOUT_SECONDS", 120.0)

    if "timeout" not in kwargs and "request_timeout" not in kwargs:
        kwargs["timeout"] = timeout_s

    # Provider defaults (kept minimal on purpose)
    # - OpenRouter: requires model="openrouter/..." and OPENROUTER_API_KEY
    if isinstance(model, str) and model.startswith("openrouter/"):
        if "api_key" not in kwargs:
            # Prefer OpenRouter key; fall back to OPENAI_API_KEY if user reuses it.
            kwargs["api_key"] = os.getenv("OPENROUTER_API_KEY") or os.getenv("OPENAI_API_KEY")

        if "api_base" not in kwargs and os.getenv("OPENROUTER_API_BASE"):
            kwargs["api_base"] = os.getenv("OPENROUTER_API_BASE")

        # Optional OpenRouter attribution headers (recommended by OpenRouter)
        extra_headers = kwargs.get("extra_headers") or {}
        http_referer = os.getenv("OPENROUTER_HTTP_REFERER") or os.getenv("OPENROUTER_SITE_URL")
        x_title = os.getenv("OPENROUTER_X_TITLE") or os.getenv("OPENROUTER_APP_NAME")
        if http_referer and "HTTP-Referer" not in extra_headers:
            extra_headers["HTTP-Referer"] = http_referer
        if x_title and "X-Title" not in extra_headers:
            extra_headers["X-Title"] = x_title
        if extra_headers:
            kwargs["extra_headers"] = extra_headers

    # Call litellm (with a small compatibility fallback for providers that don't
    # support OpenAI's response_format)
    def _is_transient_error(e: Exception) -> bool:
        msg = (str(e) or "").lower()
        name = type(e).__name__.lower()
        transient_markers = [
            "incomplete chunked read",
            "peer closed connection",
            "remoteprotocolerror",
            "connection reset",
            "connection aborted",
            "timed out",
            "timeout",
            "temporarily unavailable",
            "502",
            "503",
            "504",
            "rate limit",
        ]
        if any(m in msg for m in transient_markers):
            return True
        if "openrouter" in name or "apierror" in name:
            # litellm often wraps transport errors as APIError/OpenrouterException
            return True
        return False

    last_err: Exception | None = None
    for attempt in range(max(1, max_retries) + 1):
        try:
            try:
                response = litellm.completion(**kwargs)
            except Exception as e:
                if json_object and "response_format" in kwargs:
                    retry_kwargs = dict(kwargs)
                    retry_kwargs.pop("response_format", None)
                    response = litellm.completion(**retry_kwargs)
                else:
                    raise e
            last_err = None
            break
        except Exception as e:
            last_err = e
            if attempt >= max_retries or not _is_transient_error(e):
                raise
            # exponential backoff with jitter
            sleep_s = min(30.0, base_sleep * (2 ** max(0, attempt - 1)))
            sleep_s = sleep_s * (0.8 + 0.4 * random.random())
            if debug_llm:
                print(
                    "[TEXTRESNET_LLM_DEBUG] "
                    f"retry={attempt}/{max_retries} sleep={sleep_s:.2f}s "
                    f"err={type(e).__name__}: {str(e)[:200]}"
                )
            time.sleep(sleep_s)

    if last_err is not None:
        raise last_err

    # litellm returns an object similar to OpenAI
    content = response.choices[0].message.content
    if json_object:
        try:
            return json.loads(content)
        except Exception as e:
            raise ValueError(f"Model did not return valid JSON. Raw content: {content[:500]}") from e
    else:
        return content
