import os
import sys
import base64
import binascii
from dotenv import load_dotenv

import json, inspect
from typing import Callable, Any, Dict, List

# ── Third-party SDKs ───────────────────────────────────────────────────────────
from openai import OpenAI                       # OpenAI-compatible endpoint
from anthropic import Anthropic                 # Claude / Anthropic endpoint

# ── Local project setup ────────────────────────────────────────────────────────
load_dotenv()
project_root = os.path.abspath(os.path.dirname(os.path.dirname(__file__)))
sys.path.insert(0, project_root)

# ── API clients ────────────────────────────────────────────────────────────────
openai_client = OpenAI(
    api_key=os.environ["OPENAILIKE_VLM_API_KEY"],
    base_url=os.environ["OPENAILIKE_VLM_BASE_URL"],
)

anthropic_client = Anthropic(
    api_key=os.environ["ANTHROPIC_VLM_API_KEY"],
    base_url=os.environ["ANTHROPIC_VLM_BASE_URL"],
)

def _build_numbered_clients(
    sdk_cls,
    key_prefix: str,
    url_prefix: str,
):
    """
    Collect sequentially-numbered <PREFIX>_API_KEY{n} / <PREFIX>_BASE_URL{n}
    pairs found in os.environ and return a list
    """
    clients = []          # slot 0 = the default, for convenience

    idx = 0
    while True:
        key_var  = f"{key_prefix}{idx}"
        url_var  = f"{url_prefix}{idx}"

        if key_var not in os.environ or url_var not in os.environ:
            break                       # stop at the first gap

        api_key   = os.environ[key_var]
        base_url  = os.environ[url_var]  # fall-back

        clients.append(
            sdk_cls(api_key=api_key, base_url=base_url)
        )
        idx += 1

    return clients


openai_clients = _build_numbered_clients(
    sdk_cls=OpenAI,
    key_prefix="OPENAILIKE_API_KEY",
    url_prefix="OPENAILIKE_BASE_URL",
)

anthropic_clients = _build_numbered_clients(
    sdk_cls=Anthropic,
    key_prefix="ANTHROPIC_API_KEY",
    url_prefix="ANTHROPIC_BASE_URL",
)

# ── Helper: light-weight MIME sniffing ─────────────────────────────────────────
def _detect_media_type(b64: str, fallback: str = "image/jpeg") -> str:
    """
    Inspect the first bytes of a Base-64 image and deduce its MIME type.
    Defaults to `fallback` if unknown.
    """
    try:
        hdr = base64.b64decode(b64[:64], validate=False)  # only a few bytes
    except binascii.Error:
        return fallback

    if hdr.startswith(b"\xFF\xD8\xFF"):               # JPEG SOI
        return "image/jpeg"
    if hdr.startswith(b"\x89PNG\r\n\x1A\n"):          # PNG signature
        return "image/png"
    if hdr.startswith(b"GIF87a") or hdr.startswith(b"GIF89a"):
        return "image/gif"
    if hdr[0:4] == b"RIFF" and hdr[8:12] == b"WEBP":  # WebP
        return "image/webp"
    return fallback

# ── Helper: OpenAI → Anthropic message conversion ─────────────────────────────
def _convert_to_anthropic(messages: list[dict]) -> tuple[str | None, list[dict]]:
    """
    Transform OpenAI-style messages (including image_url blocks)
    into Anthropic v1 format.
    """
    converted: list[dict] = []
    system_text: str | None = None

    for msg in messages:
        role = msg["role"]

        # System prompt is passed separately.
        if role == "system":
            system_text = msg["content"]
            continue

        new_msg: dict = {"role": role, "content": []}

        # 1️⃣ Pure-text message
        if isinstance(msg["content"], str):
            new_msg["content"].append({"type": "text", "text": msg["content"]})
            converted.append(new_msg)
            continue

        # 2️⃣ Mixed content list (text + images)
        for block in msg["content"]:
            if block["type"] == "text":
                new_msg["content"].append({"type": "text", "text": block["text"]})

            elif block["type"] == "image_url":
                url = block["image_url"]["url"]        # data:image/xyz;base64,…
                media_prefix, b64_data = url.split(";base64,", maxsplit=1)

                # Prefer real signature over the prefix (fixes 400 error)
                media_type = _detect_media_type(b64_data, fallback=media_prefix.replace("data:", ""))

                new_msg["content"].append(
                    {
                        "type": "image",
                        "source": {
                            "type": "base64",
                            "media_type": media_type,
                            "data": b64_data,
                        },
                    }
                )

        converted.append(new_msg)

    return system_text, converted

# ── Unified generation function ────────────────────────────────────────────────
def vlm_generation(messages: list[dict], model: str, index: int | None = None, **kwargs) -> str:
    """
    Route the request to Anthropic or OpenAI depending on `model`.
    """
    is_anthropic = any(tag in model.lower() for tag in ("anthropic", "claude"))

    if is_anthropic:
        system_text, claude_msgs = _convert_to_anthropic(messages)

        if index is None:
            response = anthropic_client.messages.create(
                model=model,
                system=system_text,
                messages=claude_msgs,
                max_tokens=kwargs.pop("max_tokens", 4096),   # Anthropic requires it
                **kwargs,
            )
        else:
            response = anthropic_clients[index].messages.create(
                model=model,
                system=system_text,
                messages=claude_msgs,
                max_tokens=kwargs.pop("max_tokens", 4096),   # Anthropic requires it
                **kwargs,
            )
        # Claude replies with a list of content blocks; first is always text.
        return response.content[0].text

    # ── OpenAI-compatible call ────────────────────────────────────────────────
    if index is None:
        chat_response = openai_client.chat.completions.create(
            model=model,
            messages=messages,
            **kwargs,
        )
    else:
        chat_response = openai_clients[index].chat.completions.create(
            model=model,
            messages=messages,
            **kwargs,
        )
    return chat_response.choices[0].message.content

if __name__ == "__main__":
    # Example usage (for testing purposes)
    example_messages = [
        {"role": "system", "content": "You are a helpful assistant."},
        {"role": "user", "content": "What is the capital of France?"},
    ]
    print(vlm_generation(example_messages, model="Qwen3-VL-30B-A3B-Instruct"))