from .base import BaseVLM
from .qwen import QwenVLVLM
# from .internvl_chat import InternVLVLM
from .internvl_generate import InternVLVLM
from .ovis import OvisVLM
from .ovis_u1 import OvisU1VLM
from .vintern import VinternVLM
from .smolvlm import SmolVLM
from .vila import VilaVLM
from .llava_vision import LLaVAVisionVLM
from .qtunevl_intern_generate import QTuneInternVLVLM
from .qtunevl_qwen_generate import QTuneQwenVLVLM
from .bunny import BunnyVLM
from .gemma3 import Gemma3VLM
from .phi import PhiVisionVLM
from .sail import SailVLVLM
from .molmo import MolmoVLM
from .llava_1_5 import Llava15VLM
from .granite import GraniteVisionVLM
from .minicpmv2 import MiniCPMVLMV2
from .h2ovl import H2OVLVLM
from .llava_next import  LlavaInterleaveVLM
from .ovis_llama import OvisLlamaVLM

# new models
from .varco import VarcoVisionVLM
from .r4b import R4BVLM
from .points import POINTSVLM
from .omchat import OmChatVLM
from .pixtral import PixtralVLM
from .sharegpt4v import ShareGPT4VVLM
from .ristretto import RistrettoVLM
from .minicpm_llama3 import MiniCPMLlama3V25VLM
from .minicpm import MiniCPMVLM

def create_backend(
    model_key: str,
    model,
    tokenizer,
    processor,
    device: str = "cuda",
) -> BaseVLM:
    mk = model_key.lower()

    if any(
        kw in mk
        for kw in [
            "wepoints/points-qwen-2-5-7b-chat",
            "points-qwen-2-5-7b-chat",
            "wepoints/points-yi-1-5-9b-chat",
            "points-yi-1-5-9b-chat",
        ]
    ):
        # Here: `processor` should be the image processor (e.g., CLIPImageProcessor)
        return POINTSVLM(model=model, tokenizer=tokenizer, image_processor=processor, device=device)

    if any(kw in mk for kw in ["pixtral", "mistral-community/pixtral-12b", "mistralai/pixtral"]):
        return PixtralVLM(model=model, tokenizer=tokenizer, processor=processor, device=device)

    if any(kw in mk for kw in ["varco-vision-2.0", "varco-vision-2", "varco-vision"]):
        return VarcoVisionVLM(model=model, processor=processor, device=device)

    if any(kw in mk for kw in ["yannqi/r-4b", "r-4b"]):
        return R4BVLM(model=model, tokenizer=tokenizer, processor=processor, device=device)

    if any(kw in mk for kw in ["omchat", "omlab/omchat"]):
        return OmChatVLM(model=model, tokenizer=tokenizer, processor=processor, device=device)

    if "sharegpt4v-7b-hf" in mk or "gokul-mbzuai" in mk:
        return ShareGPT4VVLM(model=model, tokenizer=tokenizer, processor=processor, device=device)

    if "liautoad/ristretto-3b" in mk or "ristretto-3b" in mk:
        return RistrettoVLM(model=model, tokenizer=tokenizer, processor=processor, device=device)

    if any(kw in mk for kw in ["minicpm-llama3-v-2_5"]):
        return MiniCPMLlama3V25VLM(model=model, tokenizer=tokenizer, processor=processor, device=device)

    if any(kw in mk for kw in ["minicpm"]):
        return MiniCPMVLM(model=model, tokenizer=tokenizer, processor=processor, device=device)

    # ============================================ 分割线 ======================================================

    # InternVL 系列
    if "internvl" in mk:
        return InternVLVLM(model=model, tokenizer=tokenizer, device=device)

    if "vintern" in mk:
        return VinternVLM(model=model, tokenizer=tokenizer, device=device)

    # Ovis 系列
    if "ovis" in mk:
        if "ovis-u1" in mk:
            return OvisU1VLM(model=model, device=device)
        else:
            if "llama" in mk:
                return OvisLlamaVLM(model=model, device=device)
        return OvisVLM(model=model, device=device)

    # Gemma3 系列
    if "gemma-3" in mk:
        return Gemma3VLM(model=model, processor=processor, device=device)

    # Phi Vision 系列
    if any(kw in mk for kw in ["phi-3.5-vision", "phi-3.5-vision-instruct", "phi-4-vision", "phi-3-vision", "phi-4"]):
        return PhiVisionVLM(model=model, processor=processor, device=device)

    # Qwen-VL + llama 系列
    if any(kw in mk for kw in ["qwen2.5-vl", "qwen2-vl", "qwen-vl", "llama-3.2-11b-vision-instruct", "llama-3.2-90b-vision-instruct", "xinyuan"]):
        if "llama" in mk:
            return QwenVLVLM(model=model, tokenizer=tokenizer, processor=processor, device=device, model_type="llama")
        else:
            return QwenVLVLM(model=model, tokenizer=tokenizer, processor=processor, device=device)

    # smolvm 系列
    if "smolvlm" in mk:
        return SmolVLM(model=model, tokenizer=tokenizer, processor=processor, device=device)

    # vila 系列
    if "vila" in mk:
        return  VilaVLM(model=model, device=device)

    # llava-v1.5 系列
    if "llava-v1.5" in mk:
        return Llava15VLM(model=model, processor=processor, device=device)

    # sail 系列
    if "sail" in mk:
        return SailVLVLM(model=model, tokenizer=tokenizer, device=device)

    # molmo 系列
    if "molmo" in mk:
        return MolmoVLM(model=model, processor=processor, device=device)

    # bunny 系列
    if "bunny" in mk:
        return BunnyVLM(model=model, tokenizer=tokenizer, device=device)

    # qtunevl_intern + qtune_qwen 系列
    if "qtunevl" in mk:
        if "2b" in mk:
            return QTuneInternVLVLM(model=model, tokenizer=tokenizer, processor=processor, device=device)
        else:
            if "3b" in mk:
                return QTuneQwenVLVLM(model=model, tokenizer=tokenizer, processor=processor, device=device)

    # granite 系列
    if "granite" in mk:
        return GraniteVisionVLM(model=model, tokenizer=tokenizer, processor=processor, device=device)

    # minicpm 系列（minicpm-v-2）
    if "minicpm" in mk and "2" in mk:
        return MiniCPMVLMV2(model=model, processor=processor, tokenizer=tokenizer, device=device)

    # h2ovl 系列
    if "h2ovl" in mk:
        return H2OVLVLM(model=model, tokenizer=tokenizer, device=device, max_tiles=6)

    # llava-next 系列
    if "llava-interleave" in mk or "llava-next" in mk:
        return LlavaInterleaveVLM(model=model, processor=processor, device=device)

    # llava-onevision 系列
    if "llava-onevision" in mk or "llava-vision" in mk:
        return LLaVAVisionVLM(model=model, tokenizer=tokenizer, processor=processor, device=device)

