from transformers import AutoModel, AutoTokenizer
import sys
sys.path.append("the relative path")
import argparse
import torch
import logging
from PIL import Image
logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(message)s')
import io
class MiniCPM():
    def __init__(self, cfg): 
        super().__init__()
        self.name = "MiniCPM"
        self.device = cfg.device
        self.temperature = cfg.temperature #0
        """Load model and tokenizer."""
        logging.info("Loading model and tokenizer...")
        self.model =AutoModel.from_pretrained(cfg.model_path, trust_remote_code=True, attn_implementation='sdpa', torch_dtype=torch.bfloat16)
        self.model.eval().cuda()
        self.tokenizer = AutoTokenizer.from_pretrained(cfg.model_path, trust_remote_code=True) # , use_fast=False
        self.use_image_token = False
        self.prompt = None  

    def generate_prompt(self, prompt = None):
        
        self.prompt = prompt.replace('<image>',"")
        
        return self.prompt

    def save_temp_image(self, image, image_path):
        image.save(image_path, format="JPEG")
    
    def get_answer(self, image_path):
        if isinstance(image_path, bytes):
            image = Image.open(io.BytesIO(image_path)).convert("RGB")
        else:
            image = Image.open(image_path).convert("RGB")
            # temp_image_path = image_path
            
        with torch.no_grad():   
            print(self.prompt)         
            messages = [
                {"role": 'user','content': [image, self.prompt]},
            ]

            res = self.model.chat(
                image=None,
                msgs=messages,
                tokenizer=self.tokenizer
            )

        return res, 1, 2

