import math
from io import BytesIO
from PIL import Image

from qwen_vl_utils.vision_process import (
    to_rgb,
    round_by_factor,
    floor_by_factor,
    ceil_by_factor,
    IMAGE_FACTOR,
    MIN_PIXELS,
    MAX_PIXELS,
    MAX_RATIO,
)


def load_image(image: dict | Image.Image) -> Image.Image:
    if isinstance(image, Image.Image):
        return image.convert("RGB")

    # assert "bytes" in image and "image" not in image
    image = Image.open(BytesIO(image["bytes"]))
    return to_rgb(image)

def create_empty_image(size: tuple[int, int] = (28, 28), mode: str = "RGB") -> Image.Image:
    return Image.new(mode, size, color=0)


def controlled_smart_resize(
    height: int, width: int, factor: int = IMAGE_FACTOR,
    min_pixels: int = MIN_PIXELS, max_pixels: int = MAX_PIXELS,
    max_ratio: float = MAX_RATIO,
) -> tuple[int, int]:
    """
    Rescales the image so that the following conditions are met:

    1. Both dimensions (height and width) are divisible by 'factor'.

    2. The total number of pixels is within the range ['min_pixels', 'max_pixels'].

    3. The aspect ratio of the image is maintained as closely as possible.
    """
    h_bar = max(factor, round_by_factor(height, factor))
    w_bar = max(factor, round_by_factor(width, factor))
    if h_bar * w_bar > max_pixels:
        beta = math.sqrt((height * width) / max_pixels)
        h_bar = floor_by_factor(height / beta, factor)
        w_bar = floor_by_factor(width / beta, factor)
    elif h_bar * w_bar < min_pixels:
        beta = math.sqrt(min_pixels / (height * width))
        h_bar = ceil_by_factor(height * beta, factor)
        w_bar = ceil_by_factor(width * beta, factor)

    ratio = max(h_bar, w_bar) / min(h_bar, w_bar)
    if max_ratio > 0 and ratio > max_ratio:
        if h_bar > w_bar:
            h_bar = floor_by_factor(h_bar / ratio * max_ratio, factor)
        else:
            w_bar = floor_by_factor(w_bar / ratio * max_ratio, factor)

    return h_bar, w_bar
