import json
import os

import cv2
import numpy as np

from PIL import Image
from tqdm import tqdm, trange
from utils.graphics_utils import focal2fov, fov2focal

from .camera_info import CameraInfo
from .functions import shift_image

from .functions import (
    rotate_camera_around_x_axis,
    rotate_camera_around_y_axis,
    rotate_camera_around_z_axis,
)

def read_cameras_from_transforms_wild_smoke(
    path,
    transforms_file,
    white_background,
    start_time=50,
    duration=50,
    time_step=1,
    max_timestamp=1.0,
    gray_image=False,
    img_offset=False,
    read_image=True,
    *args,
    **kwargs,
):
    cam_infos = []
    print(f"start_time {start_time} duration {duration} time_step {time_step}")

    with open(os.path.join(path, transforms_file)) as json_file:
        contents = json.load(json_file)

    near = float(contents["near"])
    far = float(contents["far"])

    # voxel_scale = np.array(contents["voxel_scale"])
    # voxel_scale = np.broadcast_to(voxel_scale, [3])

    # voxel_matrix = np.array(contents["voxel_matrix"])
    # voxel_matrix = np.stack([voxel_matrix[:, 2], voxel_matrix[:, 1], voxel_matrix[:, 0], voxel_matrix[:, 3]], axis=1)
    # voxel_matrix_inv = np.linalg.inv(voxel_matrix)

    frames = contents["frames"]
    total_frames = duration

    fg_pts = contents.get('fg_pts', None)
    bg_pts = contents.get('bg_pts', None)

    if 'dust3r_points' in contents:
        dust3d_points = contents['dust3d_points']

    camera_uid = 0

    desc_str = "  reading views"
    start_time = 0 ###### lyq
                      
    for idx, frame in tqdm(enumerate(frames), desc=desc_str, total=len(frames), leave=True):
        time_idx = int(frame['frame_idx'] )
        timestamp = time_idx / (total_frames - 1) * max_timestamp

        camera_hw = frame["camera_hw"]
        h, w = camera_hw
        fx, fy, cx, cy = frame["fx"], frame["fy"], frame["cx"], frame["cy"]
        fxr, fyr = focal2fov(fx, w), focal2fov(fy, h)  # convert focal length to fov
        
        # Dust3D 'transform_matrix' is c2w
        c2w_gl = np.array(frame['transform_matrix'])  # 4×4
        c2w_gl[:3, 1:3] *= -1   
        c2w_gl = c2w_gl.astype(np.float32)

        theta_y = np.deg2rad(-15)
        c2w_gl = rotate_camera_around_y_axis(c2w_gl, theta_y)


        w2c = np.linalg.inv(c2w_gl)
        R = np.transpose(w2c[:3, :3])  # R is stored transposed due to 'glm' in CUDA code
        T = w2c[:3, 3]

        # change from OpenGL camera axes (Y up, Z back) to COLMAP (Y down, Z forward)
        # c2w_gl[:3, 1:3] *= -1
        # R_glm = c2w_gl[:3,:3].T           # store transposed
        # C     = c2w_gl[:3,3]
        # T_glm = -R_glm @ C


        focal_length = frame["focal"]
        # cam_name = frame["file_path"].split("/")[-2] # train0x -> x used to determine with train_views
        cam_name = frame["file_path"].split("/")[-2].split("cam")[-1]  # frames_cam00
        image_name = frame["file_path"].split("/")[-1] # lyq for

        

        if read_image:
            frame_name = frame["file_path"]
            image_path = os.path.join(path, frame_name)

            assert os.path.exists(image_path), f"Image path {image_path} does not exist!"

            image = cv2.imread(image_path, cv2.IMREAD_COLOR)
            image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)


        else:
            image_path = ""
            image = np.zeros((h, w, 3), dtype=np.uint8)
            image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)

        image[image < 10] = 0

        image = Image.fromarray(image)

        if gray_image:
            image = image.convert("L")

        pose = 1 if time_idx == start_time else None
        hp_directions = 1 if time_idx == start_time else None

        uid = camera_uid  # idx * duration//time_step + time_idx
        camera_uid += 1


        cam_infos.append(
            CameraInfo(
                uid=uid,
                R=R,
                T=T,
                FovY=fyr,
                FovX=fxr,
                image=image,
                real_image=image,
                image_path=image_path,
                image_name=image_name,
                width=image.size[0],
                height=image.size[1],
                time_idx=time_idx - start_time,
                timestamp=timestamp,
                near=near,
                far=far,
                pose=pose,
                hp_directions=hp_directions,
                cxr=0.0,
                cyr=0.0,
                is_fake_view=False,
                fg_pts=fg_pts,
                bg_pts=bg_pts,
            )
        )

    return cam_infos
