from dataclasses import dataclass, field

import numpy as np
import torch

import threestudio
from threestudio.systems.base import BaseLift3DSystem
from threestudio.utils.typing import *


@threestudio.register("sjc-system")
class ScoreJacobianChaining(BaseLift3DSystem):
    """Lift-3D system registered under the name ``"sjc-system"``.

    Training renders a batch with ``self.renderer``, passes ``comp_rgb`` to the
    guidance module with ``rgb_as_latents=True`` and adds an emptiness loss on
    the rendering weights plus an optional centre-vs-border depth loss.
    Testing decodes ``comp_rgb`` through ``self.guidance.decode_latents`` and
    collects the resulting frames in ``self.output_rgb``.
    """

    @dataclass
    class Config(BaseLift3DSystem.Config):
        # Selects the latent size handed to ``decode_latents`` in ``forward``:
        # 128x128 when True, 64x64 when False.
        subpixel_rendering: bool = True

    cfg: Config

    def configure(self):
        """Run the base configuration and instantiate the guidance module."""
        # create geometry, material, background, renderer
        super().configure()
        self.guidance = threestudio.find(self.cfg.guidance_type)(self.cfg.guidance)

    def forward(self, batch: Dict[str, Any], decode: bool = False) -> Dict[str, Any]:
        """Render ``batch`` and optionally decode the rendered map.

        Args:
            batch: Keyword arguments forwarded verbatim to ``self.renderer``.
            decode: When True, ``comp_rgb`` is additionally passed through
                ``self.guidance.decode_latents`` and stored as ``decoded_rgb``.

        Returns:
            A copy of the renderer output dict, plus ``decoded_rgb`` when
            ``decode`` is set.
        """
        render_out = self.renderer(**batch)
        out = {
            **render_out,
        }
        if decode:
            if self.cfg.subpixel_rendering:
                latent_height, latent_width = 128, 128
            else:
                latent_height, latent_width = 64, 64
            # The decoder is fed channels-first; the result is moved back to
            # channels-last to match the layout of ``comp_rgb``.
            out["decoded_rgb"] = self.guidance.decode_latents(
                out["comp_rgb"].permute(0, 3, 1, 2),
                latent_height=latent_height,
                latent_width=latent_width,
            ).permute(0, 2, 3, 1)
        return out

    def on_fit_start(self) -> None:
        """Reset the collected test frames and build the prompt processor."""
        super().on_fit_start()
        self.output_rgb = []
        # only used in training
        self.prompt_processor = threestudio.find(self.cfg.prompt_processor_type)(
            self.cfg.prompt_processor
        )

    def on_test_start(self) -> None:
        """Make sure everything ``test_step`` relies on exists."""
        # check if guidance is initialized, such as when loading from checkpoint
        if not hasattr(self, "guidance"):
            self.guidance = threestudio.find(self.cfg.guidance_type)(self.cfg.guidance)
        # ``output_rgb`` is otherwise only created in ``on_fit_start``; a
        # test-only run would fail on the first ``append`` in ``test_step``.
        if not hasattr(self, "output_rgb"):
            self.output_rgb = []

    def training_step(self, batch, batch_idx):
        """Compute the total training loss for one batch.

        The total is the sum of every ``loss_*`` entry returned by the guidance
        module (each scaled by the matching ``lambda_*`` entry of
        ``cfg.loss``), the emptiness loss, and, when ``lambda_depth`` is
        positive, the depth loss.

        Returns:
            ``{"loss": loss}``.
        """
        out = self(batch)
        prompt_utils = self.prompt_processor()
        guidance_out = self.guidance(
            out["comp_rgb"], prompt_utils, **batch, rgb_as_latents=True
        )

        loss = 0.0

        for name, value in guidance_out.items():
            self.log(f"train/{name}", value)
            if name.startswith("loss_"):
                loss += value * self.C(self.cfg.loss[name.replace("loss_", "lambda_")])

        # Mean of log(1 + emptiness_scale * weights), scaled by lambda_emptiness.
        loss_emptiness = (
            self.C(self.cfg.loss.lambda_emptiness)
            * torch.log(1 + self.cfg.loss.emptiness_scale * out["weights"]).mean()
        )

        self.log("train/loss_emptiness", loss_emptiness)
        loss += loss_emptiness

        # About the depth loss, see https://github.com/pals-ttic/sjc/issues/21
        if self.C(self.cfg.loss.lambda_depth) > 0:
            _, h, w, _ = out["comp_rgb"].shape
            # Pixels with zero opacity get an extra depth of 10.
            comp_depth = (out["depth"] + 10 * (1 - out["opacity"])).squeeze(-1)
            center_h = int(self.cfg.loss.center_ratio * h)
            center_w = int(self.cfg.loss.center_ratio * w)
            border_h = (h - center_h) // 2
            # The horizontal margin must come from the width; deriving it from
            # the height misplaces the crop on non-square renders.
            border_w = (w - center_w) // 2
            center_depth = comp_depth[
                ..., border_h : border_h + center_h, border_w : border_w + center_w
            ]
            center_depth_mean = center_depth.mean()
            # NOTE(review): the denominator is a per-image pixel count while the
            # sums run over the whole tensor -- presumably batch size 1; confirm.
            border_depth_mean = (comp_depth.sum() - center_depth.sum()) / (
                h * w - center_h * center_w
            )
            log_input = center_depth_mean - border_depth_mean + 1e-12
            # NOTE(review): torch.log yields NaN for a negative ``log_input``,
            # so the sign factor cannot rescue that case -- confirm against the
            # issue linked above whether this is intended.
            loss_depth = (
                torch.sign(log_input)
                * torch.log(log_input)
                * self.C(self.cfg.loss.lambda_depth)
            )

            self.log("train/loss_depth", loss_depth)
            loss += loss_depth

        # Log the current value of every configured loss parameter.
        for name, value in self.cfg.loss.items():
            self.log(f"train_params/{name}", self.C(value))

        return {"loss": loss}

    def vis_depth(self, pred_depth):
        """Return ``log(1 + depth) / log(11)`` of ``pred_depth`` as a NumPy array.

        The tensor is detached and moved to the CPU first; a depth of 10 maps
        to (approximately) 1.
        """
        depth = pred_depth.detach().cpu().numpy()
        depth = np.log(1.0 + depth + 1e-12) / np.log(1 + 10.0)
        return depth

    def validation_step(self, batch, batch_idx):
        """Do nothing; the image-grid export below is currently disabled."""
        # out = self(batch, decode=True)
        # comp_depth = out["depth"] + 10 * (1 - out["opacity"])  # 10 for background
        # vis_depth = self.vis_depth(comp_depth.squeeze(-1))

        # self.save_image_grid(
        #     f"it{self.true_global_step}-{batch['index'][0]}.png",
        #     [
        #         {
        #             "type": "rgb",
        #             "img": out["decoded_rgb"][0],
        #             "kwargs": {"data_format": "HWC"},
        #         },
        #     ]
        #     + (
        #         [
        #             {
        #                 "type": "rgb",
        #                 "img": out["comp_normal"][0],
        #                 "kwargs": {"data_format": "HWC", "data_range": (0, 1)},
        #             }
        #         ]
        #         if "comp_normal" in out
        #         else []
        #     )
        #     + [
        #         {
        #             "type": "grayscale",
        #             "img": out["opacity"][0, :, :, 0],
        #             "kwargs": {"cmap": None, "data_range": (0, 1)},
        #         },
        #     ]
        #     + [
        #         {
        #             "type": "grayscale",
        #             "img": vis_depth[0],
        #             "kwargs": {"cmap": "spectral", "data_range": (0, 1)},
        #         },
        #     ],
        #     align=512,
        #     name="validation_step",
        #     step=self.true_global_step,
        # )
        pass

    def on_validation_epoch_end(self):
        """Do nothing at the end of a validation epoch."""
        pass

    def test_step(self, batch, batch_idx):
        """Decode the first image of the batch and append it to ``self.output_rgb``."""
        out = self(batch, decode=True)
        rgb_img = self.get_rgb_image_(
            out["decoded_rgb"][0],
            "HWC",
            (0, 1),
        )
        self.output_rgb.append(rgb_img)
        # self.save_image_grid(
        #     f"it{self.true_global_step}-test/{batch['index'][0]}.png",
        #     [
        #         {
        #             "type": "rgb",
        #             "img": out["decoded_rgb"][0],
        #             "kwargs": {"data_format": "HWC"},
        #         },
        #     ]
        #     + (
        #         [
        #             {
        #                 "type": "rgb",
        #                 "img": out["comp_normal"][0],
        #                 "kwargs": {"data_format": "HWC", "data_range": (0, 1)},
        #             }
        #         ]
        #         if "comp_normal" in out
        #         else []
        #     )
        #     + [
        #         {
        #             "type": "grayscale",
        #             "img": out["opacity"][0, :, :, 0],
        #             "kwargs": {"cmap": None, "data_range": (0, 1)},
        #         },
        #     ],
        #     align=512,
        #     name="test_step",
        #     step=self.true_global_step,
        # )

    def on_test_epoch_end(self):
        """Do nothing; the video export below is currently disabled."""
        # self.save_img_sequence(
        #     f"it{self.true_global_step}-test",
        #     f"it{self.true_global_step}-test",
        #     "(\d+)\.png",
        #     save_format="mp4",
        #     fps=30,
        #     name="test",
        #     step=self.true_global_step,
        # )
        pass

    # def result_imgs(self):
    #     return self.get_img_sequence(
    #         f"it{self.true_global_step}-test",
    #         "(\d+)\.png"
    #     )