import os
import subprocess
import h5py

import numpy as np
import torch

import torchvision
from torchvision.datasets.utils import download_url
import random
from dl.datasets.base import DisentangledDataset

THIS_PATH = os.path.dirname(__file__)
ROOT_PATH = os.path.abspath(os.path.join(THIS_PATH, '..', '..', '..', '..', '..'))
IMAGE_PATH = os.path.join(ROOT_PATH, 'datasets/disentanglement/mpi3d_toy')

urls = {
    "train":
        "https://storage.googleapis.com/disentanglement_dataset/Final_Dataset/mpi3d_toy.npz",
    "md5":
        "55889cb7c7dfc655d6e0277beee88868",
}
files = {"train": "mpi3d_toy.npz"}
lat_names = ('objCol', 'objShape', 'objSize', 'cameraHeight', 'backCol', 'posX', 'posY')
lat_sizes = np.array([6, 6, 2, 3, 3, 40, 40])
img_size = (3, 64, 64)
# lat_values = {
#     'objCol': np.linspace(0, 5, 6),
#     'objShape': np.linspace(0, 5, 6),
#     'objSize': np.linspace(0, 1, 2),
#     'cameraHeight': np.linspace(0, 2, 3),
#     'backCol': np.linspace(0, 2, 3),
#     'posX': np.linspace(0, 39, 40),
#     'posY': np.linspace(0, 39, 40)
# }


class MPI3D_toy_Semi(DisentangledDataset):
    """MPI3D Dataset as part of the NeurIPS 2019 Disentanglement Challenge.

    A data-set which consists of over one million images of physical 3D objects with seven factors of variation,
    such as object color, shape, size and position.

    Notes
    -----
    - Link : https://storage.googleapis.com/disentanglement_dataset/Final_Dataset/mpi3d_toy.npz
    - hard coded metadata because issue with python 3 loading of python 2

    Parameters
    ----------
    root : string
        Root directory of dataset.

    """

    def __init__(self, root=IMAGE_PATH, transforms_list=[torchvision.transforms.ToTensor()], semi_ratio=0.5):
        super(MPI3D_toy_Semi, self).__init__(root=root, transforms_list=transforms_list)


        self.train_data = os.path.join(root, files["train"])

        if not os.path.isdir(root):
            # self.logger.info("Downloading {} ...".format(str(type(self))))
            self.download()

        data = np.load(self.train_data)
        self.data = data['images']

        latents_classes = []
        # https://github.com/facebookresearch/disentangling-correlated-factors/blob/main/datasets/mpi3d_real.py
        lat_values = {
            "objCol": np.arange(6),
            "objShape": np.arange(6),
            "objSize": np.arange(2),
            "cameraHeight": np.arange(3),
            "backCol": np.arange(3),
            "posX": np.arange(40),
            "posY": np.arange(40),
        }
        for col in lat_values["objCol"]:
            for shp in lat_values["objShape"]:
                for siz in lat_values["objSize"]:
                    for hgt in lat_values["cameraHeight"]:
                        for bck in lat_values["backCol"]:
                            for x in lat_values["posX"]:
                                for y in lat_values["posY"]:
                                    latents_classes.append(
                                        [col, shp, siz, hgt, bck, x, y]
                                    )
        self.latents_classes = np.array(latents_classes)
        self.factor_num = self.latents_classes.shape[-1]
        self.factor_dict = {0: 4, 1: 4, 2: 2, 3: 3, 4: 3, 5: 40, 6: 40}
        assert self.factor_num == 7

        # set semi-supervised learning
        t_total = self.__len__()
        self.semi_idx = np.random.choice(
            t_total, round(t_total * semi_ratio), replace=False
        )

    def download(self):
        """Download the dataset."""
        os.makedirs(self.root)
        # download_url(urls["train"], IMAGE_PATH, files["train"], urls["md5"])
        # subprocess.check_call([
        #     "wget", "-P", IMAGE_PATH, "-O", files["train"],
        #     urls["train"]
        # ])
        subprocess.check_call([
            "curl", "--insecure", "-I","-L",
            urls["train"], "--output", self.train_data
        ])


    def __getitem__(self, idx):
        """Get the image of `idx`
        Return
        ------
        sample : torch.Tensor
            Tensor in [0.,1.] of shape `img_size`.

        lat_value : np.array
            Array of length 6, that gives the value of each factor of variation.
        """
        # ToTensor transforms numpy.ndarray (H x W x C) in the range
        # [0, 255] to a torch.FloatTensor of shape (C x H x W) in the range [0.0, 1.0]
        # return self.transforms(self.data[idx]), torch.Tensor(self.latents_classes[idx])
        data = self.transforms(self.data[idx])
        classes = torch.Tensor(self.latents_classes[idx])
        semi_classes = torch.Tensor(self.latents_classes[idx])
        if idx not in self.semi_idx:
            semi_classes += 9999
        return data, classes, semi_classes

    def factor_to_idx(self, factor):
        base = np.array(
            [6 * 2 * 3 * 3 * 40 * 40, 2 * 3 * 3 * 40 * 40, 3 * 3 * 40 * 40, 3 * 40 * 40, 40 * 40, 40, 1]
        )
        idx = np.dot(factor, base)
        return idx








