import os,sys
import os.path
import pdb
import numpy as np
import torch
import torch.utils.data
from torchvision import datasets,transforms
from sklearn.utils import shuffle
import urllib.request
from PIL import Image
import pickle

from .utils import *

########################################################################################################################

def get(seed=0, fixed_order=False, pc_valid=0.15, base_dir=None):
    data={}
    taskcla=[]
    size= [32, 32, 3] # [3,32,32]

    idata=np.arange(8)
    if not fixed_order:
        idata=list(shuffle(idata,random_state=seed))
    # print('Task order =',idata)

    if not os.path.isdir(base_dir+'/data/binary_mixture/'):
        os.makedirs(base_dir+'/data/binary_mixture')
        # Pre-load
        for n,idx in enumerate(idata):
            if idx==0:
                # CIFAR10
                mean=[x/255 for x in [125.3,123.0,113.9]]
                std=[x/255 for x in [63.0,62.1,66.7]]
                dat={}
                dat['train']=datasets.CIFAR10(base_dir+'/data/',train=True,download=True) #transform=transforms.Compose([transforms.ToTensor()]),transforms.Normalize(mean,std)
                dat['test']=datasets.CIFAR10(base_dir+'/data/',train=False,download=True) #,transform=transforms.Compose([transforms.ToTensor()]),transforms.Normalize(mean,std)
                data[n]={}
                data[n]['name']='cifar10'
                data[n]['ncla']=10
                for s in ['train','test']:
                    # loader=torch.utils.data.DataLoader(dat[s],batch_size=1,shuffle=False)
                    data[n][s]={'x': [],'y': []}
                    for image,target in dat[s]:
                        data[n][s]['x'].append(np.asarray(image))
                        data[n][s]['y'].append(target)

            elif idx==1:
                # CIFAR100
                mean=[x/255 for x in [125.3,123.0,113.9]]
                std=[x/255 for x in [63.0,62.1,66.7]]
                dat={}
                dat['train']=datasets.CIFAR100(base_dir+'/data/',train=True,download=True) #,transform=transforms.Compose([transforms.ToTensor()]),transforms.Normalize(mean,std)
                dat['test']=datasets.CIFAR100(base_dir+'/data/',train=False,download=True) #,transform=transforms.Compose([transforms.ToTensor()]),transforms.Normalize(mean,std)
                data[n]={}
                data[n]['name']='cifar100'
                data[n]['ncla']=100
                for s in ['train','test']:
                    # loader=torch.utils.data.DataLoader(dat[s],batch_size=1,shuffle=False)
                    data[n][s]={'x': [],'y': []}
                    for image,target in dat[s]:
                        data[n][s]['x'].append(np.asarray(image))
                        data[n][s]['y'].append(target)
                    # for image,target in loader:
                    #     data[n][s]['x'].append(image)
                    #     data[n][s]['y'].append(target.numpy()[0])

            elif idx==2:
                # MNIST
                #mean=(0.1307,) # Mean and std without including the padding
                #std=(0.3081,)
                mean=(0.1,) # Mean and std including the padding
                std=(0.2752,)
                dat={}
                dat['train']=datasets.MNIST(base_dir+'/data/',train=True,download=True,transform=transforms.Compose([
                    transforms.Pad(padding=2,fill=0)])) #,transforms.Normalize(mean,std),transforms.ToTensor()
                dat['test']=datasets.MNIST(base_dir+'/data/',train=False,download=True,transform=transforms.Compose([
                    transforms.Pad(padding=2,fill=0)])) #,transforms.Normalize(mean,std),transforms.ToTensor()
                data[n]={}
                data[n]['name']='mnist'
                data[n]['ncla']=10
                for s in ['train','test']:
                    # loader=torch.utils.data.DataLoader(dat[s],batch_size=1,shuffle=False)
                    data[n][s]={'x': [],'y': []}
                    for image,target in dat[s]:
                        image = np.reshape(np.stack([image,image,image], axis=-1), (32,32,3))
                        # image=image.expand(1,3,image.size(2),image.size(3)) # Create 3 equal channels
                        data[n][s]['x'].append(np.asarray(image))
                        data[n][s]['y'].append(target)
                    # for image,target in loader:
                    #     image=image.expand(1,3,image.size(2),image.size(3)) # Create 3 equal channels
                    #     data[n][s]['x'].append(image)
                    #     data[n][s]['y'].append(target.numpy()[0])

            elif idx == 3:
                # SVHN
                mean=[0.4377,0.4438,0.4728]
                std=[0.198,0.201,0.197]
                dat = {}
                dat['train']=datasets.SVHN(base_dir+'/data/',split='train',download=True) #,transform=transforms.Compose([transforms.ToTensor()]),transforms.Normalize(mean,std)
                dat['test']=datasets.SVHN(base_dir+'/data/',split='test',download=True) #,transform=transforms.Compose([transforms.ToTensor()]),transforms.Normalize(mean,std)
                data[n] = {}
                data[n]['name']='svhn'
                data[n]['ncla']=10
                for s in ['train','test']:
                    # loader = torch.utils.data.DataLoader(dat[s], batch_size=1, shuffle=False)
                    data[n][s] = {'x': [], 'y': []}
                    for image,target in dat[s]:
                        data[n][s]['x'].append(np.asarray(image))
                        data[n][s]['y'].append(target-1)
                    # for image, target in loader:
                    #     data[n][s]['x'].append(image)
                    #     data[n][s]['y'].append(target.numpy()[0]-1)

            elif idx == 4:
                # FashionMNIST
                mean=(0.2190,) # Mean and std including the padding
                std=(0.3318,)
                dat={}
                dat['train']=FashionMNIST(base_dir+'/data/fashion_mnist', train=True, download=True, transform=transforms.Compose([
                    transforms.Pad(padding=2, fill=0)])) #,transforms.Normalize(mean, std), transforms.ToTensor()
                dat['test']=FashionMNIST(base_dir+'/data/fashion_mnist', train=False, download=True, transform=transforms.Compose([
                    transforms.Pad(padding=2, fill=0)])) #,transforms.Normalize(mean, std), transforms.ToTensor()
                data[n]={}
                data[n]['name']='fashion-mnist'
                data[n]['ncla']=10
                for s in ['train','test']:
                    # loader=torch.utils.data.DataLoader(dat[s], batch_size=1, shuffle=False)
                    data[n][s]={'x': [], 'y': []}
                    for image,target in dat[s]:
                        image = np.reshape(np.stack([image,image,image], axis=-1), (32,32,3))
                        # image=image.expand(1, 3, image.size(2), image.size(3))  # Create 3 equal channels
                        data[n][s]['x'].append(np.asarray(image))
                        data[n][s]['y'].append(target)
                    # for image,target in loader:
                    #     image=image.expand(1, 3, image.size(2), image.size(3))  # Create 3 equal channels
                    #     data[n][s]['x'].append(image)
                    #     data[n][s]['y'].append(target.numpy()[0])

            elif idx == 5:
                # Traffic signs
                mean=[0.3398,0.3117,0.3210]
                std=[0.2755,0.2647,0.2712]
                dat={}
                dat['train']=TrafficSigns(base_dir+'/data/traffic_signs', train=True, download=True) #,transforms.Normalize(mean,std), transform=transforms.Compose([transforms.ToTensor()])
                dat['test']=TrafficSigns(base_dir+'/data/traffic_signs', train=False, download=True) #,transforms.Normalize(mean,std), transform=transforms.Compose([transforms.ToTensor()])
                # mean, var = utils.compute_mean_std_dataset(dat['train'])
                data[n]={}
                data[n]['name']='traffic-signs'
                data[n]['ncla']=43
                for s in ['train','test']:
                    # loader = torch.utils.data.DataLoader(dat[s], batch_size=1, shuffle=False)
                    data[n][s] = {'x': [], 'y': []}
                    for image,target in dat[s]:
                        data[n][s]['x'].append(np.asarray(image))
                        data[n][s]['y'].append(target)
                    # for image, target in loader:
                    #     data[n][s]['x'].append(image)
                    #     data[n][s]['y'].append(target.numpy()[0])
            elif idx == 6:
                # Facescrub 100 faces
                mean=[0.5163,0.5569,0.4695]
                std=[0.2307,0.2272,0.2479]
                dat={}
                dat['train']=Facescrub(base_dir+'/data/facescrub', train=True, download=True)#,transforms.Normalize(mean,std), transform=transforms.Compose([transforms.ToTensor()])
                dat['test']=Facescrub(base_dir+'/data/facescrub', train=False, download=True)#,transforms.Normalize(mean,std), transform=transforms.Compose([transforms.ToTensor()])
                #mean, std = utils.compute_mean_std_dataset(dat['train']); print(mean,std); sys.exit()
                data[n]={}
                data[n]['name']='facescrub'
                data[n]['ncla']=100
                for s in ['train','test']:
                    # loader = torch.utils.data.DataLoader(dat[s], batch_size=1, shuffle=False)
                    data[n][s] = {'x': [], 'y': []}
                    for image,target in dat[s]:
                        data[n][s]['x'].append(np.asarray(image))
                        data[n][s]['y'].append(target)
                    # for image, target in loader:
                    #     data[n][s]['x'].append(image)
                    #     data[n][s]['y'].append(target.numpy()[0])
            elif idx == 7:
                # notMNIST A-J letters
                mean=(0.4254,)
                std=(0.4501,)
                dat={}
                dat['train']=notMNIST(base_dir+'/data/notmnist', train=True, download=True) #,transforms.Normalize(mean,std), transform=transforms.Compose([transforms.ToTensor()])
                dat['test']=notMNIST(base_dir+'/data/notmnist', train=False, download=True) #,transforms.Normalize(mean,std), transform=transforms.Compose([transforms.ToTensor()])
                #mean, std = utils.compute_mean_std_dataset(dat['train']); print(mean,std); sys.exit()
                data[n]={}
                data[n]['name']='notmnist'
                data[n]['ncla']=10
                for s in ['train','test']:
                    # loader = torch.utils.data.DataLoader(dat[s], batch_size=1, shuffle=False)
                    data[n][s] = {'x': [], 'y': []}
                    for image,target in dat[s]:
                        image = np.reshape(np.concatenate((image,)*3, axis=-1), (32,32,3))
                        data[n][s]['x'].append(np.asarray(image))
                        data[n][s]['y'].append(target)
                    # for image, target in loader:
                    #     image=image.expand(1,3,image.size(2),image.size(3))
                    #     data[n][s]['x'].append(image)
                    #     data[n][s]['y'].append(target.numpy()[0])
            else:
                print('ERROR: Undefined data set',n)
                sys.exit()
            #print(n,data[n]['name'],data[n]['ncla'],len(data[n]['train']['x']))

            # "Unify" and save
            for s in ['train','test']:
                # data[n][s]['x']=torch.stack(data[n][s]['x']).view(-1,size[0],size[1],size[2])
                # data[n][s]['y']=torch.LongTensor(np.array(data[n][s]['y'],dtype=int)).view(-1)
                # pdb.set_trace()
                # data[n][s]['x'] = np.reshape(data[n][s]['x'], (-1,size[0],size[1],size[2]))
                # data[n][s]['y'] = np.array(data[n][s]['y'], dtype=int)
                torch.save(data[n][s]['x'], os.path.join(os.path.expanduser(base_dir+'/data/binary_mixture'),'data'+str(idx)+s+'x.bin'))
                torch.save(data[n][s]['y'], os.path.join(os.path.expanduser(base_dir+'/data/binary_mixture'),'data'+str(idx)+s+'y.bin'))

    else:

        # Load binary files
        for n,idx in enumerate(idata):
            data[n] = dict.fromkeys(['name','ncla','train','test'])
            if idx==0:
                data[n]['name']='cifar10'
                data[n]['ncla']=10
            elif idx==1:
                data[n]['name']='cifar100'
                data[n]['ncla']=100
            elif idx==2:
                data[n]['name']='mnist'
                data[n]['ncla']=10
            elif idx==3:
                data[n]['name']='svhn'
                data[n]['ncla']=10
            elif idx==4:
                data[n]['name']='fashion-mnist'
                data[n]['ncla']=10
            elif idx==5:
                data[n]['name']='traffic-signs'
                data[n]['ncla']=43
            elif idx==6:
                data[n]['name']='facescrub'
                data[n]['ncla']=100
            elif idx==7:
                data[n]['name']='notmnist'
                data[n]['ncla']=10
            else:
                print('ERROR: Undefined data set',n)
                sys.exit()

            # Load
            for s in ['train','test']:
                data[n][s]={'x':[],'y':[]}
                data[n][s]['x'] = torch.load(os.path.join(os.path.expanduser(base_dir+'/data/binary_mixture'),'data'+str(idx)+s+'x.bin'))
                data[n][s]['y'] = torch.load(os.path.join(os.path.expanduser(base_dir+'/data/binary_mixture'),'data'+str(idx)+s+'y.bin'))

    # Validation
    # for t in data.keys():
    #     r=np.arange(data[t]['train']['x'].size(0))
    #     r=np.array(shuffle(r,random_state=seed),dtype=int)
    #     nvalid=int(pc_valid*len(r))
    #     ivalid=torch.LongTensor(r[:nvalid])
    #     itrain=torch.LongTensor(r[nvalid:])
    #     data[t]['valid']={}
    #     data[t]['valid']['x']=data[t]['train']['x'][ivalid].clone()
    #     data[t]['valid']['y']=data[t]['train']['y'][ivalid].clone()
    #     data[t]['train']['x']=data[t]['train']['x'][itrain].clone()
    #     data[t]['train']['y']=data[t]['train']['y'][itrain].clone()

    # Others
    n=0
    for t in data.keys():
        taskcla.append((t,data[t]['ncla']))
        n+=data[t]['ncla']
    data['ncla']=n

    return data,taskcla,size

########################################################################################################################

class FashionMNIST(datasets.MNIST):
    """`Fashion MNIST <https://github.com/zalandoresearch/fashion-mnist>`_ Dataset.
    """
    urls = [
        'http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-images-idx3-ubyte.gz',
        'http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/train-labels-idx1-ubyte.gz',
        'http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-images-idx3-ubyte.gz',
        'http://fashion-mnist.s3-website.eu-central-1.amazonaws.com/t10k-labels-idx1-ubyte.gz',
    ]

########################################################################################################################

class TrafficSigns(torch.utils.data.Dataset):
    """`German Traffic Signs <http://benchmark.ini.rub.de/?section=gtsrb&subsection=dataset>`_ Dataset.
    Args:
        root (string): Root directory of dataset where directory ``Traffic signs`` exists.
        split (string): One of {'train', 'test'}.
        transform (callable, optional): A function/transform that  takes in an PIL image
            and returns a transformed version. E.g, ``transforms.RandomCrop``
        target_transform (callable, optional): A function/transform that takes in the
            target and transforms it.
        download (bool, optional): If true, downloads the dataset from the internet and puts it in root directory.
            If dataset is already downloaded, it is not downloaded again.
    """

    def __init__(self, root, train=True,transform=None, download=False):
        self.root = os.path.expanduser(root)
        self.transform = transform
        self.filename = "traffic_signs_dataset.zip"
        self.url = "https://d17h27t6h515a5.cloudfront.net/topher/2016/October/580d53ce_traffic-sign-data/traffic-sign-data.zip"
        # Other options for the same 32x32 pickled dataset
        # url="https://d17h27t6h515a5.cloudfront.net/topher/2016/November/581faac4_traffic-signs-data/traffic-signs-data.zip"
        # url_train="https://drive.google.com/open?id=0B5WIzrIVeL0WR1dsTC1FdWEtWFE"
        # url_test="https://drive.google.com/open?id=0B5WIzrIVeL0WLTlPNlR2RG95S3c"

        fpath = os.path.join(root, self.filename)
        if not os.path.isfile(fpath):
            if not download:
               raise RuntimeError('Dataset not found. You can use download=True to download it')
            else:
                print('Downloading from '+self.url)
                self.download()

        training_file = 'lab 2 data/train.p'
        testing_file = 'lab 2 data/test.p'
        if train:
            with open(os.path.join(root,training_file), mode='rb') as f:
                train = pickle.load(f)
            self.data = train['features']
            self.labels = train['labels']
        else:
            with open(os.path.join(root,testing_file), mode='rb') as f:
                test = pickle.load(f)
            self.data = test['features']
            self.labels = test['labels']

        self.data = np.transpose(self.data, (0, 3, 1, 2))
        #print(self.data.shape); sys.exit()

    def __getitem__(self, index):
        """
        Args: index (int): Index
        Returns: tuple: (image, target) where target is index of the target class.
        """
        img, target = self.data[index], self.labels[index]

        # doing this so that it is consistent with all other datasets
        # to return a PIL Image
        img = Image.fromarray(np.transpose(img, (1, 2, 0)))

        if self.transform is not None:
            img = self.transform(img)

        return img, target

    def __len__(self):
        return len(self.data)

    def download(self):
        import errno
        root = os.path.expanduser(self.root)
        fpath = os.path.join(root, self.filename)

        try:
            os.makedirs(root)
        except OSError as e:
            if e.errno == errno.EEXIST:
                pass
            else:
                raise
        urllib.request.urlretrieve(self.url, fpath)
        import zipfile
        zip_ref = zipfile.ZipFile(fpath, 'r')
        zip_ref.extractall(root)
        zip_ref.close()


########################################################################################################################

class Facescrub(torch.utils.data.Dataset):
    """Subset of the Facescrub cropped from the official Megaface challenge page: http://megaface.cs.washington.edu/participate/challenge.html, resized to 38x38
    Args:
        root (string): Root directory of dataset where directory ``Traffic signs`` exists.
        split (string): One of {'train', 'test'}.
        transform (callable, optional): A function/transform that  takes in an PIL image
            and returns a transformed version. E.g, ``transforms.RandomCrop``
        target_transform (callable, optional): A function/transform that takes in the
            target and transforms it.
        download (bool, optional): If true, downloads the dataset from the internet and puts it in root directory.
            If dataset is already downloaded, it is not downloaded again.
    """

    def __init__(self, root, train=True,transform=None, download=False):
        self.root = os.path.expanduser(root)
        self.transform = transform
        self.filename = "facescrub_100.zip"
        self.url = "https://github.com/nkundiushuti/facescrub_subset/blob/master/data/facescrub_100.zip?raw=true"

        fpath=os.path.join(root,self.filename)
        if not os.path.isfile(fpath):
            if not download:
               raise RuntimeError('Dataset not found. You can use download=True to download it')
            else:
                print('Downloading from '+self.url)
                self.download()

        training_file = 'facescrub_train_100.pkl'
        testing_file = 'facescrub_test_100.pkl'
        if train:
            with open(os.path.join(root,training_file),'rb') as f:
                # u = pickle._Unpickler(f)
                # u.encoding = 'latin1'
                # train  = u.load()
                train = pickle.load(f)
            self.data = train['features'].astype(np.uint8)
            self.labels = train['labels'].astype(np.uint8)
            """
            print(self.data.shape)
            print(self.data.mean())
            print(self.data.std())
            print(self.labels.max())
            #"""
        else:
            with open(os.path.join(root,testing_file),'rb') as f:
                # u = pickle._Unpickler(f)
                # u.encoding = 'latin1'
                # test  = u.load()
                test = pickle.load(f)

            self.data = test['features'].astype(np.uint8)
            self.labels = test['labels'].astype(np.uint8)

    def __getitem__(self, index):
        """
        Args: index (int): Index
        Returns: tuple: (image, target) where target is index of the target class.
        """
        img, target = self.data[index], self.labels[index]

        # doing this so that it is consistent with all other datasets
        # to return a PIL Image
        img = Image.fromarray(np.transpose(img, (1, 2, 0)))

        if self.transform is not None:
            img = self.transform(img)

        return img, target

    def __len__(self):
        return len(self.data)

    def download(self):
        import errno
        root = os.path.expanduser(self.root)

        fpath = os.path.join(root, self.filename)

        try:
            os.makedirs(root)
        except OSError as e:
            if e.errno == errno.EEXIST:
                pass
            else:
                raise
        urllib.request.urlretrieve(self.url, fpath)

        import zipfile
        zip_ref = zipfile.ZipFile(fpath, 'r')
        zip_ref.extractall(root)
        zip_ref.close()


########################################################################################################################

class notMNIST(torch.utils.data.Dataset):
    """The notMNIST dataset is a image recognition dataset of font glypyhs for the letters A through J useful with simple neural networks. It is quite similar to the classic MNIST dataset of handwritten digits 0 through 9.
    Args:
        root (string): Root directory of dataset where directory ``Traffic signs`` exists.
        split (string): One of {'train', 'test'}.
        transform (callable, optional): A function/transform that  takes in an PIL image
            and returns a transformed version. E.g, ``transforms.RandomCrop``
        target_transform (callable, optional): A function/transform that takes in the
            target and transforms it.
        download (bool, optional): If true, downloads the dataset from the internet and puts it in root directory.
            If dataset is already downloaded, it is not downloaded again.
    """

    def __init__(self, root, train=True,transform=None, download=False):
        self.root = os.path.expanduser(root)
        self.transform = transform
        self.filename = "notmnist.zip"
        self.url = "https://github.com/nkundiushuti/notmnist_convert/blob/master/notmnist.zip?raw=true"

        fpath = os.path.join(root, self.filename)
        if not os.path.isfile(fpath):
            if not download:
               raise RuntimeError('Dataset not found. You can use download=True to download it')
            else:
                print('Downloading from '+self.url)
                self.download()

        training_file = 'notmnist_train.pkl'
        testing_file = 'notmnist_test.pkl'
        if train:
            with open(os.path.join(root,training_file),'rb') as f:
                # u = pickle._Unpickler(f)
                # u.encoding = 'latin1'
                # train  = u.load()
                train = pickle.load(f)
            self.data = train['features'].astype(np.uint8)
            self.labels = train['labels'].astype(np.uint8)
        else:
            with open(os.path.join(root,testing_file),'rb') as f:
                # u = pickle._Unpickler(f)
                # u.encoding = 'latin1'
                # test  = u.load()
                test = pickle.load(f)

            self.data = test['features'].astype(np.uint8)
            self.labels = test['labels'].astype(np.uint8)


    def __getitem__(self, index):
        """
        Args: index (int): Index
        Returns: tuple: (image, target) where target is index of the target class.
        """
        img, target = self.data[index], self.labels[index]
        # doing this so that it is consistent with all other datasets
        # to return a PIL Image
        img = Image.fromarray(img[0])

        if self.transform is not None:
            img = self.transform(img)

        return img, target

    def __len__(self):
        return len(self.data)

    def download(self):
        import errno
        root = os.path.expanduser(self.root)

        fpath = os.path.join(root, self.filename)

        try:
            os.makedirs(root)
        except OSError as e:
            if e.errno == errno.EEXIST:
                pass
            else:
                raise
        urllib.request.urlretrieve(self.url, fpath)

        import zipfile
        zip_ref = zipfile.ZipFile(fpath, 'r')
        zip_ref.extractall(root)
        zip_ref.close()