from torchvision import datasets
from torch.utils.data import Subset
import numpy as np
from .builder import DATASETS
from .base_dataset import BaseDataset
from torchvision.transforms import transforms
from query_strategies.utils import UnNormalize
import random


@DATASETS.register_module()
class imagenet(BaseDataset):
    """ImageNet dataset wrapper built on ``torchvision.datasets.ImageNet``.

    ``load_data`` fills ``self.DATA_INFOS`` with one record per image for the
    ``'train_full'``, ``'val'`` and ``'test'`` keys. Each record is a dict with
    the keys ``'no'`` (sample number), ``'img'`` (image path) and
    ``'gt_label'`` (class index). The ``'val'`` and ``'test'`` records are
    both read from the torchvision ``'val'`` split.
    """

    def __init__(self,
                 data_path=None,
                 initial_size=None):
        # The raw torchvision datasets are populated later by load_data().
        self.raw_tr = self.raw_vl = self.raw_te = None
        super(imagenet, self).__init__(data_path, initial_size)

    def load_data(self):
        """Load the raw ImageNet splits and build the per-sample records.

        Falls back to ``'../data/imagenet'`` when ``self.DATA_PATH`` is None.
        Sets ``raw_tr``/``raw_vl``/``raw_te``, the three ``DATA_INFOS``
        entries, ``num_samples`` (train + test count), ``INDEX_LB`` (an
        all-False boolean mask with one slot per training sample) and
        ``CLASSES``.
        """
        if self.DATA_PATH is None:
            self.DATA_PATH = '../data/imagenet'
        root = self.DATA_PATH

        def build_records(raw, number_of):
            # One record per target; the image path is the first field of the
            # matching entry in ``raw.imgs``.
            entries = raw.imgs
            return [{'no': number_of(pos), 'img': entries[pos][0], 'gt_label': label}
                    for pos, label in enumerate(raw.targets)]

        self.raw_tr = datasets.ImageNet(root, split='train', download=False)
        self.raw_vl = datasets.ImageNet(root, split='val', download=False)
        self.raw_te = datasets.ImageNet(root, split='val', download=False)

        train_count = len(self.raw_tr.targets)
        test_count = len(self.raw_te.targets)

        self.DATA_INFOS['train_full'] = build_records(self.raw_tr, lambda pos: pos)
        self.DATA_INFOS['val'] = build_records(self.raw_vl, lambda pos: pos)
        # Test samples are numbered -1, -2, ... instead of 0, 1, ...
        self.DATA_INFOS['test'] = build_records(self.raw_te, lambda pos: -(pos + 1))

        self.num_samples = train_count + test_count
        self.INDEX_LB = np.zeros(train_count, dtype=bool)
        self.CLASSES = self.raw_tr.classes

    def prepare_data(self, idx, split, transform=None, aug_transform=None):
        """Return ``(x, y, no, idx)`` for the record at ``idx`` of ``split``.

        For the ``'distill'`` split ``x`` is the stored image path, untouched.
        For every other split the image is loaded, passed through
        ``aug_transform`` when one is given, and then through ``transform``
        (or ``self.TRANSFORM[split]`` when ``transform`` is None).
        """
        record = self.DATA_INFOS[split][idx]
        sample, label = record['img'], record['gt_label']
        if split == 'distill':
            # Hand back the path itself; nothing is loaded or transformed.
            pass
        else:
            sample = self.raw_tr.loader(sample)
            if aug_transform is not None:
                sample = aug_transform(sample)
            pipeline = self.TRANSFORM[split] if transform is None else transform
            sample = pipeline(sample)
        return sample, label, record['no'], idx

    @property
    def default_train_transform(self):
        """Training pipeline: random resized crop (224), flip, tensor, normalize."""
        normalize = transforms.Normalize(mean=[0.485, 0.456, 0.406],
                                         std=[0.229, 0.224, 0.225])
        steps = [
            transforms.RandomResizedCrop(size=224),
            transforms.RandomHorizontalFlip(),
            transforms.ToTensor(),
            normalize,
        ]
        return transforms.Compose(steps)

    @property
    def default_val_transform(self):
        """Evaluation pipeline: resize (256), center crop (224), tensor, normalize."""
        normalize = transforms.Normalize(mean=[0.485, 0.456, 0.406],
                                         std=[0.229, 0.224, 0.225])
        steps = [
            transforms.Resize(size=256),
            transforms.CenterCrop(size=224),
            transforms.ToTensor(),
            normalize,
        ]
        return transforms.Compose(steps)

    @property
    def inverse_transform(self):
        """Pipeline applying ``UnNormalize`` with the same mean/std, then ``ToPILImage``."""
        denormalize = UnNormalize(mean=[0.485, 0.456, 0.406],
                                  std=[0.229, 0.224, 0.225])
        return transforms.Compose([denormalize, transforms.ToPILImage()])

    def get_raw_data(self, idx, split='train'):
        """Load the image at ``idx`` of ``split`` and apply the default validation transform."""
        image = self.raw_tr.loader(self.DATA_INFOS[split][idx]['img'])
        return self.default_val_transform(image)


@DATASETS.register_module()
class sampledimagenet(imagenet):
    """ImageNet variant whose training pool is a random subset of the train split.

    ``'train_full'`` holds ``sample_size`` images drawn without replacement
    from the torchvision ``'train'`` split (fewer when the split itself is
    smaller). The ``'val'`` and ``'test'`` records are both read in full from
    the torchvision ``'val'`` split.

    Args:
        data_path: Root directory of the ImageNet data; ``load_data`` falls
            back to ``'../data/imagenet'`` when it is None.
        initial_size: Forwarded unchanged to the parent constructor.
        sample_size (int): Number of training images to draw. Defaults to
            500000. A negative value makes ``random.sample`` raise
            ``ValueError``.
    """

    def __init__(self,
                 data_path=None,
                 initial_size=None,
                 sample_size=500000):
        # Stored before the parent constructor runs so the value is already
        # available should that constructor trigger load_data()
        # (NOTE(review): presumably it does -- confirm in BaseDataset).
        self._train_sample_size = sample_size
        # Name this class, not the parent, so imagenet.__init__ is not skipped;
        # it resets raw_tr / raw_vl / raw_te before delegating further up.
        super(sampledimagenet, self).__init__(data_path, initial_size)

    def load_data(self):
        """Load the raw ImageNet splits and build the per-sample records.

        Sets ``raw_tr``/``raw_vl``/``raw_te``, the ``'train_full'``, ``'val'``
        and ``'test'`` entries of ``DATA_INFOS``, ``num_samples`` (sampled
        train count + test count), ``INDEX_LB`` (an all-False boolean mask
        with one slot per sampled training image) and ``CLASSES``.

        The subset is drawn with the global ``random`` module state, so it is
        reproducible only if the caller seeds ``random`` beforehand.
        """
        if self.DATA_PATH is None:
            self.DATA_PATH = '../data/imagenet'

        self.raw_tr = datasets.ImageNet(self.DATA_PATH, split='train', download=False)
        self.raw_vl = datasets.ImageNet(self.DATA_PATH, split='val', download=False)
        self.raw_te = datasets.ImageNet(self.DATA_PATH, split='val', download=False)

        # Clamp the request so a train split smaller than sample_size yields
        # the whole split (in random order) instead of a ValueError.
        num_available = len(self.raw_tr)
        num_sampled = min(self._train_sample_size, num_available)
        tr_idxs = random.sample(range(num_available), num_sampled)

        # 'no' is the position inside the sampled subset, not the index in the
        # full train split.
        self.DATA_INFOS['train_full'] = [
            {'no': i, 'img': self.raw_tr.imgs[idx][0], 'gt_label': self.raw_tr.targets[idx]}
            for i, idx in enumerate(tr_idxs)
        ]
        self.DATA_INFOS['val'] = [
            {'no': i, 'img': entry[0], 'gt_label': label}
            for i, (entry, label) in enumerate(zip(self.raw_vl.imgs, self.raw_vl.targets))
        ]
        # Test samples are numbered -1, -2, ... instead of 0, 1, ...
        self.DATA_INFOS['test'] = [
            {'no': -(i + 1), 'img': entry[0], 'gt_label': label}
            for i, (entry, label) in enumerate(zip(self.raw_te.imgs, self.raw_te.targets))
        ]

        num_tr = len(tr_idxs)
        num_te = len(self.raw_te.targets)
        self.num_samples = num_tr + num_te
        self.INDEX_LB = np.zeros(num_tr, dtype=bool)
        self.CLASSES = self.raw_tr.classes
