# Copyright 2022-present, Lorenzo Bonicelli, Pietro Buzzega, Matteo Boschini, Angelo Porrello, Simone Calderara.
# All rights reserved.
# This source code is licensed under the license found in the
# LICENSE file in the root directory of this source tree.

from typing import Tuple

import torch.nn.functional as F
import torch.optim
import torchvision.transforms as transforms
from backbone.ResNet18 import resnet18
from backbone.mobilenet_v2 import mobilenet_v2
from backbone.wideresnet import wrn3410
from backbone.CLIP import Clip
from PIL import Image
from torchvision.datasets import CIFAR100

from dataset.transforms.denormalization import DeNormalize
from dataset.utils.continual_dataset import (ContinualDataset,
                                              store_masked_loaders)
from dataset.utils.validation import get_train_val
from utils.conf import base_path_dataset as base_path


class TCIFAR100(CIFAR100):
    """CIFAR-100 that asks for a download only when the local copy is not intact.

    Exists as a workaround so that the "already downloaded" message is not
    printed each time the dataset is instantiated.
    """

    def __init__(self, root, train=True, transform=None,
                 target_transform=None, download=False) -> None:
        # ``root`` is assigned up front because the integrity check below runs
        # before the parent constructor has had a chance to set anything.
        self.root = root
        # The caller-supplied ``download`` flag is accepted for signature
        # compatibility but is not consulted: the decision is driven solely
        # by the integrity check.
        needs_download = not self._check_integrity()
        super().__init__(root, train=train, transform=transform,
                         target_transform=target_transform,
                         download=needs_download)

class MyCIFAR100(CIFAR100):
    """
    Overrides the CIFAR100 dataset to change the getitem function.

    Every item additionally carries a non-augmented view of the image
    (the raw image passed through ``ToTensor`` only) and, when a ``logits``
    attribute has been attached to the dataset, the logits stored for that
    index.
    """
    def __init__(self, root, train=True, transform=None,
                 target_transform=None, download=False) -> None:
        """
        :param root: directory holding (or receiving) the dataset files
        :param train: forwarded to the parent constructor
        :param transform: optional transform applied to the PIL image
        :param target_transform: optional transform applied to the label
        :param download: accepted for signature compatibility; not consulted,
            a download is requested only when the integrity check fails
        """
        self.not_aug_transform = transforms.Compose([transforms.ToTensor()])
        # ``root`` is assigned before the integrity check, which runs ahead of
        # the parent constructor.
        self.root = root
        super().__init__(root, train, transform, target_transform,
                         download=not self._check_integrity())

    def __getitem__(self, index: int) -> Tuple:
        """
        Gets the requested element from the dataset.
        :param index: index of the element to be returned
        :returns: tuple ``(img, target, not_aug_img)``, where ``img`` is the
            image after ``self.transform`` (the PIL image itself when no
            transform is set), ``target`` is the label after
            ``self.target_transform`` and ``not_aug_img`` is the image passed
            through ``ToTensor`` only. If the dataset has a ``logits``
            attribute, ``self.logits[index]`` is appended as a fourth element.
        """
        img, target = self.data[index], self.targets[index]

        # Transforms operate on PIL images, so convert the stored array first.
        img = Image.fromarray(img, mode='RGB')

        # The non-augmented view is computed from its own copy of the image.
        not_aug_img = self.not_aug_transform(img.copy())

        if self.transform is not None:
            img = self.transform(img)

        if self.target_transform is not None:
            target = self.target_transform(target)

        if hasattr(self, 'logits'):
            return img, target, not_aug_img, self.logits[index]

        return img, target, not_aug_img


class SequentialCIFAR100(ContinualDataset):
    """CIFAR-100 split into 10 sequential tasks of 10 classes each (class-il setting)."""

    NAME = 'seq-cifar100'
    SETTING = 'class-il'
    N_CLASSES_PER_TASK = 10
    N_TASKS = 10

    # Per-channel statistics, shared by the backbone construction and the
    # (de)normalization transforms so the three cannot drift apart.
    _MEAN = (0.5071, 0.4867, 0.4408)
    _STD = (0.2675, 0.2565, 0.2761)
    # Sub-directory of ``base_path()`` in which the dataset files are kept.
    _DATA_DIR = 'CIFAR100'

    # No Normalize step here: mean/std are handed to the backbone instead
    # (see ``get_backbone``).
    TRANSFORM = transforms.Compose(
        [transforms.RandomCrop(32, padding=4),
         transforms.RandomHorizontalFlip(),
         transforms.ToTensor()])

    def get_examples_number(self):
        """
        Returns the number of samples in the CIFAR-100 training split.

        Reads from the same directory as ``get_data_loaders`` so the dataset
        is not stored a second time under a different folder.
        """
        train_dataset = MyCIFAR100(base_path() + self._DATA_DIR, train=True,
                                   download=True)
        return len(train_dataset.data)

    def get_data_loaders(self):
        """
        Builds the train and test loaders via ``store_masked_loaders``.

        The training pipeline is: optional augmentation policy selected by
        ``args.aug`` ('aua' -> AutoAugment, 'ra' -> RandAugment(2, 8), anything
        else -> none), then a padded random crop, a random horizontal flip and
        ``ToTensor``. When ``args.model_type`` is 'clip' images are resized to
        224x224 first, for both training and testing.
        :returns: tuple (train loader, test loader) as produced by
            ``store_masked_loaders``
        """
        aug = self.args.aug
        if aug == 'aua':
            transform_aug = [transforms.AutoAugment(policy=transforms.AutoAugmentPolicy.CIFAR10)]
        elif aug == 'ra':
            transform_aug = [transforms.RandAugment(2, 8)]
        else:
            # 'none' and any unrecognised value: no augmentation policy.
            transform_aug = []

        if self.args.model_type == 'clip':
            transform_aug += [transforms.Resize((224, 224)),
                              transforms.RandomCrop(224, padding=4)]
            test_transform = transforms.Compose(
                [transforms.Resize((224, 224)), transforms.ToTensor()])
        else:
            transform_aug.append(transforms.RandomCrop(32, padding=4))
            test_transform = transforms.Compose([transforms.ToTensor()])

        transform = transforms.Compose(
            transform_aug + [transforms.RandomHorizontalFlip(),
                             transforms.ToTensor()])

        train_dataset = MyCIFAR100(base_path() + self._DATA_DIR, train=True,
                                   download=True, transform=transform)
        if self.args.validation:
            # The evaluation set is carved out of the training data.
            train_dataset, test_dataset = get_train_val(train_dataset,
                                                        test_transform, self.NAME)
        else:
            test_dataset = TCIFAR100(base_path() + self._DATA_DIR, train=False,
                                     download=True, transform=test_transform)

        train, test = store_masked_loaders(train_dataset, test_dataset, self)

        return train, test

    @staticmethod
    def get_transform():
        """Returns ``TRANSFORM`` preceded by a ``ToPILImage`` conversion."""
        transform = transforms.Compose(
            [transforms.ToPILImage(), SequentialCIFAR100.TRANSFORM])
        return transform

    @staticmethod
    def get_backbone(args):
        """
        Instantiates the backbone selected by ``args``.

        ``args.architecture`` is checked first ("RES-18", "MN-V2",
        "WRN-34-10"); only if none matches is ``args.model_type == "clip"``
        considered.
        :param args: namespace providing ``architecture`` and ``model_type``
        :returns: the constructed backbone
        :raises NotImplementedError: if no supported backbone is selected
        """
        # NOTE: the statistics are placed on the CUDA device unconditionally,
        # so this method requires a CUDA-enabled environment.
        mean = torch.tensor(SequentialCIFAR100._MEAN).cuda().view(-1, 1, 1)
        std = torch.tensor(SequentialCIFAR100._STD).cuda().view(-1, 1, 1)
        n_classes = SequentialCIFAR100.N_CLASSES_PER_TASK * SequentialCIFAR100.N_TASKS

        if args.architecture == "RES-18":
            return resnet18(mean, std, n_classes)
        elif args.architecture == "MN-V2":
            return mobilenet_v2(mean, std, n_classes)
        elif args.architecture == "WRN-34-10":
            return wrn3410(mean, std, n_classes)
        elif args.model_type == "clip":
            return Clip(args, mean, std)
        else:
            raise NotImplementedError(
                f"Unsupported backbone: architecture={args.architecture!r}, "
                f"model_type={args.model_type!r}")

    @staticmethod
    def get_loss():
        """Returns the loss function (cross entropy)."""
        return F.cross_entropy

    @staticmethod
    def get_normalization_transform():
        """Returns a ``Normalize`` transform built from the dataset statistics."""
        transform = transforms.Normalize(SequentialCIFAR100._MEAN,
                                         SequentialCIFAR100._STD)
        return transform

    @staticmethod
    def get_denormalization_transform():
        """Returns a ``DeNormalize`` transform built from the dataset statistics."""
        transform = DeNormalize(SequentialCIFAR100._MEAN,
                                SequentialCIFAR100._STD)
        return transform

    @staticmethod
    def get_epochs():
        """Returns the number of epochs (50)."""
        return 50

    @staticmethod
    def get_batch_size():
        """Returns the batch size (32)."""
        # NOTE(review): an earlier comment here read "revised 32 --> 128",
        # but the value in effect is 32 -- confirm which one is intended.
        return 32

    @staticmethod
    def get_minibatch_size():
        """Returns the minibatch size, which equals the batch size."""
        return SequentialCIFAR100.get_batch_size()

    @staticmethod
    def get_scheduler(model, args):
        """
        Sets up the optimizer on ``model`` and returns the LR scheduler.

        For ``args.model_type == 'clip'`` a model exposing ``get_optimizer``
        is fully delegated to: its return value is handed back unchanged and
        ``model.opt`` is not touched here. Otherwise ``model.opt`` is set to
        SGD and a ``MultiStepLR`` decaying by 0.1 at epochs 35 and 45 is
        returned.
        :param model: the continual-learning model
        :param args: namespace providing ``model_type``, ``lr``, ``optim_wd``
            and ``optim_mom``
        :returns: the scheduler (or whatever ``model.get_optimizer`` returns)
        """
        if args.model_type == 'clip':
            if hasattr(model, 'get_optimizer'):
                return model.get_optimizer(args)
            params = model.parameters(args)
        else:
            params = model.net.parameters()

        model.opt = torch.optim.SGD(params, lr=args.lr,
                                    weight_decay=args.optim_wd,
                                    momentum=args.optim_mom)
        # ``verbose`` is deliberately not passed: it is deprecated in recent
        # PyTorch releases and ``False`` was the default anyway.
        return torch.optim.lr_scheduler.MultiStepLR(model.opt, [35, 45], gamma=0.1)

    @staticmethod
    def get_robust_scheduler(model, args) -> torch.optim.lr_scheduler:
        """
        Sets up the optimizer on ``model`` and returns the LR scheduler, with
        milestones expressed as fractions of ``args.n_epochs``.

        A model exposing ``get_optimizer`` is fully delegated to. Otherwise
        ``model.opt`` is set to SGD and a ``MultiStepLR`` decaying by 0.1 at
        48%, 62% and 80% of ``args.n_epochs`` (truncated to int) is returned.
        :param model: the continual-learning model
        :param args: namespace providing ``n_epochs``, ``lr``, ``optim_wd``
            and ``optim_mom``
        :returns: the scheduler (or whatever ``model.get_optimizer`` returns)
        """
        # NOTE: the return annotation names the scheduler module rather than
        # a class; it is kept unchanged for compatibility.
        if hasattr(model, 'get_optimizer'):
            return model.get_optimizer(args)

        model.opt = torch.optim.SGD(model.parameters(args), lr=args.lr,
                                    weight_decay=args.optim_wd,
                                    momentum=args.optim_mom)
        milestones = [int(args.n_epochs * fraction) for fraction in (0.48, 0.62, 0.80)]
        # ``verbose`` is deliberately not passed: it is deprecated in recent
        # PyTorch releases and ``False`` was the default anyway.
        return torch.optim.lr_scheduler.MultiStepLR(model.opt, milestones, gamma=0.1)