# Copyright 2022-present, Lorenzo Bonicelli, Pietro Buzzega, Matteo Boschini, Angelo Porrello, Simone Calderara.
# All rights reserved.
# This source code is licensed under the license found in the
# LICENSE file in the root directory of this source tree.

from copy import deepcopy
from typing import Tuple
import torchvision.transforms as transforms
import numpy as np
import torch
import torch.nn as nn
from dataset.seq_tinyimagenet import MyTinyImagenet
from torch.utils.data import DataLoader

def icarl_replay(self, dataset, val_set_split=0):
    """
    Merge the replay buffer with the current task data.
    Optionally split the replay buffer into a validation set.

    Nothing is done on the first task (``self.task`` not greater than 0).
    For ``seq-tinyimg`` the work is delegated to ``icarl_replay_tinyimg``.

    When ``val_set_split > 0`` a deep copy of ``dataset.train_loader`` is
    stored in ``self.val_loader``. A random subset of the buffer (each item
    is picked with probability ``val_set_split``) and an equally sized random
    subset of the task data are moved into that copy; everything else stays
    in ``dataset.train_loader``.

    :param self: the model instance (reads ``task``, ``buffer``, ``args.dataset``; may set ``val_loader``)
    :param dataset: the dataset (its ``train_loader.dataset`` ``data``/``targets`` are replaced in place)
    :param val_set_split: the fraction of the replay buffer to be used as validation set
    :raises ValueError: if the dataset is augmented and its samples are neither 2- nor 3-dimensional
    """
    if dataset.NAME == 'seq-tinyimg':
        icarl_replay_tinyimg(self, dataset, val_set_split)
        return
    if self.task <= 0:
        return

    train_set = dataset.train_loader.dataset
    buf_len = len(self.buffer)

    # True marks the items that go to the validation split.
    buff_val_mask = torch.rand(buf_len) < val_set_split
    val_train_mask = torch.zeros(len(train_set.data)).bool()
    val_train_mask[torch.randperm(len(train_set.data))[:buff_val_mask.sum()]] = True

    if val_set_split > 0:
        # Copy BEFORE the training set is reduced, so the validation split
        # can still pick its samples from the untouched task data.
        self.val_loader = deepcopy(dataset.train_loader)

    data_concatenate = torch.cat if isinstance(train_set.data, torch.Tensor) else np.concatenate

    # refold_transform converts buffer examples back to the storage format
    # of the dataset's ``data`` attribute.
    if not hasattr(train_set, 'not_aug_transform'):
        def refold_transform(x): return x.cpu()
    else:
        data_shape = len(train_set.data[0].shape)
        if dataset.NAME == 'seq-SVHN' or data_shape == 2:
            def refold_transform(x): return (x.cpu() * 255).squeeze(1).type(torch.uint8)
        elif data_shape == 3:
            def refold_transform(x): return (x.cpu() * 255).permute([0, 2, 3, 1]).numpy().astype(np.uint8)
        else:
            raise ValueError(
                'icarl_replay: unsupported sample rank %d for dataset %s' % (data_shape, dataset.NAME))

    is_stl10 = self.args.dataset == 'seq-stl10'
    buffer_labels = self.buffer.labels.cpu().numpy()[:buf_len]

    def merge_into(target_set, task_mask, buffer_mask):
        """Keep the masked task items of ``target_set`` and append the masked buffer items."""
        buffer_rows = refold_transform(self.buffer.examples[:buf_len][buffer_mask])
        if is_stl10:
            # The refolded rows are channel-last; seq-stl10 gets them transposed to channel-first.
            buffer_rows = np.transpose(buffer_rows, (0, 3, 1, 2))
        target_set.targets = np.concatenate([
            target_set.targets[task_mask],
            buffer_labels[buffer_mask]
        ])
        target_set.data = data_concatenate([
            target_set.data[task_mask],
            buffer_rows
        ])

    # REDUCE AND MERGE TRAINING SET
    merge_into(train_set, ~val_train_mask, ~buff_val_mask)

    if val_set_split > 0:
        # REDUCE AND MERGE VALIDATION SET
        # Same masks as the validation targets, applied to self.val_loader.
        merge_into(self.val_loader.dataset, val_train_mask, buff_val_mask)


def icarl_replay_tinyimg(self, dataset, val_set_split=0):
    """
    Merge the replay buffer with the current task data.
    Optionally split the replay buffer into a validation set.

    Variant of the replay merge for datasets whose train loader wraps an
    inner ``Dataset`` object holding a ``samples`` sequence and a ``targets``
    array. Buffer examples are expected to be stored as one-element
    containers (the stored sample is read back with ``[0]``).

    Nothing is done on the first task (``self.task`` not greater than 0).

    :param self: the model instance (reads ``task`` and ``buffer``; may set ``val_loader``)
    :param dataset: the dataset (``train_loader.dataset.Dataset`` is modified in place)
    :param val_set_split: the fraction of the replay buffer to be used as validation set
    """
    if self.task <= 0:
        return

    train_set = dataset.train_loader.dataset.Dataset
    buf_len = len(self.buffer)

    # True marks the items that go to the validation split.
    buff_val_mask = torch.rand(buf_len) < val_set_split
    val_train_mask = torch.zeros(len(train_set.samples)).bool()
    val_train_mask[torch.randperm(len(train_set.samples))[:buff_val_mask.sum()]] = True

    if val_set_split > 0:
        # Copy BEFORE the training set is reduced.
        self.val_loader = deepcopy(dataset.train_loader)

    buffer_labels = self.buffer.labels.cpu().numpy()[:buf_len]
    buffer_examples = self.buffer.examples[:buf_len]

    def select(items, mask):
        """Return the items whose mask entry is True, preserving order."""
        return [item for item, keep in zip(items, mask.tolist()) if keep]

    def merge_into(target_set, task_mask, buffer_mask):
        """Keep the masked task items of ``target_set`` and append the masked buffer items."""
        target_set.targets = np.concatenate([
            target_set.targets[task_mask],
            buffer_labels[buffer_mask]
        ])
        target_set.samples = select(target_set.samples, task_mask) + \
            [stored[0] for stored in select(buffer_examples, buffer_mask)]

    # REDUCE AND MERGE TRAINING SET
    merge_into(train_set, ~val_train_mask, ~buff_val_mask)

    if val_set_split > 0:
        # REDUCE AND MERGE VALIDATION SET
        merge_into(self.val_loader.dataset.Dataset, val_train_mask, buff_val_mask)




def reservoir(num_seen_examples: int, buffer_size: int) -> int:
    """
    Pick the buffer slot for the next item using reservoir sampling.

    While the buffer still has free room the item goes to the next free
    slot. Afterwards a slot is drawn uniformly from
    ``[0, num_seen_examples]`` and the item is kept only if the draw lands
    inside the buffer.

    :param num_seen_examples: the number of examples seen before this one
    :param buffer_size: the maximum buffer size
    :return: the slot index where the item must be stored, or -1 to discard it
    """
    # Buffer not full yet: fill slots in arrival order.
    if num_seen_examples < buffer_size:
        return num_seen_examples

    candidate = np.random.randint(0, num_seen_examples + 1)
    return candidate if candidate < buffer_size else -1


def ring(num_seen_examples: int, buffer_portion_size: int, task: int) -> int:
    """
    Pick the buffer slot for the next item using a per-task ring.

    :param num_seen_examples: the number of examples seen so far
    :param buffer_portion_size: the number of slots in each task's portion
    :param task: the index of the task whose portion is written
    :return: the slot index, cycling inside the portion that starts at ``task * buffer_portion_size``
    """
    portion_start = task * buffer_portion_size
    offset_in_portion = num_seen_examples % buffer_portion_size
    return offset_in_portion + portion_start


class Buffer:
    """
    The memory buffer of rehearsal method.

    Storage is created lazily on the first insertion: tensor inputs get a
    pre-allocated tensor with ``buffer_size`` rows, any other kind of
    ``examples`` input is kept in a plain Python list of ``buffer_size``
    slots (each filled slot holds a one-element list wrapping the sample).
    """

    def __init__(self, buffer_size, device, n_tasks=None, mode='reservoir'):
        """
        :param buffer_size: the maximum number of stored items
        :param device: the device on which tensor storage is allocated
        :param n_tasks: the number of tasks (required when ``mode`` is 'ring')
        :param mode: the index policy name, 'ring' or 'reservoir'
        """
        assert mode in ('ring', 'reservoir')
        self.buffer_size = buffer_size
        self.device = device
        self.num_seen_examples = 0
        # Explicit dispatch table rather than eval() on the mode string.
        self.functional_index = {'ring': ring, 'reservoir': reservoir}[mode]
        if mode == 'ring':
            assert n_tasks is not None
            self.task_number = n_tasks
            self.buffer_portion_size = buffer_size // n_tasks
        self.attributes = ['examples', 'labels', 'logits', 'task_labels']

    def to(self, device):
        """
        Move every tensor-backed attribute to ``device``.
        List-backed storage (non-tensor examples) is left untouched.
        :param device: the target device
        :return: the buffer itself
        """
        self.device = device
        for attr_str in self.attributes:
            attr = getattr(self, attr_str, None)
            if torch.is_tensor(attr):
                setattr(self, attr_str, attr.to(device))
        return self

    def __len__(self):
        """
        Returns the number of items currently stored, capped at ``buffer_size``.
        """
        return min(self.num_seen_examples, self.buffer_size)

    def init_tensors(self, examples: torch.Tensor, labels: torch.Tensor,
                     logits: torch.Tensor, task_labels: torch.Tensor) -> None:
        """
        Initializes just the required tensors.
        Attributes that already exist, or whose argument is None, are skipped.
        :param examples: tensor containing the images
        :param labels: tensor containing the labels
        :param logits: tensor containing the outputs of the network
        :param task_labels: tensor containing the task labels
        """
        provided = {
            'examples': examples,
            'labels': labels,
            'logits': logits,
            'task_labels': task_labels,
        }
        for attr_str in self.attributes:
            attr = provided.get(attr_str)
            if attr is not None and not hasattr(self, attr_str):
                # 'labels' and 'task_labels' are integer, everything else is float.
                typ = torch.int64 if attr_str.endswith('els') else torch.float32
                if torch.is_tensor(attr):
                    setattr(self, attr_str, torch.zeros((self.buffer_size,
                            *attr.shape[1:]), dtype=typ, device=self.device))
                else:
                    setattr(self, attr_str, [None] * self.buffer_size)

    def _store(self, index, i, examples, labels, logits, task_labels):
        """
        Writes the i-th item of the given batch into slot ``index``.
        """
        if torch.is_tensor(self.examples):
            self.examples[index] = examples[i].to(self.device)
        else:
            # List storage: each slot wraps its sample in a one-element list.
            self.examples[index] = [examples[i]]
        if labels is not None:
            self.labels[index] = labels[i].to(self.device)
        if logits is not None:
            self.logits[index] = logits[i].to(self.device)
        if task_labels is not None:
            self.task_labels[index] = task_labels[i].to(self.device)

    def add_data(self, examples, labels=None, logits=None, task_labels=None):
        """
        Adds the data to the memory buffer according to the reservoir strategy.
        :param examples: tensor (or list) containing the images
        :param labels: tensor containing the labels
        :param logits: tensor containing the outputs of the network
        :param task_labels: tensor containing the task labels
        :return:
        """
        if not hasattr(self, 'examples'):
            self.init_tensors(examples, labels, logits, task_labels)

        # The batch size is taken from labels when given; otherwise fall back
        # to the examples so that labels=None does not crash.
        n_items = labels.shape[0] if labels is not None else len(examples)
        for i in range(n_items):
            index = reservoir(self.num_seen_examples, self.buffer_size)
            self.num_seen_examples += 1
            if index >= 0:
                self._store(index, i, examples, labels, logits, task_labels)

    def add_data_rm(self, examples, labels=None, logits=None, task_labels=None):
        """
        Appends the data to the memory buffer sequentially: every item is
        written to the next free slot, without any random replacement.
        :param examples: tensor containing the images
        :param labels: tensor containing the labels
        :param logits: tensor containing the outputs of the network
        :param task_labels: tensor containing the task labels
        :return:
        :raises IndexError: if the buffer has no free slot left
        """
        if not hasattr(self, 'examples'):
            self.init_tensors(examples, labels, logits, task_labels)

        for i in range(len(examples)):
            index = self.num_seen_examples
            if index >= self.buffer_size:
                # Fail before touching the counter so the buffer stays consistent.
                raise IndexError(
                    'Buffer is full: cannot append item at index %d (buffer_size=%d)'
                    % (index, self.buffer_size))
            self.num_seen_examples += 1
            self._store(index, i, examples, labels, logits, task_labels)

    def get_data(self, size: int, transform: nn.Module = None, return_index=False) -> Tuple:
        """
        Random samples a batch of size items (without replacement).
        Requires tensor-backed examples.
        :param size: the number of requested items (capped at the number of stored items)
        :param transform: the transformation to be applied (data augmentation)
        :param return_index: if True, the sampled indexes are prepended to the result
        :return: a tuple with the examples followed by every other initialized attribute
        """
        available = min(self.num_seen_examples, len(self.examples))
        size = min(size, available)

        choice = np.random.choice(available, size=size, replace=False)
        if transform is None:
            def transform(x): return x
        ret_tuple = (torch.stack([transform(ee.cpu()) for ee in self.examples[choice]]).to(self.device),)
        for attr_str in self.attributes[1:]:
            if hasattr(self, attr_str):
                attr = getattr(self, attr_str)
                ret_tuple += (attr[choice],)

        if not return_index:
            return ret_tuple
        return (torch.tensor(choice).to(self.device), ) + ret_tuple

    def get_data_by_index(self, indexes, transform: nn.Module = None) -> Tuple:
        """
        Returns the data by the given index.
        Requires tensor-backed examples.
        :param indexes: the indexes of the items
        :param transform: the transformation to be applied (data augmentation)
        :return: a tuple with the examples followed by every other initialized attribute
        """
        if transform is None:
            def transform(x): return x
        ret_tuple = (torch.stack([transform(ee.cpu())
                                  for ee in self.examples[indexes]]).to(self.device),)
        for attr_str in self.attributes[1:]:
            if hasattr(self, attr_str):
                attr = getattr(self, attr_str).to(self.device)
                ret_tuple += (attr[indexes],)
        return ret_tuple

    def is_empty(self) -> bool:
        """
        Returns true if the buffer is empty, false otherwise.
        """
        return self.num_seen_examples == 0

    def get_all_data(self, transform: nn.Module = None) -> Tuple:
        """
        Return all the items in the memory buffer.
        For list-backed examples the transform is not applied and empty slots
        are filled with the sample stored in slot 0.
        :param transform: the transformation to be applied (data augmentation)
        :return: a tuple with all the items in the memory buffer
        """
        if transform is None:
            def transform(x): return x
        if torch.is_tensor(self.examples):
            ret_tuple = (torch.stack([transform(ee.cpu())
                                      for ee in self.examples]).to(self.device),)
        else:
            # Unwrap the one-element slot containers; always build a tuple so
            # both branches return the same container type.
            ret_tuple = ([s[0] if s is not None else self.examples[0][0] for s in self.examples],)
        for attr_str in self.attributes[1:]:
            if hasattr(self, attr_str):
                attr = getattr(self, attr_str)
                ret_tuple += (attr,)
        return ret_tuple

    def empty(self) -> None:
        """
        Delete every stored attribute and reset the seen-examples counter,
        so that storage is re-created on the next insertion.
        """
        for attr_str in self.attributes:
            if hasattr(self, attr_str):
                delattr(self, attr_str)
        self.num_seen_examples = 0


def _tinyimg_herding_transform(args):
    """Build the transform pipeline applied when re-reading the training images for herding."""
    if args.aug == 'aua':
        steps = [transforms.AutoAugment(policy=transforms.AutoAugmentPolicy.CIFAR10)]
    elif args.aug == 'ra':
        steps = [transforms.RandAugment(2, 8)]
    else:
        steps = []

    if args.model_type == 'clip':
        steps.append(transforms.Resize((224, 224)))
        steps.append(transforms.RandomCrop(224, padding=4))
    else:
        steps.append(transforms.RandomCrop(64, padding=4))

    steps.append(transforms.RandomHorizontalFlip())
    steps.append(transforms.ToTensor())
    return transforms.Compose(steps)


def fill_buffer_tinyimg(self, mem_buffer: Buffer, dataset, t_idx: int, train_texts=None) -> None:
    """
    Adds examples from the current task to the memory buffer
    by means of the herding strategy.

    The network is switched to eval mode for the duration of the call and its
    previous training mode is restored afterwards, also if an error occurs.
    Features are extracted without tracking gradients.

    :param self: the model instance (reads ``net``, ``args``, ``device``, ``classes_so_far``, ``buffer``, ``NAME``)
    :param mem_buffer: the memory buffer
    :param dataset: the dataset from which take the examples
    :param t_idx: the task index
    :param train_texts: optional text inputs; when given, the images are resized to 224x224
        and the logits come from the text-conditioned forward pass selected by ``self.NAME``
    """
    mode = self.net.training
    self.net.eval()
    try:
        with torch.no_grad():
            samples_per_class = mem_buffer.buffer_size // len(self.classes_so_far)
            if t_idx > 0:
                # 1) First, subsample prior classes
                buf_x, buf_y, buf_l = self.buffer.get_all_data()

                mem_buffer.empty()
                for _y in buf_y.unique():
                    idx = (buf_y == _y)
                    _y_x = [s for s, keep in zip(buf_x, idx) if keep]
                    _y_y, _y_l = buf_y[idx], buf_l[idx]
                    mem_buffer.add_data(
                        examples=_y_x[:samples_per_class],
                        labels=_y_y[:samples_per_class],
                        logits=_y_l[:samples_per_class]
                    )

            # 2) Then, fill with current tasks
            transform = _tinyimg_herding_transform(self.args)
            # NOTE(review): the dataset location is hard-coded relative to the working directory.
            train_dataset = MyTinyImagenet('./tinyImageNet/tiny-imagenet-200/train/', train=True,
                                           download=True, transform=transform)
            loader = DataLoader(train_dataset, batch_size=self.args.batch_size, num_workers=4)
            classes_start = t_idx * dataset.N_CLASSES_PER_TASK
            classes_end = (t_idx + 1) * dataset.N_CLASSES_PER_TASK

            # 2.1 Extract all features
            a_y, a_f, a_l = [], [], []
            for _, y, not_norm_x in loader:
                # Keep only the samples that belong to the current task.
                mask = (y >= classes_start) & (y < classes_end)
                y, not_norm_x = y[mask], not_norm_x[mask]
                if not y.size(0):
                    continue
                not_norm_x = not_norm_x.to(self.device)
                a_y.append(y.to('cpu'))
                if train_texts is None:
                    feats = self.net(not_norm_x, returnt='features')
                    outs = self.net.classifier(feats)
                else:
                    not_norm_x_224 = torch.nn.functional.interpolate(not_norm_x, size=(224, 224), mode='bicubic')
                    if self.NAME == 'proof':
                        train_texts_features = self.net.convnet.encode_text(train_texts)
                        feats, text_embed, _, _ = self.net(not_norm_x_224, train_texts_features)
                        outs = feats @ text_embed.t()
                    elif self.NAME == 'rapf':
                        outs, _, feats = self.net(not_norm_x_224, train_texts=train_texts, ori_ima_f=True)
                    else:
                        features, text_embed = self.net(not_norm_x_224, train_texts)
                        feats = features[:, 0, :]
                        outs = feats @ text_embed.t()
                a_f.append(feats.cpu())
                a_l.append(torch.sigmoid(outs).cpu())
            a_y, a_f, a_l = torch.cat(a_y), torch.cat(a_f), torch.cat(a_l)

            # 2.2 Compute class means
            for _y in a_y.unique():
                idx = (a_y == _y)
                # NOTE(review): assumes dataset.train_loader's samples are in the same order
                # as the task-filtered items read from the loader above - confirm.
                _x = [s for s, keep in zip(dataset.train_loader.dataset.Dataset.samples, idx) if keep]
                _y, _l = a_y[idx], a_l[idx]
                feats = a_f[idx]
                mean_feat = feats.mean(0, keepdim=True)

                running_sum = torch.zeros_like(mean_feat)
                i = 0
                while i < samples_per_class and i < feats.shape[0]:
                    # Pick the sample that brings the running mean closest to the class mean.
                    cost = (mean_feat - (feats + running_sum) / (i + 1)).norm(2, 1)

                    idx_min = cost.argmin().item()

                    mem_buffer.add_data(
                        examples=_x[idx_min:idx_min + 1],
                        labels=_y[idx_min:idx_min + 1].to(self.device),
                        logits=_l[idx_min:idx_min + 1].to(self.device)
                    )

                    running_sum += feats[idx_min:idx_min + 1]
                    # Push the chosen sample far away so it is not selected again.
                    feats[idx_min] = feats[idx_min] + 1e6
                    i += 1

            assert len(mem_buffer.examples) <= mem_buffer.buffer_size
            assert mem_buffer.num_seen_examples <= mem_buffer.buffer_size
    finally:
        self.net.train(mode)