import logging
import numpy as np
from PIL import Image
from torch.utils.data import Dataset
from torchvision import transforms
from utils.data import iCIFAR10, iCIFAR100, iImageNet100, iImageNet1000, TinyImageNet200
import torch, copy
import os, ipdb, random
import numpy as np
import torch.backends.cudnn as cudnn


def setup_seed(seed):
    """Seed the Python, NumPy and PyTorch random generators with ``seed``.

    Also switches cuDNN into deterministic mode.

    Args:
        seed: Integer seed applied to every generator.

    NOTE(review): ``cudnn.benchmark`` is not touched here; confirm whether
    it should also be disabled for fully reproducible runs.
    """
    # Host-side generators.
    random.seed(seed)
    np.random.seed(seed)

    # PyTorch CPU generator, then the current and all CUDA devices.
    torch.manual_seed(seed)
    torch.cuda.manual_seed(seed)
    torch.cuda.manual_seed_all(seed)

    cudnn.deterministic = True


def average_bias_vector(bias_list):
    """
    Aggregate the bias vectors uploaded by the clients.

    Args:
    - bias_list: List[Tensor or None]; every tensor is stacked along a new
      leading dimension, so all tensors must share one shape.

    Returns:
    - The element-wise mean of the non-``None`` entries, or ``None`` when
      no client returned a bias.
    """
    # Drop the clients that did not return a bias.
    present = [bias for bias in bias_list if bias is not None]
    if not present:
        return None
    stacked = torch.stack(present, dim=0)
    return stacked.mean(dim=0)


def average_weights(w):
    """
    Returns the element-wise mean of a sequence of state dicts.

    ``w`` is a sequence of mappings from parameter name to tensor. The
    first entry is deep-copied and used as the accumulator, so none of the
    inputs is modified. Every key of the first entry must exist in all the
    other entries.
    """
    n_models = len(w)
    averaged = copy.deepcopy(w[0])
    for name in averaged.keys():
        # Accumulate the remaining models in place on the copied tensor.
        for model_pos in range(1, n_models):
            averaged[name] += w[model_pos][name]
        if 'num_batches_tracked' not in name:
            averaged[name] = torch.div(averaged[name], n_models)
        else:
            averaged[name] = averaged[name].true_divide(n_models)
    return averaged


def average_weights_with_loss(w, loss_weight):
    """
    Returns the average of the weights, weighted by ``softmax(loss_weight)``.

    The previous implementation called ``torch.softmax`` without its
    required ``dim`` argument (so it always raised) and never used the
    result. Each client's tensors are now scaled by that client's softmax
    coefficient before being summed; equal scores therefore reproduce the
    plain average.

    Args:
        w: Sequence of state dicts (parameter name -> tensor), one per client.
        loss_weight: One score per client, either a tensor or an iterable
            of numbers / 0-dim tensors. A larger score gives that client a
            larger share of the average.

    Returns:
        A new dict with the same keys as ``w[0]``. The inputs are not
        modified.

    Raises:
        ValueError: If ``w`` is empty or the number of scores differs from
            the number of state dicts.
    """
    if len(w) == 0:
        raise ValueError("average_weights_with_loss() needs at least one state dict.")

    if isinstance(loss_weight, torch.Tensor):
        scores = loss_weight.detach().to(device="cpu", dtype=torch.float32).flatten()
    else:
        scores = torch.tensor([float(v) for v in loss_weight], dtype=torch.float32)
    if scores.numel() != len(w):
        raise ValueError(
            "Expected {} loss weights, got {}.".format(len(w), scores.numel())
        )

    # Plain Python floats multiply with tensors on any device and dtype.
    coeffs = torch.softmax(scores, dim=0).tolist()

    w_avg = copy.deepcopy(w[0])
    for key in w_avg.keys():
        if 'num_batches_tracked' in key:
            # A step counter, not a learned parameter: keep the plain mean.
            for i in range(1, len(w)):
                w_avg[key] += w[i][key]
            w_avg[key] = w_avg[key].true_divide(len(w))
        else:
            blended = w[0][key] * coeffs[0]
            for i in range(1, len(w)):
                blended = blended + w[i][key] * coeffs[i]
            w_avg[key] = blended
    return w_avg


class DatasetSplit(Dataset):
    """Dataset view restricted to the sample positions listed in ``idxs``.

    The wrapped ``dataset`` must expose ``images`` and ``labels``
    containers that accept a list of integer positions, and must return an
    ``(idx, image, label)`` triple when indexed.
    """

    def __init__(self, dataset, idxs):
        self.dataset = dataset
        # Normalise every position to a built-in int.
        self.idxs = list(map(int, idxs))
        self.images = dataset.images[self.idxs]
        self.labels = dataset.labels[self.idxs]

    def __len__(self):
        return len(self.idxs)

    def __getitem__(self, item):
        # Translate the local position into a position of the wrapped dataset.
        source_pos = self.idxs[item]
        idx, image, label = self.dataset[source_pos]
        return idx, image, label


def record_net_data_stats(y_train, net_dataidx_map):
    """Count, for every party, how many samples of each class it holds.

    Args:
        y_train: NumPy array of labels, indexed by sample position.
        net_dataidx_map: Mapping from party id to the sample positions
            assigned to that party.

    Returns:
        Dict mapping party id to a ``{class label: sample count}`` dict.
        The same statistics are also printed to stdout.
    """
    net_cls_counts = {}
    for party, sample_ids in net_dataidx_map.items():
        classes, counts = np.unique(y_train[sample_ids], return_counts=True)
        net_cls_counts[party] = dict(zip(classes, counts))

    print('Data statistics: %s' % str(net_cls_counts))

    return net_cls_counts


def partition_data(y_train, beta=0.4, n_parties=5, seed=2023):
    """Split sample positions among ``n_parties`` clients.

    With ``beta == 0`` the positions are shuffled and cut into
    near-equal chunks (IID). With ``beta > 0`` each class is distributed
    with proportions drawn from a symmetric Dirichlet(``beta``)
    distribution; a party that already holds at least
    ``data_size / n_parties`` samples receives no share of the remaining
    classes. The whole draw is repeated until every party holds at least
    one sample.

    Args:
        y_train: NumPy array of labels, one per sample.
        beta: Dirichlet concentration; ``0`` selects the IID split.
        n_parties: Number of clients to split the data among.
        seed: Seed applied to NumPy's global generator before sampling.
            Defaults to 2023, the value that used to be hard-coded. Pass
            ``None`` to leave the global generator state untouched.

    Returns:
        ``(net_dataidx_map, train_data_cls_counts)``. The first maps party
        id to its sample positions (NumPy arrays in the IID branch, lists
        in the Dirichlet branch). The second holds the per-party class
        counts from ``record_net_data_stats``.

    Raises:
        ValueError: If ``beta`` is negative or ``n_parties`` is smaller
            than 1. A negative ``beta`` previously fell through both
            branches and failed on an unbound variable.
    """
    if beta < 0:
        raise ValueError("beta must be >= 0, got {}.".format(beta))
    if n_parties < 1:
        raise ValueError("n_parties must be >= 1, got {}.".format(n_parties))

    data_size = y_train.shape[0]
    if seed is not None:
        np.random.seed(seed)

    if beta == 0:  # for iid
        idxs = np.random.permutation(data_size)
        batch_idxs = np.array_split(idxs, n_parties)
        net_dataidx_map = {i: batch_idxs[i] for i in range(n_parties)}

    else:  # for niid
        min_size = 0
        min_require_size = 1
        labels = np.unique(y_train)
        net_dataidx_map = {}
        idx_batch = [[] for _ in range(n_parties)]

        # NOTE(review): this loop cannot finish when there are fewer
        # samples than parties; confirm callers never request that.
        while min_size < min_require_size:
            idx_batch = [[] for _ in range(n_parties)]
            for k in labels:
                idx_k = np.where(y_train == k)[0]
                np.random.shuffle(idx_k)  # shuffle the samples of this class
                proportions = np.random.dirichlet(np.repeat(beta, n_parties))
                # Zero the share of parties that already reached the
                # average load so the split stays roughly balanced.
                proportions = np.array(
                    [p * (len(idx_j) < data_size / n_parties) for p, idx_j in zip(proportions, idx_batch)])
                proportions = proportions / proportions.sum()
                # Turn cumulative proportions into split points within idx_k.
                proportions = (np.cumsum(proportions) * len(idx_k)).astype(int)[:-1]
                idx_batch = [idx_j + idx.tolist() for idx_j, idx in zip(idx_batch, np.split(idx_k, proportions))]
                min_size = min(len(idx_j) for idx_j in idx_batch)

        for j in range(n_parties):
            np.random.shuffle(idx_batch[j])
            net_dataidx_map[j] = idx_batch[j]

    train_data_cls_counts = record_net_data_stats(y_train, net_dataidx_map)
    return net_dataidx_map, train_data_cls_counts


class DataManager(object):
    """Load a dataset, fix its class order and serve per-class subsets.

    Labels are remapped so that class ``k`` is the ``k``-th entry of the
    class order. The classes are then grouped into tasks: ``init_cls``
    classes first, followed by groups of ``increment`` classes, with the
    final group absorbing whatever remains.
    """

    def __init__(self, dataset_name, shuffle, seed, init_cls, increment, args):
        """Load ``dataset_name`` and compute the per-task class counts.

        Args:
            dataset_name: Name understood by ``_get_idata``.
            shuffle: ``1`` to use a seeded random class order, anything
                else to use the dataset's own order.
            seed: Seed for the class-order permutation.
            init_cls: Number of classes in the first task.
            increment: Number of classes in each later task.
            args: Passed through to the dataset constructor.
        """
        self.args = args
        self.dataset_name = dataset_name
        self._setup_data(dataset_name, shuffle, seed)
        total = len(self._class_order)
        assert init_cls <= total, "No enough classes."
        self._increments = [init_cls]
        # Add a full increment only while at least one more full increment
        # would still fit afterwards. ``increment > 0`` guards against an
        # endless loop when a non-positive increment is passed.
        while increment > 0 and sum(self._increments) + 2 * increment <= total:
            self._increments.append(increment)
        offset = total - sum(self._increments)
        if offset > 0:
            self._increments.append(offset)

    @property
    def nb_tasks(self):
        """Number of tasks the classes were grouped into."""
        return len(self._increments)

    def get_task_size(self, task):
        """Return the number of classes in task ``task``."""
        return self._increments[task]

    def get_total_classnum(self):
        """Return the total number of classes."""
        return len(self._class_order)

    def get_class_order(self):
        """Return the class order currently in use."""
        return self._class_order

    def get_dataset(
            self, indices, source, mode, appendent=None, ret_data=False, m_rate=None
    ):
        """Build a dataset holding the samples of the requested classes.

        Args:
            indices: Iterable of (remapped) class labels to include.
            source: ``"train"`` or ``"test"``, selecting the data pool.
            mode: ``"train"``, ``"test"`` or ``"flip"`` (test transforms
                plus an always-applied horizontal flip).
            appendent: Optional ``(data, targets)`` pair appended after
                the selected classes.
            ret_data: When true, also return the raw arrays.
            m_rate: When not ``None``, samples are chosen with
                ``_select_rmm`` instead of ``_select``.

        Returns:
            ``(dataset, indices_record)``, or
            ``(data, targets, dataset, indices_record)`` when ``ret_data``
            is true. ``indices_record`` holds the positions within the
            source pool of the class-selected samples only; it has no
            entries for ``appendent``.

        Raises:
            ValueError: For an unknown ``source`` or ``mode``, or (from
                ``np.concatenate``) when nothing at all was selected.
        """
        if source == "train":
            x, y = self._train_data, self._train_targets
        elif source == "test":
            x, y = self._test_data, self._test_targets
        else:
            raise ValueError("Unknown data source {}.".format(source))

        if mode == "train":
            trsf = transforms.Compose([*self._train_trsf, *self._common_trsf])
        elif mode == "flip":
            trsf = transforms.Compose(
                [*self._test_trsf, transforms.RandomHorizontalFlip(p=1.0), *self._common_trsf]
            )
        elif mode == "test":
            trsf = transforms.Compose([*self._test_trsf, *self._common_trsf])
        else:
            raise ValueError("Unknown mode {}.".format(mode))

        data, targets, indices_record = [], [], []

        for idx in indices:
            if m_rate is None:
                class_data, class_targets, class_indices = self._select(
                    x, y, low_range=idx, high_range=idx + 1
                )
            else:
                class_data, class_targets, class_indices = self._select_rmm(
                    x, y, low_range=idx, high_range=idx + 1, m_rate=m_rate
                )

            data.append(class_data)
            targets.append(class_targets)
            indices_record.append(class_indices)

        if appendent is not None and len(appendent) != 0:
            appendent_data, appendent_targets = appendent
            data.append(appendent_data)
            targets.append(appendent_targets)
            # Optional: record the original indices of the appended samples.

        data = np.concatenate(data)
        targets = np.concatenate(targets)
        # With no requested classes (appendent only) there is nothing to
        # concatenate; return an empty index array instead of crashing.
        if indices_record:
            indices_record = np.concatenate(indices_record)
        else:
            indices_record = np.array([], dtype=np.int64)

        if ret_data:
            return data, targets, DummyDataset(data, targets, trsf, self.use_path), indices_record
        else:
            return DummyDataset(data, targets, trsf, self.use_path), indices_record

    def get_dataset_with_split(
            self, indices, source, mode, appendent=None, val_samples_per_class=0
    ):
        """Build train and validation datasets for the requested classes.

        For every class, ``val_samples_per_class`` samples are drawn at
        random (without replacement) for validation and the remaining
        samples go to training. When ``appendent`` is given, the same
        split is applied to each of its classes from ``0`` up to its
        largest label.

        Args:
            indices: Iterable of (remapped) class labels to include.
            source: ``"train"`` or ``"test"``, selecting the data pool.
            mode: ``"train"`` or ``"test"``, selecting the transforms
                used by both returned datasets.
            appendent: Optional ``(data, targets)`` pair.
            val_samples_per_class: Validation samples held out per class.

        Returns:
            ``(train_dataset, val_dataset)``.

        Raises:
            ValueError: For an unknown ``source`` or ``mode``.
        """
        if source == "train":
            x, y = self._train_data, self._train_targets
        elif source == "test":
            x, y = self._test_data, self._test_targets
        else:
            raise ValueError("Unknown data source {}.".format(source))

        if mode == "train":
            trsf = transforms.Compose([*self._train_trsf, *self._common_trsf])
        elif mode == "test":
            trsf = transforms.Compose([*self._test_trsf, *self._common_trsf])
        else:
            raise ValueError("Unknown mode {}.".format(mode))

        train_data, train_targets = [], []
        val_data, val_targets = [], []

        def collect(pool_x, pool_y, cls):
            # ``_select`` returns three values; the positions are not
            # needed here. Unpacking only two used to raise on every call.
            class_data, class_targets, _ = self._select(
                pool_x, pool_y, low_range=cls, high_range=cls + 1
            )
            tr_x, tr_y, va_x, va_y = self._split_train_val(
                class_data, class_targets, val_samples_per_class
            )
            train_data.append(tr_x)
            train_targets.append(tr_y)
            val_data.append(va_x)
            val_targets.append(va_y)

        for idx in indices:
            collect(x, y, idx)

        if appendent is not None:
            appendent_data, appendent_targets = appendent
            for idx in range(0, int(np.max(appendent_targets)) + 1):
                collect(appendent_data, appendent_targets, idx)

        train_data = np.concatenate(train_data)
        train_targets = np.concatenate(train_targets)
        val_data = np.concatenate(val_data)
        val_targets = np.concatenate(val_targets)

        return DummyDataset(
            train_data, train_targets, trsf, self.use_path
        ), DummyDataset(val_data, val_targets, trsf, self.use_path)

    def _split_train_val(self, class_data, class_targets, val_samples_per_class):
        """Randomly hold out ``val_samples_per_class`` samples of one class.

        Returns ``(train_data, train_targets, val_data, val_targets)``.
        The training part keeps the original sample order.
        """
        val_indx = np.random.choice(
            len(class_data), val_samples_per_class, replace=False
        )
        train_indx = np.setdiff1d(np.arange(len(class_data)), val_indx)
        return (
            class_data[train_indx],
            class_targets[train_indx],
            class_data[val_indx],
            class_targets[val_indx],
        )

    def set_class_order(self, order):
        """Replace the stored class order (labels are not remapped again)."""
        self._class_order = order

    def _setup_data(self, dataset_name, shuffle, seed):
        """Load data and transforms, choose the class order, remap labels."""
        idata = _get_idata(dataset_name, self.args)
        idata.download_data()

        # Data
        self._train_data, self._train_targets = idata.train_data, idata.train_targets
        self._test_data, self._test_targets = idata.test_data, idata.test_targets
        self.use_path = idata.use_path

        # Transforms
        self._train_trsf = idata.get_train_trsf()
        self._test_trsf = idata.get_test_trsf()
        self._common_trsf = idata.get_common_trsf()

        # Order
        if shuffle == 1:
            n_classes = len(np.unique(self._train_targets))
            np.random.seed(seed)
            order = np.random.permutation(n_classes).tolist()
        else:
            order = idata.get_class_order()
        self._class_order = order

        # Map indices
        self._train_targets = _map_new_class_index(
            self._train_targets, self._class_order
        )
        self._test_targets = _map_new_class_index(self._test_targets, self._class_order)

    def _select(self, x, y, low_range, high_range):
        """Return the samples whose label lies in ``[low_range, high_range)``.

        Returns ``(data, targets, positions)`` where ``positions`` are the
        positions of the selected samples within ``x`` / ``y``.
        """
        mask = (y >= low_range) & (y < high_range)
        selected_indices = np.where(mask)[0]
        return x[mask], y[mask], selected_indices

    def _select_rmm(self, x, y, low_range, high_range, m_rate):
        """Like ``_select`` but keep only a random ``1 - m_rate`` fraction.

        With ``m_rate == 0`` every matching sample is kept. Otherwise
        ``int((1 - m_rate) * n)`` positions are drawn independently with
        ``np.random.randint``, so the same sample may be picked more than
        once. The returned positions are sorted.
        """
        assert m_rate is not None
        idxes = np.where(np.logical_and(y >= low_range, y < high_range))[0]

        # ``randint(0, 0)`` raises, so an empty class is returned as is.
        if m_rate != 0 and len(idxes) > 0:
            selected_idxes = np.random.randint(
                0, len(idxes), size=int((1 - m_rate) * len(idxes))
            )
            new_idxes = idxes[selected_idxes]
        else:
            new_idxes = idxes

        new_idxes = np.sort(new_idxes)
        return x[new_idxes], y[new_idxes], new_idxes

    def getlen(self, index):
        """Return how many training samples carry the label ``index``."""
        y = self._train_targets
        # Count the matches; summing ``np.where`` output added up sample
        # positions instead.
        return int(np.sum(y == index))


class DummyDataset(Dataset):
    """Dataset over parallel ``images`` / ``labels`` containers.

    Each item is returned as ``(idx, transformed_image, label)``. When
    ``use_path`` is true the entries of ``images`` are passed to
    ``pil_loader``; otherwise they are converted with
    ``Image.fromarray``.
    """

    def __init__(self, images, labels, trsf, use_path=False):
        assert len(images) == len(labels), "Data size error!"
        self.images, self.labels = images, labels
        self.trsf = trsf
        self.use_path = use_path

    def __len__(self):
        return len(self.images)

    def __getitem__(self, idx):
        raw = self.images[idx]
        # Obtain a PIL image either from disk or from the in-memory array.
        pil_image = pil_loader(raw) if self.use_path else Image.fromarray(raw)
        image = self.trsf(pil_image)
        return idx, image, self.labels[idx]


def _map_new_class_index(y, order):
    return np.array(list(map(lambda x: order.index(x), y)))


def _get_idata(dataset_name, args):
    name = dataset_name.lower()
    if name == "cifar10":
        return iCIFAR10(args)
    elif name == "cifar100":
        return iCIFAR100(args)
    elif name == "imagenet":
        return iImageNet1000(args)
    elif name == "imagenet100":
        return iImageNet100(args)
    elif name == "tiny_imagenet":
        return TinyImageNet200(args)
    else:
        raise NotImplementedError("Unknown dataset {}.".format(dataset_name))


def pil_loader(path):
    """
    Open the image file at ``path`` and return it converted to RGB.

    Ref:
    https://pytorch.org/docs/stable/_modules/torchvision/datasets/folder.html#ImageFolder
    """
    # Going through an explicit file handle avoids a ResourceWarning
    # (https://github.com/python-pillow/Pillow/issues/835).
    with open(path, "rb") as handle:
        return Image.open(handle).convert("RGB")

# def accimage_loader(path):
#     """
#     Ref:
#     https://pytorch.org/docs/stable/_modules/torchvision/datasets/folder.html#ImageFolder
#     accimage is an accelerated Image loader and preprocessor leveraging Intel IPP.
#     accimage is available on conda-forge.
#     """
#     import accimage

#     try:
#         return accimage.Image(path)
#     except IOError:
#         # Potentially a decoding problem, fall back to PIL.Image
#         return pil_loader(path)


# def default_loader(path):
#     """
#     Ref:
#     https://pytorch.org/docs/stable/_modules/torchvision/datasets/folder.html#ImageFolder
#     """
#     from torchvision import get_image_backend

#     if get_image_backend() == "accimage":
#         return accimage_loader(path)
#     else:
#         return pil_loader(path)
