import torch
import numpy as np

def keep_top_k(p,k,n_classes=1000):
    if k == n_classes:
        return p

    values, indices = p.topk(k, dim=1)

    mask_topk = torch.zeros_like(p)
    mask_topk.scatter_(-1, indices, 1.0)
    top_p = mask_topk * p

    minor_value = (1 - torch.sum(values, dim=1)) / (n_classes-k)
    minor_value = minor_value.unsqueeze(1).expand(p.shape)
    mask_smooth = torch.ones_like(p)
    mask_smooth.scatter_(-1, indices, 0)
    smooth_p = mask_smooth * minor_value

    topk_smooth_p = top_p + smooth_p
    assert np.isclose(topk_smooth_p.sum().item(), p.shape[0]), f'{topk_smooth_p.sum().item()} not close to {p.shape[0]}'
    return topk_smooth_p


class AverageMeter(object):
    def __init__(self):
        self.reset()

    def reset(self):
        self.avg = 0
        self.sum = 0
        self.cnt = 0
        self.val = 0

    def update(self, val, n=1):
        self.val = val
        self.sum += val * n
        self.cnt += n
        self.avg = self.sum / self.cnt


def accuracy(output, target, topk=(1,)):
    maxk = max(topk)
    batch_size = target.size(0)

    _, pred = output.topk(maxk, 1, True, True)
    pred = pred.t()
    correct = pred.eq(target.reshape(1, -1).expand_as(pred))

    res = []
    for k in topk:
        correct_k = correct[:k].reshape(-1).float().sum(0)
        res.append(correct_k.mul_(100.0 / batch_size))
    return res


def get_parameters(model):
    group_no_weight_decay = []
    group_weight_decay = []
    for pname, p in model.named_parameters():
        if pname.find('weight') >= 0 and len(p.size()) > 1:
            group_weight_decay.append(p)
        else:
            group_no_weight_decay.append(p)
    assert len(list(model.parameters())) == len(
        group_weight_decay) + len(group_no_weight_decay)
    groups = [dict(params=group_weight_decay), dict(
        params=group_no_weight_decay, weight_decay=0.)]
    return groups


import os
import torch,random
import torch.distributed
import torchvision
from torchvision.transforms import functional as t_F
import numpy as np


class RandomResizedCropWithCoords(torchvision.transforms.RandomResizedCrop):
    def __init__(self, **kwargs):
        super(RandomResizedCropWithCoords, self).__init__(**kwargs)

    def __call__(self, img, coords):
        try:
            reference = (coords.any())
        except:
            reference = False
        if not reference:
            i, j, h, w = self.get_params(img, self.scale, self.ratio)
            coords = (i / img.shape[2],
                      j / img.shape[1],
                      h / img.shape[2],
                      w / img.shape[1])
            coords = torch.FloatTensor(coords)
        else:
            i = round(coords[0].item() * img.shape[2])
            j = round(coords[1].item() * img.shape[1])
            h = round(coords[2].item() * img.shape[2])
            w = round(coords[3].item() * img.shape[1])
        return t_F.resized_crop(img, i, j, h, w, self.size,
                                self.interpolation,antialias=True), coords

class ShufflePatchesWithIndex(torch.nn.Module):
    def shuffle_weight(self, img, factor,indices=None):
        h, w = img.shape[1:]
        th, tw = h // factor, w // factor
        patches = []
        for i in range(factor):
            i = i * tw
            if i != factor - 1:
                patches.append(img[..., i : i + tw])
            else:
                patches.append(img[..., i:])
        if indices is None:
            indices = np.random.choice(list(range(len(patches))),len(patches),replace=False)
        new_patches = []
        for indice in indices:
            new_patches.append(patches[indice])
        img = torch.cat(patches, -1)
        return img, indices

    def __init__(self, factor):
        super().__init__()
        self.factor = factor

    def forward(self, img, indices):
        try:
            reference = (indices.any())
        except:
            reference = False
        if not reference:
            img,indices1 = self.shuffle_weight(img, self.factor)
            img = img.permute(0, 2, 1)
            img,indices2 = self.shuffle_weight(img, self.factor)
            img = img.permute(0, 2, 1)
            indices = torch.stack([torch.LongTensor(indices1),torch.LongTensor(indices2)],0)
            return img, indices
        else:
            img,indices1 = self.shuffle_weight(img, self.factor, indices[0].cpu().tolist())
            img = img.permute(0, 2, 1)
            img,indices2 = self.shuffle_weight(img, self.factor, indices[1].cpu().tolist())
            img = img.permute(0, 2, 1)
            return img, indices

class ComposeWithCoords(torchvision.transforms.Compose):
    def __init__(self, ap_shuffle=True,**kwargs):
        super(ComposeWithCoords, self).__init__(**kwargs)
        self.ap_shuffle = ap_shuffle

    def __call__(self, img, coords, status, indices):
        for t in self.transforms:
            if type(t).__name__ == 'RandomResizedCropWithCoords':
                img, coords = t(img, coords)
            elif type(t).__name__ == 'RandomCropWithCoords':
                img, coords = t(img, coords)
            elif type(t).__name__ == 'RandomHorizontalFlipWithRes':
                img, status = t(img, status)
            elif type(t).__name__ == 'ShufflePatchesWithIndex':
                if self.ap_shuffle:
                    img, indices = t(img, indices)
                if indices is None:
                    indices = torch.zeros(2,2).int()
            else:
                img = t(img)
        return img, status, coords, indices


class RandomHorizontalFlipWithRes(torch.nn.Module):
    def __init__(self, p=0.5):
        super().__init__()
        self.p = p

    def forward(self, img, status):
        if status is not None:
            if status == True:
                return t_F.hflip(img), status
            else:
                return img, status
        else:
            status = False
            if torch.rand(1) < self.p:
                status = True
                return t_F.hflip(img), status
            return img, status

    def __repr__(self):
        return self.__class__.__name__ + '(p={})'.format(self.p)


def get_FKD_info(fkd_path):
    def custom_sort_key(s):
      
        numeric_part = int(s.split('_')[1].split('.tar')[0])
        return numeric_part

    max_epoch = len(os.listdir(fkd_path))
    batch_list = sorted(os.listdir(os.path.join(
        fkd_path, 'epoch_0')), key=custom_sort_key)
    batch_size = torch.load(os.path.join(
        fkd_path, 'epoch_0', batch_list[0]))[1].size()[0]
    last_batch_size = torch.load(os.path.join(
        fkd_path, 'epoch_0', batch_list[-1]))[1].size()[0]
    num_img = batch_size * (len(batch_list) - 1) + last_batch_size

    print('======= FKD: dataset info ======')
    print('path: {}'.format(fkd_path))
    print('num img: {}'.format(num_img))
    print('batch size: {}'.format(batch_size))
    print('max epoch: {}'.format(max_epoch))
    print('================================')
    return max_epoch, batch_size, num_img


class ImageFolder_FKD_MIX(torchvision.datasets.ImageFolder):
    def __init__(self, fkd_path, mode, args_epoch=None, args_bs=None, seed=42, **kwargs):
        self.fkd_path = fkd_path
        self.mode = mode
        super(ImageFolder_FKD_MIX, self).__init__(**kwargs)
        self.batch_config = None  
        self.batch_config_idx = 0  
        self.config_list = None
        if self.mode == 'fkd_load':
            max_epoch, batch_size, num_img = get_FKD_info(self.fkd_path)
            if args_epoch > max_epoch:
                raise ValueError(f'`--epochs` should be no more than max epoch.')
            if args_bs != batch_size:
                raise ValueError(
                    '`--batch-size` should be same in both saving and loading phase. Please use `--gradient-accumulation-steps` to control batch size in model forward phase.')
            self.epoch = None
            self.batch_size = batch_size

    def __getitem__(self, index):
        if self.mode == 'fkd_save':
            path, target = self.samples[index]
            coords_ = None
            flip_ = None
            indices_ = None
        elif self.mode == 'fkd_load':
            if self.config_list is None:
                self.load_epoch_config()
            else:
                pass
            batch_config = self.config_list[int(index // self.batch_size)]
            batch_config_idx = int(index % self.batch_size)

            coords_ = batch_config[0][batch_config_idx]
            flip_ = batch_config[1][batch_config_idx]
            mix_index = batch_config[2][batch_config_idx]
            mix_lam = batch_config[3]
            min_bbox = batch_config[4]
            soft_label = batch_config[5][batch_config_idx]
            new_index = batch_config[6][batch_config_idx]
            indices_ = batch_config[7][batch_config_idx]
            path, target = self.samples[new_index]
        else:
            raise ValueError('mode should be fkd_save or fkd_load')

        sample = self.loader(path)

        if self.transform is not None:
            sample_new, flip_status, coords_status, indices_status = self.transform(sample, coords_, flip_, indices_)
        else:
            sample_new = sample
            flip_status = None
            coords_status = None
            indices_status = None

        if self.target_transform is not None:
            target = self.target_transform(target)

        if self.mode == "fkd_save":
            return sample_new, target, flip_status, coords_status, indices_status, index
        elif self.mode == "fkd_load":
            return sample_new, target, flip_status, coords_status, indices_status, mix_index, mix_lam, min_bbox, soft_label
        else:
            raise ValueError('mode should be fkd_save or fkd_load')

    def load_epoch_config(self):
        import glob
        batch_config_path = os.path.join(self.fkd_path, 'epoch_{}'.format(self.epoch), 'batch_*.tar')
        def sort_key(_filename):
            return int(_filename.split("batch_")[1].split(".")[0])
        filename_list = sorted(glob.glob(batch_config_path),key=sort_key)
        config_list = []
        for filename in filename_list:
            config = torch.load(filename)
            config_list.append(config)
        self.config_list = config_list

    def set_epoch(self, epoch):
        self.epoch = epoch
        self.load_epoch_config()

    
class ImageFolder_FKD_MIX_CL(ImageFolder_FKD_MIX):
    def __init__(self,class_number=1000,*args,**kwargs):
        super(ImageFolder_FKD_MIX_CL, self).__init__(*args,**kwargs)
        self.class_number=class_number
        self.label2img = [[] for _ in range(len(self.classes))]
        for k, v in self.samples:
            self.label2img[v].append(k)
        new_samples = []
        for i in range(class_number):
            for j in self.label2img[i]:
                new_samples.append((j,i))
        self.samples = new_samples
        self.imgs = self.samples

def rand_bbox(size, lam):
    W = size[2]
    H = size[3]
    cut_rat = np.sqrt(1. - lam)
    cut_w = int(W * cut_rat)
    cut_h = int(H * cut_rat)

    cx = np.random.randint(W)
    cy = np.random.randint(H)

    bbx1 = np.clip(cx - cut_w // 2, 0, W)
    bby1 = np.clip(cy - cut_h // 2, 0, H)
    bbx2 = np.clip(cx + cut_w // 2, 0, W)
    bby2 = np.clip(cy + cut_h // 2, 0, H)

    return bbx1, bby1, bbx2, bby2


def cutmix(images, args, rand_index=None, lam=None, bbox=None):
    if args.mode == 'fkd_save':
        rand_index = torch.randperm(images.size()[0]).cuda()
        lam = np.random.beta(args.cutmix, args.cutmix)
        bbx1, bby1, bbx2, bby2 = rand_bbox(images.size(), lam)
    elif args.mode == 'fkd_load':
        assert rand_index is not None and lam is not None and bbox is not None
        rand_index = rand_index.cuda()
        lam = lam
        bbx1, bby1, bbx2, bby2 = bbox
    else:
        raise ValueError('mode should be fkd_save or fkd_load')

    images[:, :, bbx1:bbx2, bby1:bby2] = images[rand_index, :, bbx1:bbx2, bby1:bby2]
    return images, rand_index.cpu(), lam, [bbx1, bby1, bbx2, bby2]


def mixup(images, args, rand_index=None, lam=None):
    if args.mode == 'fkd_save':
        rand_index = torch.randperm(images.size()[0]).cuda()
        lam = np.random.beta(args.mixup, args.mixup)
    elif args.mode == 'fkd_load':
        assert rand_index is not None and lam is not None
        rand_index = rand_index.cuda()
        lam = lam
    else:
        raise ValueError('mode should be fkd_save or fkd_load')

    mixed_images = lam * images + (1 - lam) * images[rand_index]
    return mixed_images, rand_index.cpu(), lam, None


def mix_aug(images, args, rand_index=None, lam=None, bbox=None):
    if args.mix_type == 'mixup':
        return mixup(images, args, rand_index, lam)
    elif args.mix_type == 'cutmix':
        return cutmix(images, args, rand_index, lam, bbox)
    else:
        return images, None, None, None


def get_img2batch_idx_list(num_img=50000, batch_size=1024, seed=42, epochs=300):
    train_dataset = torch.utils.data.TensorDataset(torch.arange(num_img))
    generator = torch.Generator()
    generator.manual_seed(seed)
    sampler = torch.utils.data.RandomSampler(train_dataset, generator=generator)
    batch_sampler = torch.utils.data.BatchSampler(sampler, batch_size=batch_size, drop_last=False)

    img2batch_idx_list = []
    for epoch in range(epochs):
        img2batch_idx = {}
        for batch_idx, img_indices in enumerate(batch_sampler):
            for img_indice in img_indices:
                img2batch_idx[img_indice] = batch_idx
        img2batch_idx_list.append(img2batch_idx)
    return img2batch_idx_list


