import torch
from torch import nn
from plot_samples import plot_samples
import torchvision.transforms as transforms
import torchvision
import numpy as np
import os

def _find_latest_checkpoint(checkpoint_dir, image_size):
    """Return ``(epoch, filename)`` of the newest generator checkpoint for *image_size*.

    Returns ``(0, None)`` when no matching checkpoint exists.
    """
    # The trailing underscore keeps e.g. size 4 from matching "generator_step_40_...".
    prefix = f'generator_step_{image_size}_'
    best_epoch, best_name = 0, None
    for name in os.listdir(checkpoint_dir):
        if not name.startswith(prefix):
            continue
        epoch_text = name[len(prefix):]
        if not epoch_text.isdigit():
            continue
        epoch = int(epoch_text)
        # os.listdir order is arbitrary, so pick the highest epoch explicitly.
        if best_name is None or epoch > best_epoch:
            best_epoch, best_name = epoch, name
    return best_epoch, best_name


def _drop_classes(dataset, forbidden):
    """Remove, in place, every sample of *dataset* whose label is in *forbidden*."""
    # torchvision CIFAR datasets expose either data/targets (newer releases)
    # or train_data/train_labels (older releases); support both layouts.
    if hasattr(dataset, 'targets'):
        data_attr, label_attr = 'data', 'targets'
    else:
        data_attr, label_attr = 'train_data', 'train_labels'
    labels = getattr(dataset, label_attr)
    keep = [i for i, label in enumerate(labels) if label not in forbidden]
    setattr(dataset, data_attr, getattr(dataset, data_attr)[keep])
    setattr(dataset, label_attr, [labels[i] for i in keep])


def _sample_latent(batch_size, device, latent_dim=256):
    """Draw a ``(batch_size, latent_dim)`` latent batch, uniform in [-5, 5)."""
    return torch.Tensor(
        np.random.uniform(-5., 5., size=(batch_size, latent_dim))
    ).to(device)


def step(
    image_size, n_epochs, test_noise,
    generator, inference_generator, discriminator, accumulate,
    generator_function, inference_generator_function, discriminator_function,
    generator_optimizer, discriminator_optimizer,
    dataroot, device
):
    """Train generator and discriminator at one image resolution on CIFAR-100.

    Resumes from the newest ``./checkpoints/generator_step_{image_size}_{epoch}``
    file (and its discriminator counterpart) when one exists, then trains for
    epochs ``start_epoch + 1 .. n_epochs - 1`` with a Wasserstein loss plus a
    gradient penalty and a small drift term. After every epoch it plots samples
    from the inference generator and rewrites the checkpoint pair.

    Args:
        image_size: Target resolution passed to ``Resize``; also used in
            checkpoint and plot names.
        n_epochs: Exclusive upper bound of the epoch counter.
        test_noise: Fixed input given to ``inference_generator_function`` for
            the per-epoch sample plot.
        generator, discriminator: Modules whose gradients are zeroed and whose
            state dicts are loaded/saved.
        inference_generator: Passed to ``accumulate`` together with
            ``generator`` after each generator update (presumably a running
            average of the generator weights -- confirm against ``accumulate``).
        accumulate: Callable invoked as ``accumulate(inference_generator, generator)``.
        generator_function, inference_generator_function, discriminator_function:
            Callables used for the forward passes.
        generator_optimizer, discriminator_optimizer: Optimizers stepped after
            the respective backward pass. Their state is not checkpointed.
        dataroot: Unused; the dataset root is hard-coded below.
        device: Device the batches and latent noise are moved to.

    Returns:
        Tuple ``(generator, inference_generator, discriminator,
        generator_optimizer, discriminator_optimizer)``.
    """
    checkpoint_dir = './checkpoints/'
    batch_size = 256
    gamma = 750.            # target gradient norm for the penalty
    penalty_weight = 10.
    drift_weight = .005

    # Create the directory up front so both the resume scan and torch.save work
    # on a fresh run.
    os.makedirs(checkpoint_dir, exist_ok=True)
    start_epoch, generator_ckpt = _find_latest_checkpoint(checkpoint_dir, image_size)
    if generator_ckpt is not None:
        discriminator_ckpt = generator_ckpt.replace('generator', 'discriminator')
        # Load onto CPU first; load_state_dict copies into the modules' own
        # device, so this also works when the saving device is unavailable.
        generator.load_state_dict(
            torch.load(checkpoint_dir + generator_ckpt, map_location='cpu')
        )
        discriminator.load_state_dict(
            torch.load(checkpoint_dir + discriminator_ckpt, map_location='cpu')
        )
    print(f'Step for image size {image_size}')

    dataset = torchvision.datasets.CIFAR100(
        root='../../../datasets',
        train=True,
        download=True,
        transform=torchvision.transforms.Compose([
            torchvision.transforms.Resize(image_size),
            torchvision.transforms.ToTensor(),
            # One mean/std per RGB channel: NOTE(review) older torchvision
            # releases reportedly pair mean/std with channels one-to-one, so
            # a single-element list would normalise only the first channel.
            torchvision.transforms.Normalize([.5, .5, .5], [.5, .5, .5]),
        ]),
    )
    # Train without the last ten classes (labels 90..99).
    _drop_classes(dataset, set(range(90, 100)))

    # The loader is epoch-invariant; each pass over it reshuffles.
    dataloader = torch.utils.data.DataLoader(
        dataset,
        batch_size=batch_size,
        shuffle=True,
        num_workers=2,
        drop_last=True,
    )

    for epoch in range(start_epoch + 1, n_epochs):
        if epoch % 50 == 0:
            print(f'Epoch: {epoch}/{n_epochs}')
        for real_samples, _ in dataloader:
            real_samples = real_samples.to(device)
            n_samples = real_samples.shape[0]

            # ---- discriminator update ----
            generator.zero_grad()
            discriminator.zero_grad()

            real_scores = discriminator_function(real_samples)
            # Detach: the discriminator step must not backpropagate into the
            # generator (its gradients would be discarded anyway).
            fake_samples = generator_function(
                _sample_latent(n_samples, device)
            ).detach()
            fake_scores = discriminator_function(fake_samples)

            # Random point on the line between real and generated samples.
            alpha = torch.Tensor(np.random.uniform(size=(1,))).to(device)
            x_hat = (
                alpha * real_samples + (1. - alpha) * fake_samples
            ).requires_grad_(True)
            # sum (not mean) so each sample's input gradient is unscaled by the
            # batch size; create_graph=True so the penalty itself can be
            # differentiated with respect to the discriminator parameters.
            gradient = torch.autograd.grad(
                outputs=torch.sum(discriminator_function(x_hat)),
                inputs=x_hat,
                create_graph=True,
            )[0]
            gradient_norm = torch.sqrt(
                torch.sum(torch.pow(gradient, 2), dim=[1, 2, 3])
            )
            penalty = torch.pow(gradient_norm - gamma, 2) / gamma / gamma

            # Means are taken per term so differently shaped score and penalty
            # tensors never broadcast against each other.
            discriminator_loss = (
                torch.mean(fake_scores) - torch.mean(real_scores)
                + penalty_weight * torch.mean(penalty)
                + drift_weight * torch.mean(torch.pow(fake_scores, 2))
                + drift_weight * torch.mean(torch.pow(real_scores, 2))
            )
            discriminator_loss.backward()
            discriminator_optimizer.step()

            # ---- generator update ----
            generator.zero_grad()
            discriminator.zero_grad()
            fake_samples = generator_function(_sample_latent(n_samples, device))
            generator_loss = torch.mean(-1. * discriminator_function(fake_samples))
            generator_loss.backward()
            generator_optimizer.step()

            accumulate(inference_generator, generator)

        with torch.no_grad():
            generated_samples = inference_generator_function(test_noise)
            plot_samples(generated_samples, save=f'{image_size}_{100 + epoch}')
        torch.save(
            generator.state_dict(),
            f'./checkpoints/generator_step_{image_size}_{epoch}'
        )
        torch.save(
            discriminator.state_dict(),
            f'./checkpoints/discriminator_step_{image_size}_{epoch}'
        )
        # Keep only the newest checkpoint pair.
        if epoch >= 2:
            os.unlink(f'./checkpoints/generator_step_{image_size}_{epoch-1}')
            os.unlink(f'./checkpoints/discriminator_step_{image_size}_{epoch-1}')

    return generator, inference_generator, discriminator, generator_optimizer, discriminator_optimizer

