import scipy.io
import random
import hydra
from omegaconf import DictConfig, OmegaConf
import signatory
import os
import os.path as osp
import sys
current_directory = os.path.dirname(os.path.abspath(__file__))
sys.path.append(osp.join(current_directory, "..",".."))
from model.NRDE.NRDE import *
from model.utilities import *
import warnings
warnings.filterwarnings('ignore')

device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')

def train(config):

    os.makedirs(config.save_dir, exist_ok=True)
    checkpoint_file = config.save_dir + config.checkpoint_file

    # Load data
    data = scipy.io.loadmat(config.data_path)
    W, Sol = data['W'], data['sol']
    print('W shape:', W.shape)
    print('Sol shape:', Sol.shape)

    xi = torch.from_numpy(W.astype(np.float32))
    data = torch.from_numpy(Sol.astype(np.float32))

    ntrain, nval, ntest = config.ntrain, config.nval, config.ntest

    train_loader, test_loader, I, noise_dim, norm = dataloader_nrde_1d(u=data, xi=xi,
                                                                       ntrain=ntrain,
                                                                       ntest=ntest,
                                                                       T=config.T,
                                                                       sub_t=config.sub_t,
                                                                       batch_size=config.batch_size,
                                                                       dim_x=config.dim_x,
                                                                       depth=config.depth,
                                                                       window_length=config.window_length,
                                                                       normalizer=config.normalizer,
                                                                       interpolation=config.interpolation)

    _, val_loader, _, _, _ = dataloader_nrde_1d(u=data[:ntrain + nval],
                                                xi=xi[:ntrain + nval],
                                                ntrain=ntrain, ntest=nval,
                                                T=config.T,
                                                sub_t=config.sub_t,
                                                batch_size=config.batch_size,
                                                dim_x=config.dim_x,
                                                depth=config.depth,
                                                window_length=config.window_length,
                                                normalizer=config.normalizer,
                                                interpolation=config.interpolation)

    model = NeuralRDE(control_channels=noise_dim,
                      input_channels=config.dim_x,
                      hidden_channels=config.hidden_channels,
                      output_channels=config.dim_x,
                      interval=I,
                      interpolation=config.interpolation,
                      solver=config.solver).cuda()

    print('The model has {} parameters'.format(count_params(model)))

    loss = LpLoss(size_average=False)

    _, _, _ = train_nrde_1d(model, train_loader, val_loader, norm, device, loss,
                               batch_size=config.batch_size,
                               epochs=config.epochs,
                               learning_rate=config.learning_rate,
                               plateau_patience=config.plateau_patience,
                               plateau_terminate=config.plateau_terminate,
                               delta=config.delta,
                               print_every=config.print_every,
                               checkpoint_file=checkpoint_file)

    model.load_state_dict(torch.load(checkpoint_file))
    loss_train = eval_nrde_1d(model, train_loader, loss, config.batch_size, device, norm)
    loss_val = eval_nrde_1d(model, val_loader, loss, config.batch_size, device, norm)
    loss_test = eval_nrde_1d(model, test_loader, loss, config.batch_size, device, norm)
    print('loss_train (model saved in checkpoint):', loss_train)
    print('loss_val (model saved in checkpoint):', loss_val)
    print('loss_test (model saved in checkpoint):', loss_test)


def hyperparameter_search(config):
    os.makedirs(config.save_dir, exist_ok=True)
    checkpoint_file = config.save_dir + config.checkpoint_file
    tmp_checkpoint_file = config.save_dir + 'tmp_checkpoint.pth'

    # Load data
    data = scipy.io.loadmat(config.data_path)
    W, Sol = data['W'], data['sol']
    xi = torch.from_numpy(W.astype(np.float32))
    data = torch.from_numpy(Sol.astype(np.float32))

    ntrain, nval, ntest = config.ntrain, config.nval, config.ntest

    train_loader, test_loader, I, noise_dim, norm = dataloader_nrde_1d(u=data, xi=xi,
                                                                       ntrain=ntrain,
                                                                       ntest=ntest,
                                                                       T=config.T,
                                                                       sub_t=config.sub_t,
                                                                       batch_size=config.batch_size,
                                                                       dim_x=config.dim_x,
                                                                       depth=config.depth,
                                                                       window_length=config.window_length,
                                                                       normalizer=config.normalizer,
                                                                       interpolation=config.interpolation)

    _, val_loader, _, _, _ = dataloader_nrde_1d(u=data[:ntrain + nval],
                                                xi=xi[:ntrain + nval],
                                                ntrain=ntrain, ntest=nval,
                                                T=config.T,
                                                sub_t=config.sub_t,
                                                batch_size=config.batch_size,
                                                dim_x=config.dim_x,
                                                depth=config.depth,
                                                window_length=config.window_length,
                                                normalizer=config.normalizer,
                                                interpolation=config.interpolation)

    hyperparams = list(itertools.product(config.hidden_channels, config.solver))

    loss = LpLoss(size_average=False)

    fieldnames = ['hidden_channels', 'solver', 'nb_params', 'loss_train', 'loss_val', 'loss_test']
    log_file = config.save_dir + config.log_file
    with open(log_file, 'w', encoding='UTF8', newline='') as f:
        writer = csv.writer(f)
        writer.writerow(fieldnames)

    best_loss_val = 1000.

    for (_hidden_channels, _solver) in hyperparams:

        print('\n hidden_channels:{}, solver:{}'.format(_hidden_channels, _solver))

        model = NeuralRDE(control_channels=noise_dim,
                          input_channels=config.dim_x,
                          hidden_channels=_hidden_channels,
                          output_channels=config.dim_x,
                          interval=I,
                          interpolation=config.interpolation,
                          solver=_solver).cuda()
        nb_params = count_params(model)
        print('\n The model has {} parameters'.format(nb_params))

        # Train the model. The best model is checkpointed.
        _, _, _ = train_nrde_1d(model, train_loader, val_loader, norm, device, loss,
                                batch_size=config.batch_size,
                                epochs=config.epochs,
                                learning_rate=config.learning_rate,
                                plateau_patience=config.plateau_patience,
                                plateau_terminate=config.plateau_terminate,
                                delta=config.delta,
                                print_every=config.print_every,
                                checkpoint_file=tmp_checkpoint_file)
        # load the best trained model
        model.load_state_dict(torch.load(tmp_checkpoint_file))
        loss_train = eval_nrde_1d(model, train_loader, loss, config.batch_size, device, norm)
        loss_val = eval_nrde_1d(model, val_loader, loss, config.batch_size, device, norm)
        loss_test = eval_nrde_1d(model, test_loader, loss, config.batch_size, device, norm)
        print('loss_train (model saved in tmp_checkpoint):', loss_train)
        print('loss_val (model saved in tmp_checkpoint):', loss_val)
        print('loss_test (model saved in tmp_checkpoint):', loss_test)

        # if this configuration of hyperparameters is the best so far (determined wihtout using the test set), save it
        if loss_val < best_loss_val:
            torch.save(model.state_dict(), checkpoint_file)
            best_loss_val = loss_val

        # write results
        with open(log_file, 'a', encoding='UTF8', newline='') as f:
            writer = csv.writer(f)
            writer.writerow([_hidden_channels, _solver, nb_params, loss_train, loss_val, loss_test])

    print('Best model saved in:', checkpoint_file)


@hydra.main(version_base=None, config_path="../config/", config_name="nrde")
def main(cfg: DictConfig):
    # print(OmegaConf.to_yaml(cfg, resolve=True))

    # Set random seed
    seed = cfg.seed
    torch.manual_seed(seed)
    torch.cuda.manual_seed(seed)
    torch.cuda.manual_seed_all(seed)
    np.random.seed(seed)
    random.seed(seed)
    torch.backends.cudnn.deterministic = True
    torch.backends.cudnn.benchmark = False

    train(cfg)
    # hyperparameter_search(cfg)


if __name__ == '__main__':
    main()