# Copyright 2022-present, Lorenzo Bonicelli, Pietro Buzzega, Matteo Boschini, Angelo Porrello, Simone Calderara.
# All rights reserved.
# This source code is licensed under the license found in the
# LICENSE file in the root directory of this source tree.
# import os
# os.environ["CUDA_VISIBLE_DEVICES"] = "6"
import numpy  # needed (don't change it)
import importlib
import os, pdb
import socket
import sys
from argparse import Namespace


mammoth_path = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
sys.path.append(mammoth_path)
sys.path.append(mammoth_path + '/dataset')
sys.path.append(mammoth_path + '/backbone')
sys.path.append(mammoth_path + '/models')

import datetime
import uuid
from argparse import ArgumentParser

import setproctitle
import torch
from dataset.utils.gcl_dataset import GCLDataset
from dataset.utils.continual_dataset import ContinualDataset#, get_dataset
from dataset import get_dataset
from models import get_all_models, get_model

from utils.args import add_management_args
from utils.conf import set_random_seed
from utils.continual_training import train as ctrain
from utils.distributed import make_dp
from utils.training import train

torch.manual_seed(0)
torch.cuda.manual_seed_all(0)
torch.backends.cudnn.deterministic = True
torch.backends.cudnn.benchmark = False
torch.cuda.manual_seed(0)
numpy.random.seed(0)

def lecun_fix():
    # Yann moved his website to CloudFlare. You need this now
    from six.moves import urllib  # pyright: ignore
    opener = urllib.request.build_opener()
    opener.addheaders = [('User-agent', 'Mozilla/5.0')]
    urllib.request.install_opener(opener)


def parse_args():
    parser = ArgumentParser(description='mammoth', allow_abbrev=False)
    parser.add_argument('--model', type=str, required=True,
                        help='Model name.', choices=get_all_models())
    torch.set_num_threads(4)
    add_management_args(parser)
    args = parser.parse_known_args()[0]
    mod = importlib.import_module('models.' + args.model)


    get_parser = getattr(mod, 'get_parser')
    parser = get_parser()
    args = parser.parse_args()
    args.train_eps = args.train_eps / 255.
    args.train_alpha = args.train_alpha / 255.
    args.test_eps = args.test_eps / 255.
    args.test_alpha = args.test_alpha / 255.
    
    if args.seed is not None:
        set_random_seed(args.seed)


    ## added for normalization
    if args.dataset == 'seq-cifar100':
        args.dataset_mean = (0.5071, 0.4867, 0.4408)
        args.dataset_std = (0.2675, 0.2565, 0.2761)
    elif args.dataset == 'seq-cifar10':
        args.dataset_mean = (0.4913, 0.4821, 0.4465)
        args.dataset_std = (0.2470, 0.2434, 0.2615)
    elif args.dataset == 'seq-tinyimg':
        args.dataset_mean = (0.4802, 0.4480, 0.3975)
        args.dataset_std = (0.2770, 0.2691, 0.2821)
    elif args.dataset == 'seq-stl10':
        args.dataset_mean = (0.4914, 0.4822, 0.4465)
        args.datatset_std = (0.2470, 0.2435, 0.2615)
    else :
        args.dataset_mean = None
        args.dataset_std = None
    ###
    return args


def main(args=None):
    lecun_fix()
    if args is None: 
        args = parse_args()
    # Add uuid, timestamp and hostname for logging
    args.conf_jobnum = str(uuid.uuid4())
    args.conf_timestamp = str(datetime.datetime.now())
    args.conf_host = socket.gethostname()
    dataset = get_dataset(args)

    if args.n_epochs is None and isinstance(dataset, ContinualDataset):
        args.n_epochs = dataset.get_epochs()
    if args.batch_size is None:
        args.batch_size = dataset.get_batch_size()
    if hasattr(importlib.import_module('models.' + args.model), 'Buffer') and args.minibatch_size is None:
        args.minibatch_size = dataset.get_minibatch_size()

    backbone = dataset.get_backbone(args)
    loss = dataset.get_loss()
    model = get_model(args, backbone, loss, dataset.get_transform())

    if args.distributed == 'dp':
        model.net = make_dp(model.net)
        model.to('cuda:0')
        args.conf_ngpus = torch.cuda.device_count()
    elif args.distributed == 'ddp':
        # DDP breaks the buffer, it has to be synchronized.
        raise NotImplementedError('Distributed Data Parallel not supported yet.')

    # set job name
    setproctitle.setproctitle('{}_{}_{}'.format(args.model, args.buffer_size if 'buffer_size' in args else 0, args.dataset))

    if isinstance(dataset, ContinualDataset):
        train(model, dataset, args)
    else:
        assert not hasattr(model, 'end_task') or model.NAME == 'joint_gcl'
        ctrain(args)


if __name__ == '__main__':
    main()
