import os
import time

from copy import deepcopy

import numpy as np
import torch

from torch.utils.data import DataLoader

# from torchsummary import summary
from expmanager.utils_manager import (
    ExpDataset,
    add_log,
    compare_result,
    print_metrics,
    prob_to_gpu,
    save_pd,
)
from method.Models.utils_loss import l1_penalty, l2_penalty, str2twoStageLoss
from method.Predicts.wrapper_predicts import pred_model_wrapper
from method.utils_method import do_reduction, ndiv, to_array, to_device
from method.Optimizers.wrapper_opti import optimizer_wrapper

class ExpManager:
    """
    Experiment management class to enable running multiple experiment.

    Parameters
    ----------
    """

    def __init__(self, pred_model_args, args, conf, logger):
        self.args = args
        self.conf = conf
        self.logger = logger
        self.batch_size = self.args.batch_size
        self.model_args = self.conf["models"][self.args.opt_model]
        self.device = torch.device(
            f"cuda:{args.gpu}"
            if torch.cuda.is_available() and int(args.gpu) >= 0
            else "cpu"
        )
        self.logger.info(f"--- Running on {self.device}")
        # prediction model
        self.pred_model = pred_model_wrapper(args, pred_model_args)
        # print("self.pred_model: ", self.pred_model)
        self.logger.info(f"--- Built [{args.pred_model}] Prediction Model")
        # optimizer
        # optimizer:
        # self.optimizer = torch.optim.Adam(self.pred_model.parameters(), lr=args.lr)
        self.optimizer = optimizer_wrapper(args, self.pred_model.parameters())
        if args.use_lr_scheduling:
            self.scheduler = torch.optim.lr_scheduler.MultiStepLR(
                self.optimizer,
                milestones=[args.lr_milestone_1, args.lr_milestone_2],
                gamma=0.3162,
            )

    def run(self, problem, loss_fn, smooth_loss_fn, ptoSolver=None, n_epochs=1, do_debug=False):
        #   Move everything to device
        prob_to_gpu(problem, self.device)
        prob_to_gpu(ptoSolver, self.device)
        problem.device = self.device
        self.pred_model = self.pred_model.to(self.device)

        ############################## Data ##############################
        # Get data
        X_train, Y_train, Y_train_aux = problem.get_train_data()
        X_val, Y_val, Y_val_aux = problem.get_val_data()
        X_test, Y_test, Y_test_aux = problem.get_test_data()

        ############################## Preliminary Evaluation ##############################
        #   Document the optimal value
        # TODO: !!! use exact sovler for optimal
        Z_train_opt, Objs_train_opt = problem.get_decision(
            Y_train,
            params=Y_train_aux,
            ptoSolver=ptoSolver,
            isTrain=False,
            **problem.init_API(),
        )
        Z_val_opt, Objs_val_opt = problem.get_decision(
            Y_val,
            params=Y_val_aux,
            ptoSolver=ptoSolver,
            isTrain=False,
            **problem.init_API(),
        )

        Objs_val_opt = to_array(Objs_val_opt)
        #
        Z_test_opt, Objs_test_opt = problem.get_decision(
            Y_test,
            params=Y_test_aux,
            ptoSolver=ptoSolver,
            isTrain=False,
            **problem.init_API(),
        )
        Objs_test_opt = to_array(Objs_test_opt)
        # save
        problem.z_train_opt = Z_train_opt
        problem.z_val_opt = Z_val_opt
        problem.z_test_opt = Z_test_opt
        ###   Document the value of a random guess
        # objs_rand = list()
        # for _ in range(10):
        #     rand_Y = rand_like(Y_test, device=self.device)
        #     Z_test_rand, Objs_test_rand = problem.get_decision(
        #         rand_Y,
        #         params=Y_test_aux,
        #         ptoSolver=ptoSolver,
        #         isTrain=False,
        #         **problem.init_API(),
        #     )
        #     objs_rand.append(Objs_test_rand)
        # objs_rand = torch.stack(to_tensor(objs_rand))
        objs_rand = torch.zeros(10)
        ############################# Load previous model #############################
        if self.args.trained_path != "":
            self.pred_model.load_state_dict(torch.load(self.args.trained_path))
            self.logger.info(f"--- Loaded model from {self.args.trained_path}")
        ############################# Pretrain #############################
        if self.args.pretrain == True:
            # fetch pretrain data:
            if hasattr(problem, "get_pretrain_data"):
                X_pretrain, Y_pretrain, Y_pretrain_aux = problem.get_pretrain_data()
            else:  # pretrain with DFL train data
                X_pretrain, Y_pretrain, Y_pretrain_aux = X_train, Y_train, Y_train_aux

            # Pretrain prediction model
            total_train_time = 0.0
            best = (float("inf"), None)
            time_since_best = 0
            train_logs = {
                "epoch": [],
                "obj": [],
                "loss": [],
                "pred_loss": [],
                "eval": [],
            }
            val_logs = {
                "epoch": [],
                "obj": [],
                "loss": [],
                "pred_loss": [],
                "eval": [],
            }
            # loss function
            twostage_criterion = str2twoStageLoss(problem)
            self.logger.info("Pretraining Prediction Model...")
            self.pred_model.train()
            best_epoch = 0
            for ptr_epoch in range(1, self.args.n_ptr_epochs + 1):
                ###### one-shot training
                time_train_start = time.time()
                preds = self.pred_model(X_pretrain)
                loss = twostage_criterion(problem, preds, Y_pretrain, **self.model_args)

                self.optimizer.zero_grad()
                loss.backward()
                self.optimizer.step()
                # update time
                time_since_best += 1
                total_train_time += time.time() - time_train_start

                if do_debug:
                    torch.save(
                        preds.detach().cpu(),
                        os.path.join(
                            self.args.bkup_log_dir, "tensors", f"preds-ptr-EP{ptr_epoch}.pt"
                        ),
                    )
                ###### Check metrics on val set
                self.logger.info(
                    f"Previous best epoch: {best_epoch}, time since best: {time_since_best}"
                )
                if ptr_epoch % self.args.valfreq != 0:
                    datasets = [
                        (X_pretrain, Y_pretrain, Y_pretrain_aux, "pretrain"),
                    ]
                    metrics = print_metrics(
                        datasets,
                        self.pred_model,
                        problem,
                        twostage_criterion,
                        twostage_criterion,
                        ptoSolver,
                        f"Ptr iter {ptr_epoch},",
                        self.logger,
                        do_debug=do_debug,
                        batch_size=self.args.batch_size,
                        **self.model_args,
                    )
                    add_log(train_logs, "Ptr-" + str(ptr_epoch), metrics, "pretrain")
                else:
                    # Compute metrics
                    datasets = [
                        (X_pretrain, Y_pretrain, Y_pretrain_aux, "pretrain"),
                        (X_val, Y_val, Y_val_aux, "val"),
                    ]
                    metrics = print_metrics(
                        datasets,
                        self.pred_model,
                        problem,
                        twostage_criterion,
                        twostage_criterion,
                        ptoSolver,
                        f"Ptr iter {ptr_epoch},",
                        self.logger,
                        do_debug=do_debug,
                        batch_size=self.args.batch_size,
                        **self.model_args,
                    )
                    add_log(train_logs, "Ptr-" + str(ptr_epoch), metrics, "pretrain")
                    add_log(val_logs, "Ptr-" + str(ptr_epoch), metrics, "val")
                    # Save model if it's the best one
                    if best[1] is None or compare_result(metrics["val"], best):
                        best = (metrics["val"]["eval"]["value"], deepcopy(self.pred_model))
                        time_since_best = 0
                        best_epoch = ptr_epoch
                        # save
                        torch.save(
                            self.pred_model.state_dict(),
                            os.path.join(
                                self.args.log_dir, "checkpoints", "ptr_pred_best.pt"
                            ),
                        )
                        torch.save(
                            self.pred_model.state_dict(),
                            os.path.join(
                                self.args.bkup_log_dir, "checkpoints", "ptr_pred_best.pt"
                            ),
                        )
                # Stop if model hasn't improved for patience steps
                if self.args.earlystopping and time_since_best > self.args.patience:
                    break

            if best[1]:
                self.pred_model = deepcopy(best[1])
        else:
            self.pred_model.load_state_dict(torch.load(os.path.join(self.args.log_dir, "checkpoints", "ptr_pred_best.pt")))

        ############################# Train #############################
        # optimizer:
        # self.optimizer = torch.optim.Adam(self.pred_model.parameters(), lr=self.args.lr)
        self.optimizer = optimizer_wrapper(self.args, self.pred_model.parameters())
        # dataset loader
        train_dataset = ExpDataset(X_train, Y_train, Y_train_aux)
        train_loader = DataLoader(
            train_dataset, batch_size=self.args.batch_size, shuffle=True
        )
        # Train PTO
        time_since_best = 0
        self.logger.info("Training Model...")
        self.pred_model.train()
        best_epoch = 0
        for iter_idx in range(1, n_epochs + 1):
            time_train_start = time.time()
            losses = list()
            for batch_id, batch in enumerate(train_loader):
                X_batch, Y_batch, Y_aux_batch = batch["X"], batch["Y"], batch["Y_aux"]
                preds = self.pred_model(X_batch)
                loss = loss_fn(
                    problem,
                    coeff_hat=preds,
                    coeff_true=Y_batch,
                    params=Y_aux_batch,
                    partition="train",
                    index=batch_id,
                    do_debug=do_debug,
                    **self.model_args,
                ) + smooth_loss_fn(
                    problem,
                    coeff_hat=preds,
                    coeff_true=Y_batch,
                    params=Y_aux_batch,
                    partition="train",
                    index=batch_id,
                    do_debug=do_debug,
                    **self.model_args,
                )
                if self.args.opt_name == "sgd":
                    loss = do_reduction(loss, self.model_args["reduction"])
                    # add penalty
                    if self.args.l1_weight > 0:
                        loss += self.args.l1_weight * l1_penalty(self.pred_model)
                    if self.args.l2_weight > 0:
                        loss += self.args.l2_weight * l2_penalty(self.pred_model)

                    self.optimizer.zero_grad()
                    loss.backward()
                    self.optimizer.step()
                    # losses.append(loss_idx)
                    if self.args.use_lr_scheduling:
                        self.scheduler.step()
                elif self.args.opt_name == "gd":
                    losses.append(loss)
                else:
                    raise NotImplementedError

            if self.args.opt_name == "gd":
                losses = do_reduction(torch.stack(losses), self.model_args["reduction"])
                self.optimizer.zero_grad()
                losses.backward()
                self.optimizer.step()
                if self.args.use_lr_scheduling:
                    self.scheduler.step()

            # accuracy = (preds.round() * Y_train).sum() / Y_train.sum()
            # print("accuracy: ", accuracy)
            # loss = torch.stack(losses)
            time_since_best += 1
            total_train_time += time.time() - time_train_start

            ###### Check metrics on val set
            self.logger.info(
                f"Previous best epoch: {best_epoch}, time since best: {time_since_best}"
            )
            if iter_idx % self.args.valfreq != 0:
                datasets = [
                    (X_train, Y_train, Y_train_aux, "train"),
                ]
                metrics = print_metrics(
                    datasets,
                    self.pred_model,
                    problem,
                    loss_fn,
                    twostage_criterion,
                    ptoSolver,
                    f"Iter {iter_idx},",
                    self.logger,
                    do_debug=do_debug,
                    batch_size=self.args.batch_size,
                    **self.model_args,
                )
                add_log(train_logs, "Tr-" + str(iter_idx), metrics, "train")
            else:
                # Compute metrics
                datasets = [
                    (X_train, Y_train, Y_train_aux, "train"),
                    (X_val, Y_val, Y_val_aux, "val"),
                ]
                metrics = print_metrics(
                    datasets,
                    self.pred_model,
                    problem,
                    loss_fn,
                    twostage_criterion,
                    ptoSolver,
                    f"Iter {iter_idx},",
                    self.logger,
                    do_debug=do_debug,
                    batch_size=self.args.batch_size,
                    **self.model_args,
                )
                add_log(train_logs, "Tr-" + str(iter_idx), metrics, "train")
                add_log(val_logs, "Tr-" + str(iter_idx), metrics, "val")
                # Save model if it's the best one
                if best[1] is None or compare_result(metrics["val"], best):
                    best = (metrics["val"]["eval"]["value"], deepcopy(self.pred_model))
                    time_since_best = 0
                    best_epoch = iter_idx
                    # save
                    torch.save(
                        self.pred_model.state_dict(),
                        os.path.join(self.args.log_dir, "checkpoints", "tr_pred_best.pt"),
                    )
                    torch.save(
                        self.pred_model.state_dict(),
                        os.path.join(
                            self.args.bkup_log_dir, "checkpoints", "tr_pred_best.pt"
                        ),
                    )
                # Stop if model hasn't improved for patience steps
                if self.args.earlystopping and time_since_best > self.args.patience:
                    break

        if best[1]:
            self.pred_model = deepcopy(best[1])

        ############################# Evaluate final model #############################
        # Document how well this trained model does
        self.logger.info("Benchmarking Model...")
        # Print final metrics
        datasets = [
            (X_train, Y_train, Y_train_aux, "train"),
            (X_val, Y_val, Y_val_aux, "val"),
            (X_test, Y_test, Y_test_aux, "test"),
        ]
        results = print_metrics(
            datasets,
            self.pred_model,
            problem,
            loss_fn,
            twostage_criterion,
            ptoSolver,
            "Final",
            self.logger,
            do_debug=do_debug,
            batch_size=self.args.batch_size,
            **self.model_args,
        )
        total_test_time = results["test"]["time"]
        eval_value = results["test"]["eval"]["value"]
        ############################ Save to file ############################
        # save logs
        save_pd(train_logs, os.path.join(self.args.log_dir, "train_logs.csv"))
        save_pd(val_logs, os.path.join(self.args.log_dir, "val_logs.csv"))
        # save logs 2
        save_pd(train_logs, os.path.join(self.args.bkup_log_dir, "train_logs.csv"))
        save_pd(val_logs, os.path.join(self.args.bkup_log_dir, "val_logs.csv"))
        # save objectives
        np.save(
            os.path.join(self.args.log_dir, "results.npy"),
            [to_device(Objs_test_opt, "cpu"), to_device(eval_value, "cpu")],
        )
        np.save(
            os.path.join(self.args.bkup_log_dir, "results.npy"),
            [to_device(Objs_test_opt, "cpu"), to_device(eval_value, "cpu")],
        )
        # save solutions
        if do_debug:
            Z_test_opt_array = to_array(Z_test_opt)
            np.save(
                os.path.join(self.args.bkup_log_dir, "tensors", "solution.npy"),
                Z_test_opt_array,
            )
            torch.save(
                results["test"]["preds"].cpu().detach(),
                os.path.join(self.args.bkup_log_dir, "tensors", "preds.pt"),
            )

        ############################ Logging ############################
        avg_train_time = ndiv(total_train_time, (self.args.n_ptr_epochs + n_epochs))
        avg_test_time = total_test_time
        self.logger.info(
            f"[Random Obj]: {objs_rand.mean().item():.5f} "
            f"[Optimal Obj]: {Objs_test_opt.mean().item():.5f} "
            f"[{problem.get_eval_metric()}]: {eval_value.mean():.5f} "
            f"[avg Train Time]: {avg_train_time:.5f} "
            f"[avg Test Time]: {avg_test_time:.5f} "
        )
        self.logger.info(
            f"[{self.args.opt_model}]  {results['test']['objective'].mean():.5f}  {eval_value.mean():.5f}  "
            f"{avg_train_time:.5f}  {avg_test_time:.5f}"
        )
        return True
