import datetime as dt
import os
import random

import pandas as pd
import quandl
import torch

from gurobipy import GRB  # pylint: disable=no-name-in-module
import numpy as np
from openpto.method.utils_method import to_tensor,to_array
from openpto.problems.PTOProblem import PTOProblem
from openpto.method.Solvers.cvxpy.cp_port import PortfolioSolver

# SECURITY: an API credential is committed to source control here. Supply the
# key through the QUANDL_API_KEY environment variable instead; the literal is
# kept only as a backward-compatible fallback and should be rotated and removed.
quandl.ApiConfig.api_key = os.environ.get("QUANDL_API_KEY", "3Uxzq4TZV5V9RghuRYsY")


class PortfolioOpt(PTOProblem):
    """ """

    def __init__(
        self,
        num_train_instances=200,  # number of *days* to use from the dataset to train
        num_test_instances=200,  # number of *days* to use from the dataset to test
        num_stocks=50,  # number of stocks per instance to choose from
        val_frac=0.2,  # fraction of the training days held out for validation
        rand_seed=0,  # for reproducibility
        alpha=0.1,  # risk aversion constant
        prob_version="real",
        data_dir="openpto/data",  # directory to store data
    ):
        """
        Load the stock data and split the leading days into train/val/test index lists.

        The first ``num_train_instances`` days form the training pool, of which the
        last ``int(val_frac * num_train_instances)`` are used for validation; the
        following ``num_test_instances`` days are the test set.
        ``prob_version`` is accepted but not read by this constructor.

        :raises AssertionError: if the requested number of days is not smaller than
            the number of days available, or if ``val_frac`` is not in (0, 1).
        """
        super(PortfolioOpt, self).__init__()
        # Fix the seed before loading: the stock subset is drawn with `random.sample`.
        # `_set_seed` is inherited from the parent class (not visible here).
        self.rand_seed = rand_seed
        self._set_seed(self.rand_seed)

        # Load features, targets and per-day covariance matrices
        self.num_stocks = num_stocks
        self.Xs, self.Ys, self.covar_mat = self._load_instances(data_dir, num_stocks)

        # Sanity checks on the requested split sizes
        total_days = self.Xs.shape[0]
        self.num_train_instances = num_train_instances
        self.num_test_instances = num_test_instances
        num_days = self.num_train_instances + self.num_test_instances
        assert num_days < total_days, (
            "num_train_instances + num_test_instances ({}) must be smaller than "
            "the number of available days ({})".format(num_days, total_days)
        )
        assert 0 < val_frac < 1, "val_frac must lie strictly between 0 and 1"
        self.val_frac = val_frac

        # Contiguous day indices: [train | val | test]
        idxs = list(range(num_days))
        num_val = int(self.val_frac * self.num_train_instances)
        first_val = self.num_train_instances - num_val
        self.train_idxs = idxs[:first_val]
        self.val_idxs = idxs[first_val : self.num_train_instances]
        self.test_idxs = idxs[self.num_train_instances :]

        # TODO: Try larger constant
        self.alpha = alpha

        # Undo random seed setting
        self._set_seed()

    def init_API(self):
        """
        Describe this problem as a dict of settings.

        :return: dict with the optimisation sense (maximise), the risk-aversion
            constant and the number of stocks. Presumably consumed when a solver
            is constructed -- confirm against the caller.
        """
        api_config = dict(
            modelSense=GRB.MAXIMIZE,
            alpha=self.alpha,
            num_stocks=self.num_stocks,
        )
        return api_config

    def _load_instances(
        self,
        data_dir,
        stocks_per_instance,
        reg=0.1,
    ):
        # Get raw data
        feature_mat, target_mat, _, future_mat, _, dates, symbols = self._get_data(
            data_dir=data_dir
        )

        # Split into instances
        # Sample stocks in a day to define an instance
        total_stocks = len(symbols)
        stocks_subset = random.sample(range(total_stocks), stocks_per_instance)
        feature_mat = feature_mat[:, stocks_subset]
        target_mat = target_mat[:, stocks_subset]
        future_mat = future_mat[:, stocks_subset]

        # Calculate covariances
        def computeCovariance(
            future_mat,
            correl=True,  # Normalise covariance matrix to get correlation matrix
        ):
            # Normalize
            mean = future_mat.mean(dim=-1, keepdim=True)
            fm_norm = future_mat - mean  # normalised future matrix
            if correl is True:
                std = (
                    future_mat.square().mean(dim=-1, keepdim=True) - mean.square()
                ).sqrt()
                fm_norm = fm_norm / std

            # Compute covariance
            # TODO: See if things change if you get rid of num_samples
            num_samples = future_mat.shape[-1]
            spi = future_mat.shape[-2]  # stocks per instance
            covar_raw = [
                (
                    fm_norm
                    * fm_norm[..., i : i + 1, :].repeat(
                        (*((1,) * (fm_norm.ndim - 2)), spi, 1)
                    )
                ).sum(dim=-1)
                for i in range(spi)
            ]
            covar_mat_unreg = torch.stack(covar_raw, dim=-1) / (num_samples - 1)

            # Add regularisation to make sure that the covariance matrix is positive-definite
            covar_mat = covar_mat_unreg + reg * torch.eye(spi)

            return covar_mat

        covar_mat = computeCovariance(future_mat)

        # Normalize features
        num_features = feature_mat.shape[-1]
        feature_mat_flat = feature_mat.reshape(-1, num_features)
        feature_mat = torch.div(
            (feature_mat - torch.mean(feature_mat_flat, dim=0)),
            (torch.std(feature_mat_flat, dim=0) + 1e-12),
        )

        return feature_mat.float(), target_mat.float(), covar_mat.float()
    
    def _get_price_feature_df(
        self,
        overwrite=False,
    ):
        """
        Return the per-(Date, Symbol) price-feature table, using CSV caches when present.

        If ``self.price_feature_file`` exists (and ``overwrite`` is false) it is read
        and returned directly. Otherwise raw prices are read from
        ``self.raw_historical_price_file`` or downloaded and saved there, the
        rolling-window features are computed per symbol, joined with the raw price
        columns, and the result is written to ``self.price_feature_file``.
        Both file paths are set by ``_get_data``, which must have run first.

        :param overwrite: when true, ignore both CSV caches and rebuild them.
            Note that ``_load_raw_symbols`` is still called with its default
            ``overwrite=False``.
        :return: DataFrame indexed by ("Date", "Symbol")
        """
        if not overwrite and os.path.exists(self.price_feature_file):
            print("Loading dataset...")
            price_feature_df = pd.read_csv(
                self.price_feature_file, index_col=["Date", "Symbol"]
            )
        else:
            # Get raw prices: prefer the cached CSV, otherwise download and cache
            if not overwrite and os.path.exists(self.raw_historical_price_file):
                raw_price_df = pd.read_csv(
                    self.raw_historical_price_file, index_col=["Date", "Symbol"]
                )
            else:
                symbol_df = self._load_raw_symbols()
                raw_price_df = self._download_prices(symbol_df)
                print("saving the data to ...", self.raw_historical_price_file)
                raw_price_df.to_csv(self.raw_historical_price_file)

            # Keep only symbols whose row count equals the largest row count seen
            # for any symbol, i.e. drop symbols with missing timesteps
            max_num_timesteps = (
                raw_price_df.groupby("Symbol").apply(lambda x: x.shape[0]).max()
            )
            raw_price_feature_df = raw_price_df.groupby("Symbol").filter(
                lambda x: x.shape[0] == max_num_timesteps
            )

            # Compute features for each symbol; droplevel(0) removes the outermost
            # index level of the apply result (presumably the group counter that
            # groupby(as_index=False).apply prepends -- verify on the pandas
            # version in use)
            feature_df = (
                raw_price_feature_df.groupby("Symbol", as_index=False)
                .apply(self._compute_monthly_cols)
                .droplevel(0)
            )

            # Attach the raw price columns to the feature rows, matching on the
            # (Date, Symbol) index, then drop index levels left unused by the
            # filtering above before caching the table
            price_feature_df = feature_df.join(raw_price_df, on=["Date", "Symbol"])
            price_feature_df.index = price_feature_df.index.remove_unused_levels()
            price_feature_df.to_csv(self.price_feature_file)

        return price_feature_df

    def _compute_monthly_cols(self, symbol_df):
        returns = symbol_df.Close.pct_change()

        prev_365_returns = symbol_df.Close.pct_change(365)
        prev_120_returns = symbol_df.Close.pct_change(120)
        prev_30_returns = symbol_df.Close.pct_change(30)
        prev_7_returns = symbol_df.Close.pct_change(7)

        rolling_365 = symbol_df.Close.rolling(window=365)
        rolling_120 = symbol_df.Close.rolling(window=120)
        rolling_30 = symbol_df.Close.rolling(window=30)
        rolling_7 = symbol_df.Close.rolling(window=7)
        rolling_3 = symbol_df.Close.rolling(window=3)

        rolling_returns = returns.rolling(7)

        result_data = {
            # "next10_return": returns.shift(-10),
            # "next9_return": returns.shift(-9),
            # "next8_return": returns.shift(-8),
            # "next7_return": returns.shift(-7),
            # "next6_return": returns.shift(-6),
            # "next5_return": returns.shift(-5),
            # "next4_return": returns.shift(-4),
            # "next3_return": returns.shift(-3),
            # "next2_return": returns.shift(-2),
            # "next1_return": returns.shift(-1),
            "cur_return": returns,
            "prev1_return": returns.shift(1),
            "prev2_return": returns.shift(2),
            "prev3_return": returns.shift(3),
            "prev4_return": returns.shift(4),
            "prev5_return": returns.shift(5),
            "prev6_return": returns.shift(6),
            "prev7_return": returns.shift(7),
            "prev8_return": returns.shift(8),
            "prev9_return": returns.shift(9),
            "prev10_return": returns.shift(10),
            "prev_year_return": prev_365_returns,
            "prev_qtr_return": prev_120_returns,
            "prev_month_returns": prev_30_returns,
            "prev_week_returns": prev_7_returns,
            "return_rolling_mean": rolling_returns.mean(),
            "return_rolling_var": rolling_returns.var(),
            "rolling_365_mean": rolling_365.mean(),
            "rolling_365_var": rolling_365.var(),
            "rolling_120_mean": rolling_120.mean(),
            "rolling_120_var": rolling_120.var(),
            "rolling_30_mean": rolling_30.mean(),
            "rolling_30_var": rolling_30.var(),
            "rolling_7_mean": rolling_7.mean(),
            "rolling_7_var": rolling_7.var(),
            "rolling_3_mean": rolling_3.mean(),
            "rolling_3_var": rolling_3.var(),
        }
        feature_data = pd.DataFrame(result_data).dropna()
        return feature_data

    def _download_symbols(self):
        """
        Download the S&P 500 company list from Wikipedia.

        :return: the first table parsed from the page, with its first row as header
        """
        print("Downloading data from wiki...")
        page_url = "https://en.wikipedia.org/wiki/List_of_S%26P_500_companies"
        tables = pd.read_html(page_url, header=0)
        return tables[0]

    def _download_prices(self, symbol_df):
        """
        Download price series from quandl for every ticker in ``symbol_df.Symbol``.

        Uses ``self.start_date``, ``self.end_date`` and ``self.collapse`` as the
        query window and sampling setting.

        :param symbol_df: DataFrame with a ``Symbol`` column of ticker strings
        :return: DataFrame indexed by ("Date", "Symbol"), sorted by index, with one
            column per downloaded feature ("Adj. Close"/"Adj. Volume" renamed to
            "Close"/"Volume")
        """
        print("Downloading data from quandl...")

        # Dataset codes use "_" where the ticker has "."
        wiki_codes = "WIKI/" + symbol_df.Symbol.str.replace(".", "_", regex=False)
        # Request columns 11 and 12 of each dataset (presumably the adjusted
        # close and adjusted volume, given the rename at the end -- confirm)
        request_field = sorted(list(wiki_codes + ".11") + list(wiki_codes + ".12"))

        print("requesting {} tickers".format(len(request_field)))

        raw_s_data = quandl.get(
            request_field,
            start_date=self.start_date,
            end_date=self.end_date,
            collapse=self.collapse,
        )
        print("processing data...")

        # only keep columns where data was found, and parse column names
        found_mask = raw_s_data.columns.str.find(" - Not Found") == -1
        cols_to_keep = list(raw_s_data.columns[found_mask])
        raw_good_data = raw_s_data[cols_to_keep]
        raw_good_data.columns = raw_good_data.columns.str.replace("WIKI/", "")

        # split "<symbol> - <feature>" column names into a two-level column index
        name_parts = raw_good_data.columns.str.split(" - ")
        raw_good_data.columns = pd.MultiIndex.from_arrays(
            list(zip(*name_parts)),
            names=["Symbol", "Feature"],
        )

        # long format first, then pivot so rows are (Date, Symbol) and columns are features
        long_df = raw_good_data.reset_index().melt(id_vars=["Date"])
        price_df = pd.pivot_table(
            long_df,
            values="value",
            index=["Date", "Symbol"],
            columns="Feature",
            aggfunc="first",
        )

        num_found = len(list(price_df.index.levels[1]))
        print("found {} tickers".format(num_found))

        price_df = price_df.rename(
            columns={"Adj. Close": "Close", "Adj. Volume": "Volume"}
        )
        return price_df.sort_index()

    def _load_raw_symbols(
        self,
        overwrite=False,
    ):
        """
        Loads symbols if they exist otherwise download them using download symbols
        :return:
        """
        if not overwrite and os.path.exists(self.raw_symbol_file):
            print("Loading dataset...")
            return pd.read_csv(self.raw_symbol_file)
        else:
            symbol_df = self._download_symbols()
            symbol_df.to_csv(self.raw_symbol_file, index=False)
            return symbol_df

    def _get_price_feature_matrix(self, price_feature_df):
        num_dates, num_assets = map(len, price_feature_df.index.levels)
        price_matrix = price_feature_df.values.reshape((num_dates, num_assets, -1))
        return price_matrix

    def _get_data(
        self,
        data_dir,
        start_date=dt.datetime(2004, 1, 1),
        end_date=dt.datetime(2017, 1, 1),
        collapse="daily",
        overwrite=False,
    ):
        if not os.path.exists(data_dir):
            os.makedirs(data_dir)

        # Save constants
        self.start_date = start_date
        self.end_date = end_date
        self.collapse = collapse

        # Define data directories to write to
        self.raw_historical_price_file = os.path.join(
            data_dir,
            "raw_historical_prices_{}_{}_{}.csv".format(
                start_date.date(), end_date.date(), collapse
            ),
        )
        self.raw_symbol_file = os.path.join(data_dir, "raw_symbols.csv")
        self.price_feature_file = os.path.join(
            data_dir,
            "price_feature_mat_{}_{}_{}.csv".format(
                start_date.date(), end_date.date(), collapse
            ),
        )
        self.torch_file = os.path.join(
            data_dir,
            "price_data_{}_{}_{}.pt".format(start_date.date(), end_date.date(), collapse),
        )

        # Load data if it exists
        if not overwrite and os.path.exists(self.torch_file):
            print(f"Portfolio: Loading pytorch data... {self.torch_file}")
            (
                feature_mat,
                target_mat,
                feature_cols,
                future_mat,
                target_names,
                dates,
                symbols,
            ) = torch.load(self.torch_file)
        else:
            price_feature_df = self._get_price_feature_df()
            target_names = ["next1_return"]
            covariance_names = ["next{}_return".format(i) for i in range(2, 11)]
            feature_cols = [
                c
                for c in price_feature_df.columns
                if c not in target_names + covariance_names + ["Volume"]
            ]
            target_mat = torch.tensor(
                self._get_price_feature_matrix(price_feature_df[target_names])
            ).unsqueeze(-1)
            future_mat = torch.tensor(
                self._get_price_feature_matrix(price_feature_df[covariance_names])
            )
            feature_mat = torch.tensor(
                self._get_price_feature_matrix(price_feature_df[feature_cols])
            )
            dates = list(price_feature_df.index.levels[0])
            symbols = list(price_feature_df.index.levels[1])
            torch.save(
                [
                    feature_mat,
                    target_mat,
                    feature_cols,
                    future_mat,
                    target_names,
                    dates,
                    symbols,
                ],
                self.torch_file,
            )
        return (
            feature_mat,
            target_mat,
            feature_cols,
            future_mat,
            target_names,
            dates,
            symbols,
        )

    def get_train_data(self, **kwargs):
        return (
            self.Xs[self.train_idxs],
            self.Ys[self.train_idxs],
            self.covar_mat[self.train_idxs],
        )

    def get_val_data(self, **kwargs):
        return (
            self.Xs[self.val_idxs],
            self.Ys[self.val_idxs],
            self.covar_mat[self.val_idxs],
        )

    def get_test_data(self, **kwargs):
        return (
            self.Xs[self.test_idxs],
            self.Ys[self.test_idxs],
            self.covar_mat[self.test_idxs],
        )

    def get_model_shape(self):
        return self.Xs.shape[-1], 1

    def get_twostageloss(self):
        return "mse"

    def _get_covar_mat(self, instance_idxs):
        return self.covar_mat.reshape((-1, *self.covar_mat.shape[2:]))[instance_idxs]

    def get_decision(
        self, Y, aux_data=None, ptoSolver=None, max_instances_per_batch=1500, **kwargs
    ):
        # Get the sqrt of the covariance matrix
        covar_mat = self.covar_mat if aux_data is None else aux_data
        sqrt_covar = torch.linalg.cholesky(covar_mat)
        #print(Y.shape,sqrt_covar.shape) #torch.Size([320, 50, 1]) torch.Size([2898, 50, 50])
        # device
        Y = Y.cpu()
        def is_positive_definites   (Q_numpy):
         try:
            eigenvalues = np.linalg.eigvalsh(Q_numpy)
            return np.all(eigenvalues > 0)
         except np.linalg.LinAlgError:
            return False
        sqrt_covar = sqrt_covar.cpu()
        # Split Y into reasonably sized chunks so that we don't run into memory issues
        # Assumption Y is only 2D at max
        assert Y.ndim <= 3
        if Y.ndim == 3 or Y.ndim == 2:
            #print(Y.ndim)
            #print(Y.shape,sqrt_covar.shape)
            if Y.ndim == 3:
                Y = Y.squeeze(-1)
           ## print(Y.shape,sqrt_covar.shape)([320, 50]) torch.Size([2898, 50, 50])
            sols, objs = list(), list()
            for start in range(0, Y.shape[0], max_instances_per_batch):
                end = min(Y.shape[0], start + max_instances_per_batch)
                #print(Y.shape,sqrt_covar[start:end].shape) torch.Size([320, 50]) torch.Size([320, 50, 50])
                length=end-start
                for i in range(0,length):  
                        sol = ptoSolver.solve(Y[i], sqrt_covar[i])[0]

                        obj = self.get_objective(Y[i], sol, sqrt_covar[i])
                        sols.append(sol.tolist())
                        objs.append(obj.tolist())
            objs = torch.tensor(objs)
            sols = torch.tensor(sols)
        else:
            sols = ptoSolver.solve(Y, sqrt_covar)[0]
            objs = self.get_objective(Y, sols, sqrt_covar)
        return (
            sols,
            objs,
        )

    def get_objective(self, Y, Z, aux_data=None, **kwargs):
        """
        Evaluate the risk-adjusted return of decisions ``Z`` under returns ``Y``.

        :param Y: returns; a trailing singleton dimension on 3-D input is squeezed
        :param Z: decisions (portfolio weights)
        :param aux_data: matrix used directly as the square-root factor in the
            quadratic term; when omitted, the Cholesky factor of
            ``self.covar_mat`` is used
        :return: ``sum(Y * Z) - alpha * ||factor applied to Z||^2`` over the last dim
        """
        # TODO: look at either torch.bmm or torch.matmul
        if aux_data is None:
            sqrt_factor = torch.linalg.cholesky(self.covar_mat)
        else:
            sqrt_factor = aux_data

        # Bring both operands onto the factor's device
        device = sqrt_factor.device
        returns = to_tensor(Y).to(device)
        weights = to_tensor(Z).to(device)
        if returns.ndim == 3:
            returns = returns.squeeze(-1)

        # Row-wise sum of factor * weights, i.e. the factor applied to the weights
        projected = (sqrt_factor * weights.unsqueeze(dim=-2)).sum(dim=-1)
        risk_penalty = projected.square().sum(dim=-1)
        expected_return = (returns * weights).sum(dim=-1)
        return expected_return - self.alpha * risk_penalty

    def get_output_activation(self):
        return "tanh"


if __name__ == "__main__":
    # Smoke test: build the problem, solve the training instances and re-evaluate
    # the objective of the resulting decisions.
    problem = PortfolioOpt()
    X_train, Y_train, Y_train_aux = problem.get_train_data()

    # get_decision needs a solver; calling it with the default ptoSolver=None fails.
    # NOTE(review): assumes PortfolioSolver accepts the init_API() dict as keyword
    # arguments -- confirm against its constructor.
    solver = PortfolioSolver(**problem.init_API())

    # get_decision returns a (solutions, objectives) pair, not just the solutions
    Z_train, obj_train = problem.get_decision(
        Y_train, aux_data=Y_train_aux, ptoSolver=solver
    )

    # get_objective uses aux_data directly as the square-root factor, so pass the
    # Cholesky factor of the covariance (as get_decision does internally)
    obj = problem.get_objective(
        Y_train, Z_train, aux_data=torch.linalg.cholesky(Y_train_aux)
    )
