import numpy as np
from econml.utilities import cross_product
from statsmodels.tools.tools import add_constant
from utility import new_cov_matrix, generate_coefs, simulate_residuals_all, generate_dgp
import pandas as pd
import matplotlib.pyplot as plt
import joblib


class AbstracDynamicPanelDGP:

    def __init__(self, n_periods, n_treatments, n_x):
        self.n_periods = n_periods
        self.n_treatments = n_treatments
        self.n_x = n_x
        return

    def create_instance(self, *args, **kwargs):
        pass

    def _gen_data_with_policy(self, n_units, policy_gen, random_seed=123):
        pass

    def static_policy_data(self, n_units, tau, random_seed=123):
        def policy_gen(Tpre, X, period):
            return tau[period]
        return self._gen_data_with_policy(n_units, policy_gen, random_seed=random_seed)

    def adaptive_policy_data(self, n_units, policy_gen, random_seed=123):
        return self._gen_data_with_policy(n_units, policy_gen, random_seed=random_seed)

    def static_policy_effect(self, tau, mc_samples=1000):
        Y_tau, _, _, _ = self.static_policy_data(mc_samples, tau)
        Y_zero, _, _, _ = self.static_policy_data(
            mc_samples, np.zeros((self.n_periods, self.n_treatments)))
        return np.mean(Y_tau[np.arange(Y_tau.shape[0]) % self.n_periods == self.n_periods - 1]) - \
            np.mean(Y_zero[np.arange(Y_zero.shape[0]) %
                           self.n_periods == self.n_periods - 1])

    def adaptive_policy_effect(self, policy_gen, mc_samples=1000):
        Y_tau, _, _, _ = self.adaptive_policy_data(mc_samples, policy_gen)
        Y_zero, _, _, _ = self.static_policy_data(
            mc_samples, np.zeros((self.n_periods, self.n_treatments)))
        return np.mean(Y_tau[np.arange(Y_tau.shape[0]) % self.n_periods == self.n_periods - 1]) - \
            np.mean(Y_zero[np.arange(Y_zero.shape[0]) %
                           self.n_periods == self.n_periods - 1])


class DynamicPanelDGP(AbstracDynamicPanelDGP):

    def __init__(self, n_periods, n_treatments, n_x):
        super().__init__(n_periods, n_treatments, n_x)

    def create_instance(self, s_x, sigma_x, sigma_y, conf_str, epsilon, Alpha_unnormalized,
                        hetero_strength=0, hetero_inds=None,
                        autoreg=.5, state_effect=.5, random_seed=123):
        random_state = np.random.RandomState(random_seed)
        self.s_x = s_x
        self.conf_str = conf_str
        self.sigma_x = sigma_x
        self.sigma_y = sigma_y
        self.hetero_inds = hetero_inds.astype(
            int) if hetero_inds is not None else hetero_inds
        self.hetero_strength = hetero_strength
        self.autoreg = autoreg
        self.state_effect = state_effect
        self.random_seed = random_seed
        self.endo_inds = np.setdiff1d(
            np.arange(self.n_x), hetero_inds).astype(int)
        # The first s_x state variables are confounders. The final s_x variables are exogenous and can create
        # heterogeneity
        self.Alpha = Alpha_unnormalized
        self.Alpha /= np.linalg.norm(self.Alpha, axis=1, ord=1, keepdims=True)
        self.Alpha *= state_effect
        if self.hetero_inds is not None:
            self.Alpha[self.hetero_inds] = 0

        self.Beta = np.zeros((self.n_x, self.n_x))
        for t in range(self.n_x):
            self.Beta[t, :] = autoreg * np.roll(random_state.uniform(low=4.0**(-np.arange(
                0, self.n_x)), high=4.0**(-np.arange(1, self.n_x + 1))), t)
        if self.hetero_inds is not None:
            self.Beta[np.ix_(self.endo_inds, self.hetero_inds)] = 0
            self.Beta[np.ix_(self.hetero_inds, self.endo_inds)] = 0

        self.epsilon = epsilon
        self.zeta = np.zeros(self.n_x)
        self.zeta[:self.s_x] = self.conf_str / self.s_x

        self.y_hetero_effect = np.zeros(self.n_x)
        self.x_hetero_effect = np.zeros(self.n_x)
        if self.hetero_inds is not None:
            self.y_hetero_effect[self.hetero_inds] = random_state.uniform(.5 * hetero_strength, 1.5 * hetero_strength) / \
                len(self.hetero_inds)
            self.x_hetero_effect[self.hetero_inds] = random_state.uniform(.5 * hetero_strength, 1.5 * hetero_strength) / \
                len(self.hetero_inds)

        self.true_effect = np.zeros((self.n_periods, self.n_treatments))
        self.true_effect[0] = self.epsilon
        for t in np.arange(1, self.n_periods):
            self.true_effect[t, :] = (self.zeta.reshape(
                1, -1) @ np.linalg.matrix_power(self.Beta, t - 1) @ self.Alpha)

        self.true_hetero_effect = np.zeros(
            (self.n_periods, (self.n_x + 1) * self.n_treatments))
        self.true_hetero_effect[0, :] = cross_product(add_constant(self.y_hetero_effect.reshape(1, -1), has_constant='add'),
                                                      self.epsilon.reshape(1, -1))
        for t in np.arange(1, self.n_periods):
            self.true_hetero_effect[t, :] = cross_product(add_constant(self.x_hetero_effect.reshape(1, -1), has_constant='add'),
                                                          self.zeta.reshape(1, -1) @ np.linalg.matrix_power(self.Beta, t - 1) @ self.Alpha)

        return self

    def hetero_effect_fn(self, t, x):
        if t == 0:
            return (np.dot(self.y_hetero_effect, x.flatten()) + 1) * self.epsilon
        else:
            return (np.dot(self.x_hetero_effect, x.flatten()) + 1) *\
                (self.zeta.reshape(1, -1) @ np.linalg.matrix_power(self.Beta, t - 1)
                    @ self.Alpha).flatten()

    def _gen_data_with_policy(self, n_units, policy_gen, random_seed=123):
        random_state = np.random.RandomState(random_seed)
        Y = np.zeros(n_units * self.n_periods)
        T = np.zeros((n_units * self.n_periods, self.n_treatments))
        X = np.zeros((n_units * self.n_periods, self.n_x))
        groups = np.zeros(n_units * self.n_periods)
        for t in range(n_units * self.n_periods):
            period = t % self.n_periods
            if period == 0:
                X[t] = random_state.normal(0, self.sigma_x, size=self.n_x)
                T[t] = policy_gen(np.zeros(self.n_treatments), X[t], period, random_state)
            else:
                X[t] = (np.dot(self.x_hetero_effect, X[t - 1]) + 1) * np.dot(self.Alpha, T[t - 1]) + \
                    np.dot(self.Beta, X[t - 1]) + \
                    random_state.normal(0, self.sigma_x, size=self.n_x)
                T[t] = policy_gen(T[t - 1], X[t], period, random_state)
            Y[t] = (np.dot(self.y_hetero_effect, X[t]) + 1) * np.dot(self.epsilon, T[t]) + \
                np.dot(X[t], self.zeta) + \
                random_state.normal(0, self.sigma_y)
            groups[t] = t // self.n_periods

        return Y, T, X, groups

    def observational_data(self, n_units, gamma, s_t, sigma_t, random_seed=123):
        """ Generated observational data with some observational treatment policy parameters

        Parameters
        ----------
        n_units : how many units to observe
        gamma : what is the degree of auto-correlation of the treatments across periods
        s_t : sparsity of treatment policy; how many states does it depend on
        sigma_t : what is the std of the exploration/randomness in the treatment
        """
        Delta = np.zeros((self.n_treatments, self.n_x))
        Delta[:, :s_t] = self.conf_str / s_t

        def policy_gen(Tpre, X, period, random_state):
            return gamma * Tpre + (1 - gamma) * np.dot(Delta, X) + \
                random_state.normal(0, sigma_t, size=self.n_treatments)
        return self._gen_data_with_policy(n_units, policy_gen, random_seed=random_seed)


class SemiSynthetic:

    def create_instance(self):
        # get new covariance matrix
        self.cov_new = joblib.load('cov_new.jbl')

        # get coefs
        self.index = ["proxy1", "proxy2", "proxy3", "proxy4",
                      "investment1", "investment2", "investment3", ]
        self.columns = [f"{ind}_{i}" for ind in self.index for i in range(-6, 0)] +\
            [f"demo_{i}" for i in range(47)]

        self.coef_df = generate_coefs(self.index, self.columns)
        self.n_proxies = 4
        self.n_treatments = 3

        # get residuals
        res_df = pd.DataFrame(columns = self.index)
        self.new_res_df = simulate_residuals_all(res_df)

    def gen_data(self, n, n_periods, thetas, random_seed):
        random_state = np.random.RandomState(random_seed)
        n_proxies = self.n_proxies
        n_treatments = self.n_treatments
        coef_matrix = self.coef_df.values
        residual_matrix = self.new_res_df.values
        n_x = len(self.columns)
        # proxy 1 is the outcome
        outcome = "proxy1"

        # make fixed residuals
        all_residuals = []
        for t in range(n_periods):
            sample_residuals = []
            for i in range(7):
                sample_residuals.append(
                    random_state.choice(residual_matrix[:, i], n))
            sample_residuals = np.array(sample_residuals).T
            all_residuals.append(sample_residuals)
        all_residuals = np.array(all_residuals)

        fn_df_control = generate_dgp(self.cov_new, n, n_periods,
                                     coef_matrix, all_residuals, thetas,
                                     [0, 0, 0], self.columns, self.index, False)

        fn_df_cf_control = generate_dgp(self.cov_new, n, n_periods,
                                        coef_matrix, all_residuals, thetas,
                                        [0, 0, 0], self.columns, self.index, True)
        true_effect = np.zeros((n_periods, n_treatments))
        for i in range(n_treatments):
            intervention = [0, 0, 0]
            intervention[i] = 1
            fn_df_treated = generate_dgp(self.cov_new, n, n_periods,
                                         coef_matrix, all_residuals, thetas,
                                         intervention, self.columns, self.index, True)
            for t in range(n_periods):
                ate_control = fn_df_cf_control.loc[
                    fn_df_control["datetime"] == t + 1, outcome
                ].mean()
                ate_treated = fn_df_treated.loc[
                    fn_df_treated["datetime"] == t + 1, outcome
                ].mean()
                true_effect[t, i] = ate_treated - ate_control

        panelX = fn_df_control[self.columns].values.reshape(-1, n_periods, n_x)
        panelT = fn_df_control[self.index[n_proxies:]
                               ].values.reshape(-1, n_periods, n_treatments)
        panelY = fn_df_control[outcome].values.reshape(-1, n_periods)
        panelGroups = fn_df_control["id"].values.reshape(-1, n_periods)
        return panelX, panelT, panelY, panelGroups, true_effect

    def plot_coefs(self):
        coef_df = self.coef_df
        plt.figure(figsize=(20, 20))
        for i in range(7):
            outcome = coef_df.index[i]
            plt.subplot(2, 4, i + 1)
            coef_list = coef_df.iloc[i]
            coef_list = coef_list[coef_list != 0]
            plt.plot(coef_list)
            plt.xticks(rotation=90)
            plt.title(f"outcome:{outcome}")
        plt.show()

    def plot_cov(self):
        plt.imshow(self.cov_new)
        plt.colorbar()
        plt.show()
