 # !/usr/bin/env python
# coding: utf-8

# Importing python packages
import numpy as np
import matplotlib.pyplot as plt
import scipy.stats as ss


# ### Plotting ###
# Getting Average regret and Confidence interval
def cumulative_regret_error(regret):
    time_horizon = [0]
    samples = len(regret[0])
    runs = len(regret)
    batch = samples / 20
    # batch = 40

    # Time horizon
    t = 0
    while True:
        t += 1
        if time_horizon[-1] + batch > samples:
            if time_horizon[-1] != samples:
                time_horizon.append(time_horizon[-1] + samples % batch)
            break
        time_horizon.append(time_horizon[-1] + batch)

    # Mean batch regret of R runs
    avg_batched_regret = []
    for r in range(runs):
        count = 0
        accumulative_regret = 0
        batch_regret = [0]
        for s in range(samples):
            count += 1
            accumulative_regret += regret[r][s]
            if count == batch:
                batch_regret.append(accumulative_regret)
                count = 0

        if samples % batch != 0:
            batch_regret.append(accumulative_regret)
        avg_batched_regret.append(batch_regret)

    regret = np.mean(avg_batched_regret, axis=0)

    # Confidence interval
    conf_regret = []
    freedom_degree = runs - 1
    for r in range(len(avg_batched_regret[0])):
        conf_regret.append(ss.t.ppf(0.95, freedom_degree) *
                           ss.sem(np.array(avg_batched_regret)[:, r]))
    return time_horizon, regret, conf_regret


# # ### Plotting Regret ###
# Plot and problem details
plot_types = ['algo_regret']
file_location = "data/plots/"
problem = "linear"      # "linear", levy", "cosine", "square", "ackley"
contexts = 1000
agents = 5
arm_copies = 1
dim = 5
eta = 0.1
eta_noise = 0.1
seed = 1
problem_instance = problem + "_{}_{}_{}_{}_{}_{}_{}".format(contexts, agents, arm_copies, dim, eta, eta_noise, seed)

# Learner details
lamdba = 0.01
delta = 0.05
sigma = 0.1
runs = 50
learner_info = "{}_{}_{}_{}".format(lamdba, delta, sigma, runs)

# Algorithms to compare
algos = [
    # 'Uniform',
    # 'LinUCB',
    # 'LinTS',
    # 'OptGTM',
    'COBRA (UCB)',
    'COBRA (TS)'
]

# Plotting the average regret
colors = list("rgbcmkyrb")
shape = ['--^', '--v', '--*', '--H', '--d', '--+', '--v', '--^']
x_axis = [i for i in range(1, contexts+1)]


############ Ploting the average regret vs. eta ############
eta_values = [0.1, 0.2, 0.3, 0.4, 0.5, 0.6]
# Fetching data from the files 
for a in algos:
    for e in range(len(eta_values)):
        problem_instance = problem + "_{}_{}_{}_{}_{}_{}_{}".format(contexts, agents, arm_copies, dim, eta_values[e], eta_noise, seed)
        if a == 'COBRA (UCB)':
            data_file = problem_instance + "_cobra_ucb_loom_" + learner_info

        elif a == 'COBRA (TS)':
            data_file = problem_instance + "_cobra_ts_loom_" + learner_info
        
        else:
            raise RuntimeError('Learner not exist')

        # Load data
        all_data = np.load(file_location + data_file + ".npz")
        plot_data = all_data['algo_regret']

        # Scatter Error bar with scatter plot
        horizon, batched_regret, error = cumulative_regret_error(np.array(plot_data))
        plt.errorbar(horizon, batched_regret, error, color=colors[e])
        plt.plot(horizon, batched_regret, colors[e] + shape[e], label=a + " [$\eta$ = {}]".format(str(eta_values[e])))

    # Average regret plotting
    plot_file = problem_instance + "_eta{}_".format(len(eta_values)) + learner_info
    file_to_save = "results/" + plot_file + "_{}.png".format(a)

    # Plot details
    plt.rc('font', size=12)                     # controls default text sizes
    plt.legend(loc="upper right", numpoints=1)  # Location of the legend
    plt.xlabel("Rounds", fontsize=20)
    y_label = "Cumulative Regret"
    plt.ylabel(y_label, fontsize=20)
        
    # Saving plot
    plt.savefig(file_to_save, bbox_inches='tight', dpi=600)
    plt.close()


############ Ploting the average regret vs. eta ############
eta_noise_values = [0.1, 0.15, 0.2, 0.25, 0.35, 0.5]
# Fetching data from the files 
for a in algos:
    for e in range(len(eta_noise_values)):
        problem_instance = problem + "_{}_{}_{}_{}_{}_{}_{}".format(contexts, agents, arm_copies, dim, eta, eta_noise_values[e], seed)
        if a == 'COBRA (UCB)':
            data_file = problem_instance + "_cobra_ucb_loom_" + learner_info

        elif a == 'COBRA (TS)':
            data_file = problem_instance + "_cobra_ts_loom_" + learner_info
        
        else:
            raise RuntimeError('Learner not exist')

        # Load data
        all_data = np.load(file_location + data_file + ".npz")
        plot_data = all_data['algo_regret']

        # Scatter Error bar with scatter plot
        horizon, batched_regret, error = cumulative_regret_error(np.array(plot_data))
        plt.errorbar(horizon, batched_regret, error, color=colors[e])
        plt.plot(horizon, batched_regret, colors[e] + shape[e], label=a + " [$\epsilon_\eta$ = {}]".format(str(eta_noise_values[e])))

    # Average regret plotting
    plot_file = problem_instance + "_eta_noise{}_".format(len(eta_noise_values)) + learner_info
    file_to_save = "results/" + plot_file + "_{}.png".format(a)

    # Plot details
    plt.rc('font', size=12)                     # controls default text sizes
    plt.legend(loc="upper right", numpoints=1)  # Location of the legend
    plt.xlabel("Rounds", fontsize=20)
    y_label = "Cumulative Regret"
    plt.ylabel(y_label, fontsize=20)
        
    # Saving plot
    plt.savefig(file_to_save, bbox_inches='tight', dpi=600)
    plt.close()


############ Ploting the average regret vs. agents ############
agents_values = [5, 10, 15, 20, 25, 30]
# Fetching data from the files 
for a in algos:
    for e in range(len(agents_values)):
        problem_instance = problem + "_{}_{}_{}_{}_{}_{}_{}".format(contexts, agents_values[e], arm_copies, dim, eta, eta_noise, seed)
        if a == 'COBRA (UCB)':
            data_file = problem_instance + "_cobra_ucb_loom_" + learner_info

        elif a == 'COBRA (TS)':
            data_file = problem_instance + "_cobra_ts_loom_" + learner_info
        
        else:
            raise RuntimeError('Learner not exist')

        # Load data
        all_data = np.load(file_location + data_file + ".npz")
        plot_data = all_data['algo_regret']

        # Scatter Error bar with scatter plot
        horizon, batched_regret, error = cumulative_regret_error(np.array(plot_data))
        plt.errorbar(horizon, batched_regret, error, color=colors[e])
        plt.plot(horizon, batched_regret, colors[e] + shape[e], label=a + " [$N$ = {}]".format(str(agents_values[e])))

    # Average regret plotting
    plot_file = problem_instance + "_agents{}_".format(len(agents_values)) + learner_info
    file_to_save = "results/" + plot_file + "_{}.png".format(a)

    # Plot details
    plt.rc('font', size=12)                     # controls default text sizes
    plt.legend(loc="upper right", numpoints=1)  # Location of the legend
    plt.xlabel("Rounds", fontsize=20)
    y_label = "Cumulative Regret"
    plt.ylabel(y_label, fontsize=20)
        
    # Saving plot
    plt.savefig(file_to_save, bbox_inches='tight', dpi=600)
    plt.close()


############ Ploting the average regret vs. dimension ############
dim_values = [5, 10, 15, 20, 25, 30]
# Fetching data from the files 
for a in algos:
    for e in range(len(dim_values)):
        problem_instance = problem + "_{}_{}_{}_{}_{}_{}_{}".format(contexts, agents, arm_copies, dim_values[e], eta, eta_noise, seed)
        if a == 'COBRA (UCB)':
            data_file = problem_instance + "_cobra_ucb_loom_" + learner_info

        elif a == 'COBRA (TS)':
            data_file = problem_instance + "_cobra_ts_loom_" + learner_info
        
        else:
            raise RuntimeError('Learner not exist')

        # Load data
        all_data = np.load(file_location + data_file + ".npz")
        plot_data = all_data['algo_regret']

        # Scatter Error bar with scatter plot
        horizon, batched_regret, error = cumulative_regret_error(np.array(plot_data))
        plt.errorbar(horizon, batched_regret, error, color=colors[e])
        plt.plot(horizon, batched_regret, colors[e] + shape[e], label=a + " [$d$ = {}]".format(str(dim_values[e])))

    # Average regret plotting
    plot_file = problem_instance + "_dim{}_".format(len(dim_values)) + learner_info
    file_to_save = "results/" + plot_file + "_{}.png".format(a)

    # Plot details
    plt.rc('font', size=12)                     # controls default text sizes
    plt.legend(loc="upper right", numpoints=1)  # Location of the legend
    plt.xlabel("Rounds", fontsize=20)
    y_label = "Cumulative Regret"
    plt.ylabel(y_label, fontsize=20)
        
    # Saving plot
    plt.savefig(file_to_save, bbox_inches='tight', dpi=600)
    plt.close()

