#!/usr/bin/env python
# coding: utf-8

# Importing python packages
import numpy as np
import matplotlib.pyplot as plt
import scipy.stats as ss


# ### Plotting ###
# Getting Average regret and Confidence interval
def cumulative_regret_error(regret, num_batches=20):
    """Summarise cumulative regret across runs at evenly spaced rounds.

    The rounds are grouped into batches of ``samples // num_batches`` rounds
    (never fewer than one round per batch).  The cumulative regret of every
    run is read off at the end of each batch, plus once more at the final
    round when the last batch is only partially filled, and then averaged
    over the runs.

    Args:
        regret: 2-D array-like of shape ``(runs, samples)`` holding the
            per-round regret of each run.
        num_batches: Target number of batches the horizon is split into.
            Defaults to 20.

    Returns:
        A tuple ``(time_horizon, regret, conf_regret)`` of equal length:

        * ``time_horizon`` -- list of round indices, starting at 0 and
          ending at ``samples``.
        * ``regret`` -- ``numpy.ndarray`` with the mean (over runs)
          cumulative regret at each entry of ``time_horizon``.
        * ``conf_regret`` -- list of error-bar half-widths, computed as the
          0.95 quantile of Student's t with ``runs - 1`` degrees of freedom
          times the standard error of the mean over runs.

    Raises:
        ValueError: If ``regret`` is not two-dimensional or ``num_batches``
            is smaller than 1.
    """
    if num_batches < 1:
        raise ValueError("num_batches must be at least 1")

    regret = np.asarray(regret, dtype=float)
    if regret.ndim != 2:
        raise ValueError("regret must be a 2-D array of shape (runs, samples)")
    runs, samples = regret.shape

    # Integer batch size: a fractional size could never equal a whole number
    # of rounds, and a size of zero would never advance along the horizon.
    batch = max(1, samples // num_batches)

    # Round indices at which the cumulative regret is reported.
    time_horizon = list(range(0, samples + 1, batch))
    if time_horizon[-1] != samples:
        # Trailing partial batch: report the final round as well.
        time_horizon.append(samples)

    # Cumulative regret of each run, sampled at the end of every batch.
    # Column 0 stays zero (no regret before the first round).
    cumulative = np.cumsum(regret, axis=1)
    batch_ends = np.array(time_horizon[1:], dtype=int)
    batched_regret = np.zeros((runs, len(time_horizon)))
    batched_regret[:, 1:] = cumulative[:, batch_ends - 1]

    mean_regret = np.mean(batched_regret, axis=0)

    # Error bars: t quantile times the standard error across runs.
    freedom_degree = runs - 1
    t_quantile = ss.t.ppf(0.95, freedom_degree)
    conf_regret = list(t_quantile * ss.sem(batched_regret, axis=0))

    return time_horizon, mean_regret, conf_regret


# ### Plotting regret ###
# Experiment configuration.  These values are combined below into the names
# of the result files that are loaded and of the figures that are written.
regret_types = ['average', 'weak']
file_location = "data/plots/"
problem = "square"      # one of: "linear", "levy", "cosine", "square", "ackley"
learner_udpate = 1
lamdba = 1.0
nu = 1.0
runs = 20
algos = [
    'NeuralDB-UCB',
    'NeuralDB-TS',
]
algos_in_plots = [
    'NDB-UCB',
    'NDB-TS'
]

arms = [5, 10, 15, 20, 25]

# Colour and line/marker style of each curve, indexed by position in `arms`.
colors = list("gbcmrykbcmrykg")
shape = ['--^', '--v', '--+', '--H', '--d', '--*', '--v', '--^', '--v', '--*', '--+', '--d', '--H', '--v']

# Part of the data file name that identifies each supported learner.
learner_file_tags = {
    'LinDB-UCB': "_linear_ucb_",
    'LinDB-TS': "_linear_ts_",
    'NeuralDB-UCB': "_neural_ucb_False_",
    'NeuralDB-TS': "_neural_ts_False_",
}

# One figure per (regret type, algorithm); one curve per number of arms.
for regret_type in regret_types:
    for alg, algo_in_plot in zip(algos, algos_in_plots):
        for curve_idx, k in enumerate(arms):
            problem_instance = f"{problem}_5_{k}_1000_0.1_0.0_1"
            learner_info = f"{lamdba}_{nu}_{learner_udpate}_{runs}"

            learner_tag = learner_file_tags.get(alg)
            if learner_tag is None:
                raise RuntimeError('Learner not exist')
            data_file = problem_instance + learner_tag + learner_info

            # Load the stored regret of this configuration.
            all_data = np.load(file_location + data_file + ".npz")
            algo_regret = all_data[f"{regret_type}_regret"]

            # Mean curve with error bars, drawn in this curve's colour/style.
            horizon, batched_regret, error = cumulative_regret_error(np.array(algo_regret))
            curve_color = colors[curve_idx]
            curve_label = rf"{algo_in_plot} ($K$ = {k})"
            plt.errorbar(horizon, batched_regret, error, color=curve_color)
            plt.plot(horizon, batched_regret, curve_color + shape[curve_idx], label=curve_label)

        # The figure is written to the current working directory.  The name
        # reuses `problem_instance` as left by the last entry of `arms`.
        file_to_save = f"{problem_instance}_{alg}_{regret_type}_arms.png"

        # Plot details
        plt.rc('font', size=12)                     # default text size
        plt.legend(loc="upper left", numpoints=1)   # legend placement
        plt.xlabel("Rounds", fontsize=20)
        plt.ylabel(f"Cumulative Regret ({regret_type})", fontsize=18)

        # Save the figure and start the next one from a clean state.
        plt.savefig(file_to_save, bbox_inches='tight', dpi=600)
        plt.close()