# !/usr/bin/env python
# coding: utf-8

# Importing python packages
import numpy as np
from tqdm import tqdm
import matplotlib.pyplot as plt
import os.path

import warnings
warnings.filterwarnings("ignore")

# Plotting functions
from plotting_functions import average_plotting_x_axis

# Environment
from environment import problem_instance_fixed

# Online fair division algorithms
from learners import ofd_linear
from learners import ofd_uniform


# Comparing characterstics of algorithms for different rho values
def compare_algorithms_rho(algorithm_parameters, R, save_regret_data):
    # Different algorithms and weights
    algos       = ['OFD-Uniform', 'OFD-Greedy', 'OFD-UCB', 'OFD-TS'] 
    rho_values  = [0, 0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.75, 0.8, 0.82, 0.84, 0.86, 0.88, 0.9, 0.92, 0.94, 0.96, 0.98, 1.0]
    rho_values  = [0, 0.1, 0.2, 0.4, 0.6, 0.8, 0.85, 0.88, 0.89, 0.9, 0.91, 0.92, 0.93, 0.94, 0.95, 0.96, 0.97, 0.98, 0.99, 1.0]

    # File to save or read
    agents  = len(algorithm_parameters[0][0])
    items   = len(algorithm_parameters[0]) - agents
    dim     = algorithm_parameters[2]
    file_name = F"rho2_{items}_{agents}_{dim}_{rho}_{R}"
    path_to_file = "results/data/{}.npz".format(file_name)
    
    if os.path.exists(path_to_file):
        # Loading existing regret data
        load_data = np.load(path_to_file)    
        overall_regret = load_data['overall_regret']
        overall_total_utility = load_data['overall_total_utility']
        overall_gini_coefficient = load_data['overall_gini_coefficient']
        overall_min_total_utility_ratio = load_data['overall_min_total_utility_ratio']
        
    else:
        overall_regret = []
        overall_total_utility = []
        overall_gini_coefficient = []
        overall_min_total_utility_ratio = []
        
        for alg in algos:
            cases = len(rho_values)            
            algos_regret = []
            algos_total_utility = []
            algos_gini_coefficient = []
            algos_min_total_utility_ratio = []
            print(F"Running for algorithm: {alg}")
            for _ in tqdm(range(R)):
                run_regret = []
                run_total_utility = []
                run_gini_coefficient = []
                run_min_total_utility_ratio = []

                for c in range(cases):
                    # print(F"Running for algorithm: {alg} with rho value {rho_values[c]}")
                    algorithm_parameters[8] = np.array([(rho_values[c]**a) for a in range(agents)])
                    if alg == 'OFD-Uniform':
                        iter_regret, all_stats = ofd_uniform(algorithm_parameters)
                    
                    elif alg == 'OFD-Greedy':
                        iter_regret, all_stats = ofd_linear(algorithm_parameters, strategy='greedy')
                        
                    elif alg == 'OFD-UCB':
                        iter_regret, all_stats = ofd_linear(algorithm_parameters, strategy='ucb')

                    elif alg == 'OFD-TS':
                        iter_regret, all_stats = ofd_linear(algorithm_parameters, strategy='ts')
                            
                    run_regret.append(sum(iter_regret))
                    run_total_utility.append(all_stats[0][-1])
                    run_gini_coefficient.append(all_stats[1][-1])
                    run_min_total_utility_ratio.append(all_stats[2][-1])
                    
                algos_regret.append(run_regret)
                algos_total_utility.append(run_total_utility)
                algos_gini_coefficient.append(run_gini_coefficient)
                algos_min_total_utility_ratio.append(run_min_total_utility_ratio)
            
            overall_regret.append(algos_regret)
            overall_total_utility.append(algos_total_utility)
            overall_gini_coefficient.append(algos_gini_coefficient)
            overall_min_total_utility_ratio.append(algos_min_total_utility_ratio)
            
        # Save regret data
        if save_regret_data:
            np.savez(path_to_file,
                    overall_regret = overall_regret,
                    overall_total_utility = overall_total_utility,
                    overall_gini_coefficient = overall_gini_coefficient,
                    overall_min_total_utility_ratio = overall_min_total_utility_ratio
                )        

    # ### Plotting Regret ###
    file_to_save = "results/plots/{}_regret.png".format(file_name)
    x_label = r'Values of $\rho$'
    y_label = "Cumulative Regret"
    # print (overall_regret)
    average_plotting_x_axis(overall_regret, rho_values, algos, file_to_save, 'upper right', runs, x_label=x_label, y_label=y_label)
    
    # ### Plotting Total Utility ###
    file_to_save = "results/plots/{}_total_utility.png".format(file_name)
    y_label = "Total Utility"
    average_plotting_x_axis(overall_total_utility, rho_values, algos, file_to_save, 'upper left', runs, x_label=x_label, y_label=y_label)
    
    # ### Plotting Gini Coefficient ###
    file_to_save = "results/plots/{}_gini_coefficient.png".format(file_name)
    y_label = "Gini Coefficient"
    average_plotting_x_axis(overall_gini_coefficient, rho_values, algos, file_to_save, 'upper left', runs, x_label=x_label, y_label=y_label)
    
    # ### Plotting ratio between minimum utility and total utility ###
    file_to_save = "results/plots/{}_min_total_utility_ratio.png".format(file_name)
    y_label = "Minimum Utility/Total Utility"
    average_plotting_x_axis(overall_min_total_utility_ratio, rho_values, algos, file_to_save, 'lower left', runs, x_label=x_label, y_label=y_label)
        
    
# ########################### Bandit problem ###########################
# ### Problem Instance ###
d           = 20
items       = 1000
item_copies = 1
agents      = 10
rho         = 0.85  # 0: Max-min <= rho <= 1: Efficiency
runs        = 20

# Initializing the problem instance
np.random.seed(0)
save_data = True

# Varying value of rho
algorithm_parameters = problem_instance_fixed(d, items, item_copies, agents, rho)
compare_algorithms_rho(algorithm_parameters, runs, save_data)
