import numpy as np
import matplotlib.pyplot as plt
import pandas as pd
from scipy.optimize import linear_sum_assignment
from scipy.stats import kendalltau
from scipy.spatial.distance import pdist, sqeuclidean, euclidean, squareform, cdist
from scipy.linalg import eigh # For symmetric matrix eigenvalues/vectors
from scipy.sparse import lil_matrix, csr_matrix, vstack as sp_vstack
from scipy.sparse.linalg import lsqr # Solver for sparse least squares
import pprint
import time

N_POINTS_LIST = np.array([500, 1000, 3000])
NOISE_STD_LIST = np.array(0.05*np.arange(1, 11))
N_RUNS = 10
results = {}
algs = ["fiedler", "UMAP", "t_SNE", "spectral_lin_reg", "spectral_order"]


for alg in algs:
    results[alg] = {}
    for N_POINTS in N_POINTS_LIST:
        results[alg][N_POINTS] = {}
        filename = "{0}_N_{1}_NOISE_{2}_v3.txt"
        for NOISE_STD in NOISE_STD_LIST:
            true_order_indices = np.loadtxt(filename.format("true_labels", N_POINTS, NOISE_STD))
            taus = np.empty(N_RUNS)
            recovered_order_indices = np.loadtxt(filename.format(alg, N_POINTS, NOISE_STD))
            for i in np.arange(N_RUNS):
                taus[i], _ = np.abs(kendalltau(true_order_indices[i, :], recovered_order_indices[i, :]))
            results[alg][N_POINTS][NOISE_STD] = {"mean": np.mean(taus), "sd": np.std(taus), "min": np.min(taus), "max": np.max(taus)}

res  = {NOISE_STD: np.empty((len(algs), len(N_POINTS_LIST))) for NOISE_STD in NOISE_STD_LIST}
for alg in algs:
    df = pd.DataFrame(index = N_POINTS_LIST, columns = NOISE_STD_LIST)
    for N_POINTS in N_POINTS_LIST:
        for NOISE_STD in NOISE_STD_LIST:
            df.loc[[N_POINTS],[NOISE_STD]] = "{} ({})".format(round(results[alg][N_POINTS][NOISE_STD]["mean"]*100, 2), round(results[alg][N_POINTS][NOISE_STD]["sd"]*100, 2))
    print("Algorithm: ", alg)
    print(df)

for NOISE_STD in NOISE_STD_LIST:
    for i in np.arange(len(algs)):
        for j in np.arange(len(N_POINTS_LIST)):
            res[NOISE_STD][i, j] = results[algs[i]][N_POINTS_LIST[j]][NOISE_STD]["mean"]
for NOISE_STD in NOISE_STD_LIST:
    fig, ax = plt.subplots()
    ax.set_ylabel("Kendall's Tau")
    ax.set_xlabel("Sample Size")
    ax.set_ylim(0, 1)
    for i in np.arange(len(algs)):
        plt.plot(N_POINTS_LIST, res[NOISE_STD][i,], label = algs[i], marker = "o")
    plt.title("Kendall Tau with $\sigma$ = {}".format(round(NOISE_STD, 2)))
    plt.legend()
    plt.savefig("Kendall_tau_sigma_{}.png".format(str(round(NOISE_STD, 2))))
    


