# -*- coding: utf-8 -*-
"""
Created on Fri Sep 15 09:13:47 2023

@author: xiato
"""

# -*- coding: utf-8 -*-
"""
Created on Sat Sep  2 16:42:19 2023

@author: xiatong

For introduction and feature analysis 
"""
import seaborn as sns
sns.set_theme(style="ticks")


import numpy as np
import pandas as pd

import numpy as np
import matplotlib.pyplot as plt
from sklearn.manifold import TSNE
from sklearn.datasets import load_digits
from sklearn.preprocessing import StandardScaler
from sklearn.decomposition import PCA

from sklearn.metrics import silhouette_score, davies_bouldin_score

import pandas as pd

plt.figure(dpi=300, figsize=(5,2))

 
X = ['Initial','$|\mathcal{D}_k|=5000$','$|\mathcal{D}_k|=100$','$|\mathcal{D}_k|=100+1000$']
D1 = [0,1.4,0.79,2.6]
D2 = [0, 3.2, 6.0, 4.6]
D3 = [4.8, 3.2, 5.9, 4.5]
  
X_axis = np.array([-0.5,0.5, 1.5,2.5])
  
plt.bar(X_axis - 0.2, D1, 0.2, label = 'Local model (training set)')
plt.bar(X_axis, D2, 0.2, label = 'Local model (testing set)')
plt.bar(X_axis + 0.2, D3, 0.2, label = 'Global model (testing set)')
  
plt.xticks(X_axis, X,  size=10)
plt.ylabel("DB")
plt.xlim([-0.6,2.9])
plt.legend(loc='lower right', bbox_to_anchor=(1,1))
plt.show()



# ###########
# test_fea = np.load('logs_all//features//FedAvg_IID_500_global//0_test_feature.npy')
# test_label = np.load('logs_all//features//FedAvg_IID_500_global//0_test_label.npy' )
 
# for i in range(1,100):
#       test_ = np.load('logs_all//features//FedAvg_IID_500_global//' + str(i) + '_test_feature.npy')
#       test_l = np.load('logs_all//features//FedAvg_IID_500_global//' + str(i) + '_test_label.npy' )
#       test_fea = np.concatenate((test_fea,test_)) 
#       test_label = np.concatenate((test_label,test_l)) 

 
# ss = davies_bouldin_score(test_fea, test_label)
# print(ss)


  
# data = test_fea 
# n = 0

# # Create a scatter plot of the t-SNE results
# plt.figure(figsize=(3,2), dpi=300)

# data = StandardScaler().fit_transform(data)
# tsne = TSNE(n_components=2, random_state=0)
# tsne_result = tsne.fit_transform(data)

# tsne = TSNE(n_components=2, random_state=0)
# tsne_test = tsne.fit_transform(test_fea)
 
# # pca = PCA(n_components=2, random_state=0)
# # tsne_test = pca.fit_transform(test_fea)

# plt.scatter(tsne_result[n:, 0], tsne_result[n:, 1], c=test_label, cmap=plt.cm.get_cmap("jet", 10), alpha = 0.3, s=8, linewidths=0)

# #plt.scatter(tsne_result[:n, 0], tsne_result[:n, 1], c=train_label, cmap=plt.cm.get_cmap("jet", 10), linewidths = 0.5, edgecolors='black', s=8)
 
# #plt.scatter(tsne_result[:n, 0], tsne_result[:n, 1], c=train_label, cmap=plt.cm.get_cmap("jet", 10), linewidths = 1, edgecolors='black')


# # plt.xlim([-15,15])
# # plt.ylim([-10,10])
# plt.xticks([])
# plt.yticks([])
# plt.show()


# ###########
# test_fea = np.load('logs_all//features//FedAvg_IID_100_3//0_test_feature.npy')
# test_label = np.load('logs_all//features//FedAvg_IID_100_3//0_test_label.npy' )
 
# for i in range(1,100):
#       test_ = np.load('logs_all//features//FedAvg_IID_100_3//' + str(i) + '_test_feature.npy')
#       test_l = np.load('logs_all//features//FedAvg_IID_100_3//' + str(i) + '_test_label.npy' )
#       test_fea = np.concatenate((test_fea,test_)) 
#       test_label = np.concatenate((test_label,test_l)) 

 
# ss = davies_bouldin_score(test_fea, test_label)
# print(ss)


  
# data = test_fea 
# n = 0

# # Create a scatter plot of the t-SNE results
# plt.figure(figsize=(3,2), dpi=300)

# data = StandardScaler().fit_transform(data)
# tsne = TSNE(n_components=2, random_state=0)
# tsne_result = tsne.fit_transform(data)

# tsne = TSNE(n_components=2, random_state=0)
# tsne_test = tsne.fit_transform(test_fea)
 
# # pca = PCA(n_components=2, random_state=0)
# # tsne_test = pca.fit_transform(test_fea)

# plt.scatter(tsne_result[n:, 0], tsne_result[n:, 1], c=test_label, cmap=plt.cm.get_cmap("jet", 10), alpha = 0.3, s=8, linewidths=0)

# #plt.scatter(tsne_result[:n, 0], tsne_result[:n, 1], c=train_label, cmap=plt.cm.get_cmap("jet", 10), linewidths = 0.5, edgecolors='black', s=8)
 
# #plt.scatter(tsne_result[:n, 0], tsne_result[:n, 1], c=train_label, cmap=plt.cm.get_cmap("jet", 10), linewidths = 1, edgecolors='black')


# # plt.xlim([-15,15])
# # plt.ylim([-10,10])
# plt.xticks([])
# plt.yticks([])
# plt.show()



# ###########
# test_fea = np.load('logs_all//features//FedAvg_global//0_test_feature.npy')
# test_label = np.load('logs_all//features//FedAvg_global//0_test_label.npy' )
 
# for i in range(1,100):
#       test_ = np.load('logs_all//features//FedAvg_global//' + str(i) + '_test_feature.npy')
#       test_l = np.load('logs_all//features//FedAvg_global//' + str(i) + '_test_label.npy' )
#       test_fea = np.concatenate((test_fea,test_)) 
#       test_label = np.concatenate((test_label,test_l)) 

 
# ss = davies_bouldin_score(test_fea, test_label)
# print(ss)


  
# data = test_fea 
# n = 0

# # Create a scatter plot of the t-SNE results
# plt.figure(figsize=(3,2), dpi=300)

# data = StandardScaler().fit_transform(data)
# tsne = TSNE(n_components=2, random_state=0)
# tsne_result = tsne.fit_transform(data)

# tsne = TSNE(n_components=2, random_state=0)
# tsne_test = tsne.fit_transform(test_fea)
 
# # pca = PCA(n_components=2, random_state=0)
# # tsne_test = pca.fit_transform(test_fea)

# plt.scatter(tsne_result[n:, 0], tsne_result[n:, 1], c=test_label, cmap=plt.cm.get_cmap("jet", 10), alpha = 0.3, s=8, linewidths=0)

# #plt.scatter(tsne_result[:n, 0], tsne_result[:n, 1], c=train_label, cmap=plt.cm.get_cmap("jet", 10), linewidths = 0.5, edgecolors='black', s=8)
 
# #plt.scatter(tsne_result[:n, 0], tsne_result[:n, 1], c=train_label, cmap=plt.cm.get_cmap("jet", 10), linewidths = 1, edgecolors='black')


# # plt.xlim([-15,15])
# # plt.ylim([-10,10])
# plt.xticks([])
# plt.yticks([])
# plt.show()


# ###########
# test_fea = np.load('logs_all//features//FedAvg_IID_10_global//0_test_feature.npy')
# test_label = np.load('logs_all//features//FedAvg_IID_10_global//0_test_label.npy' )
 
# for i in range(1,100):
#       test_ = np.load('logs_all//features//FedAvg_IID_10_global//' + str(i) + '_test_feature.npy')
#       test_l = np.load('logs_all//features//FedAvg_IID_10_global//' + str(i) + '_test_label.npy' )
#       test_fea = np.concatenate((test_fea,test_)) 
#       test_label = np.concatenate((test_label,test_l)) 

 
# ss = davies_bouldin_score(test_fea, test_label)
# print(ss)


  
# data = test_fea 
# n = 0

# # Create a scatter plot of the t-SNE results
# plt.figure(figsize=(3,2), dpi=300)

# data = StandardScaler().fit_transform(data)
# tsne = TSNE(n_components=2, random_state=10)
# tsne_result = tsne.fit_transform(data)


# plt.scatter(tsne_result[n:, 0], tsne_result[n:, 1], c=test_label, cmap=plt.cm.get_cmap("jet", 10), alpha = 0.3, s=8, linewidths=0)

# #plt.scatter(tsne_result[:n, 0], tsne_result[:n, 1], c=train_label, cmap=plt.cm.get_cmap("jet", 10), linewidths = 0.5, edgecolors='black', s=8)
 
# #plt.scatter(tsne_result[:n, 0], tsne_result[:n, 1], c=train_label, cmap=plt.cm.get_cmap("jet", 10), linewidths = 1, edgecolors='black')


# # plt.xlim([-15,15])
# # plt.ylim([-10,10])
# plt.xticks([])
# plt.yticks([])
# plt.show()

# # ###############################

# ### training data, 64 x 8
# train_fea = np.load('logs_all//features//FedAvg_IID_10//0_train_feature.npy')
# train_label = np.load('logs_all//features//FedAvg_IID_10//0_train_label.npy' )


# for i in range(1,79):
#       test_ = np.load('logs_all//features//FedAvg_IID_10//' + str(i) + '_train_feature.npy')
#       test_l = np.load('logs_all//features//FedAvg_IID_10//' + str(i) + '_train_label.npy' )
#       train_fea = np.concatenate((train_fea,test_)) 
#       train_label = np.concatenate((train_label,test_l)) 

 

# n = len(train_fea)
 

# test_fea = np.load('logs_all//features//FedAvg_IID_10//0_test_feature.npy')
# test_label = np.load('logs_all//features//FedAvg_IID_10//0_test_label.npy' )
 
# for i in range(1,100):
#       test_ = np.load('logs_all//features//FedAvg_IID_10//' + str(i) + '_test_feature.npy')
#       test_l = np.load('logs_all//features//FedAvg_IID_10//' + str(i) + '_test_label.npy' )
#       test_fea = np.concatenate((test_fea,test_)) 
#       test_label = np.concatenate((test_label,test_l)) 



# ss = davies_bouldin_score(train_fea, train_label)
# print(ss)

# ss = davies_bouldin_score(test_fea, test_label)
# print(ss)


  
# data = np.concatenate((train_fea,test_fea)) 


# # Create a scatter plot of the t-SNE results
# plt.figure(figsize=(3,2), dpi=300)

# data = StandardScaler().fit_transform(data)
# tsne = TSNE(n_components=2, random_state=0)
# tsne_result = tsne.fit_transform(data)

# tsne = TSNE(n_components=2, random_state=0)
# tsne_test = tsne.fit_transform(test_fea)
 
# # pca = PCA(n_components=2, random_state=0)
# # tsne_test = pca.fit_transform(test_fea)

# #plt.scatter(tsne_result[n:, 0], tsne_result[n:, 1], c=test_label, cmap=plt.cm.get_cmap("jet", 10), alpha = 0.3, s=8, linewidths=0)

# #plt.scatter(tsne_result[:n, 0], tsne_result[:n, 1], c=train_label, cmap=plt.cm.get_cmap("jet", 10), alpha = 0.3, s=8, linewidths=0)
# plt.scatter(tsne_result[n:, 0], tsne_result[n:, 1], c=test_label, cmap=plt.cm.get_cmap("jet", 10), linewidths = 0.5, edgecolors='black', s=8)
# #plt.scatter(tsne_result[:n, 0], tsne_result[:n, 1], c=train_label, cmap=plt.cm.get_cmap("jet", 10), linewidths = 0.5, edgecolors='black', s=8)
 
# #plt.scatter(tsne_result[:n, 0], tsne_result[:n, 1], c=train_label, cmap=plt.cm.get_cmap("jet", 10), linewidths = 1, edgecolors='black')


# # plt.xlim([-15,15])
# # plt.ylim([-10,10])
# plt.xticks([])
# plt.yticks([])
# plt.show()



# #################################################################

# ### training data, 64 x 8
# train_fea = np.load('logs_all//features//FedAvg_IID_100_2//0_train_feature.npy')
# train_label = np.load('logs_all//features//FedAvg_IID_100_2//0_train_label.npy' )

# for i in range(1,2):
#      test_ = np.load('logs_all//features//FedAvg_IID_100_2//' + str(i) + '_train_feature.npy')
#      test_l = np.load('logs_all//features//FedAvg_IID_100_2//' + str(i) + '_train_label.npy' )
#      train_fea = np.concatenate((train_fea,test_)) 
#      train_label = np.concatenate((train_label,test_l)) 
# n = len(train_fea)  

# train_fea2 = np.load('logs_all//features//FedAvg_IID_100_2//1_train_feature.npy')
# train_label2 = np.load('logs_all//features//FedAvg_IID_100_2//1_train_label.npy' )


# for i in range(3,79):
#       test_ = np.load('logs_all//features//FedAvg_IID_100_2//' + str(i) + '_train_feature.npy')
#       test_l = np.load('logs_all//features//FedAvg_IID_100_2//' + str(i) + '_train_label.npy' )
#       train_fea2 = np.concatenate((train_fea2,test_)) 
#       train_label2 = np.concatenate((train_label2,test_l)) 

 

# n = len(train_fea)



# test_fea = np.load('logs_all//features//FedAvg_IID_100_2//0_test_feature.npy')
# test_label = np.load('logs_all//features//FedAvg_IID_100_2//0_test_label.npy' )
 
# for i in range(1,100):
#       test_ = np.load('logs_all//features//FedAvg_IID_100_2//' + str(i) + '_test_feature.npy')
#       test_l = np.load('logs_all//features//FedAvg_IID_100_2//' + str(i) + '_test_label.npy' )
#       test_fea = np.concatenate((test_fea,test_)) 
#       test_label = np.concatenate((test_label,test_l)) 

# n2 = n + len(train_fea2)

# ss = davies_bouldin_score(train_fea, train_label)
# print(ss)

# ss = davies_bouldin_score(test_fea, test_label)
# print(ss)


  
# data = np.concatenate((train_fea,train_fea2,test_fea)) 


# # Create a scatter plot of the t-SNE results
# plt.figure(figsize=(3,2), dpi=300)

# data = StandardScaler().fit_transform(data)
# tsne = TSNE(n_components=2, random_state=1)
# tsne_result = tsne.fit_transform(data)

# # pca = PCA(n_components=2, random_state=0)
# # tsne_test = pca.fit_transform(test_fea)

# #plt.scatter(tsne_result[n2:, 0], tsne_result[n2:, 1], c=test_label, cmap=plt.cm.get_cmap("jet", 10), alpha = 0.3, s=8, linewidths=0)

# plt.scatter(tsne_result[n:n2, 0], tsne_result[n:n2, 1], c=train_label2, cmap=plt.cm.get_cmap("jet", 10),linewidths = 0.1, edgecolors='gray', s=8,alpha = 0.6)
# plt.scatter(tsne_result[:n, 0], tsne_result[:n, 1], c=train_label, cmap=plt.cm.get_cmap("jet", 10), linewidths = 0.5, edgecolors='black', s=8)



# # plt.xlim([-15,15])
# # plt.ylim([-10,10])
# plt.xticks([])
# plt.yticks([])
# plt.show()

# # ############################################################################################
# ### training data, 64 x 8
# train_fea = np.load('logs_all//features//FedAvg_IID_500//0_train_feature.npy')
# train_label = np.load('logs_all//features//FedAvg_IID_500//0_train_label.npy' )

# for i in range(1,2):
#       test_ = np.load('logs_all//features//FedAvg_IID_500//' + str(i) + '_train_feature.npy')
#       test_l = np.load('logs_all//features//FedAvg_IID_500//' + str(i) + '_train_label.npy' )
#       train_fea = np.concatenate((train_fea,test_)) 
#       train_label = np.concatenate((train_label,test_l)) 


# n = len(train_fea)
 

# test_fea = np.load('logs_all//features//FedAvg_IID_500//0_test_feature.npy')
# test_label = np.load('logs_all//features//FedAvg_IID_500//0_test_label.npy' )
 
# for i in range(1,100):
#       test_ = np.load('logs_all//features//FedAvg_IID_500//' + str(i) + '_test_feature.npy')
#       test_l = np.load('logs_all//features//FedAvg_IID_500//' + str(i) + '_test_label.npy' )
#       test_fea = np.concatenate((test_fea,test_)) 
#       test_label = np.concatenate((test_label,test_l)) 



# ss = davies_bouldin_score(train_fea, train_label)
# print(ss)

# ss = davies_bouldin_score(test_fea, test_label)
# print(ss)


  
# data = np.concatenate((train_fea,test_fea)) 


# # Create a scatter plot of the t-SNE results
# plt.figure(figsize=(3,2), dpi=300)

# data = StandardScaler().fit_transform(data)
# tsne = TSNE(n_components=2, random_state=0)
# tsne_result = tsne.fit_transform(data)

# tsne = TSNE(n_components=2, random_state=0)
# tsne_test = tsne.fit_transform(test_fea)
 
# # pca = PCA(n_components=2, random_state=0)
# # tsne_test = pca.fit_transform(test_fea)

# #plt.scatter(tsne_result[n:, 0], tsne_result[n:, 1], c=test_label, cmap=plt.cm.get_cmap("jet", 10), alpha = 0.3, s=8, linewidths=0)

# #plt.scatter(tsne_result[:n, 0], tsne_result[:n, 1], c=train_label, cmap=plt.cm.get_cmap("jet", 10), linewidths = 0.5, edgecolors='black', s=8)
 
# plt.scatter(tsne_result[:n, 0], tsne_result[:n, 1], c=train_label, cmap=plt.cm.get_cmap("jet", 10), linewidths = 1, edgecolors='black', s=10)


# # plt.xlim([-15,15])
# # plt.ylim([-10,10])
# plt.xticks([])
# plt.yticks([])
# plt.show()