import numpy as np
from numpy import *
import matplotlib.pyplot as plt
from tqdm import tqdm
import matplotlib
import datetime
import torch



from decentralize import Decentralized
from decentralizeOPT import DecentralizeOPT
from decentralizeOPTN2 import DecentralizeOPTN2


# Beta = [-3,-2,-1,0,10,100,1000]
# Size = [5,10,15,20]




horizon = 100000
trials = 50


# beta = -3
# N = 5

# market = np.load('./Markets/beta_'+str(beta)+'N_'+str(N)+'.npz')
# num_players = N
# num_arms = N
# player_ranking = market['player_rank'].tolist()
# arm_ranking = market['arm_rank'].tolist()
# player_mean = market['player_mean'].tolist()


# test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# test.run_ETC(h=150, Beta=beta)

# test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# test.run_ETC(h=100, Beta=beta)

# test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# test.run_ETC(h=200, Beta=beta)



# # test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# # test.run_CA(alg='TS', Beta = beta)


# # test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# # test.run_CA(alg='UCB', Beta = beta)


# # test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# # test.run_phasedETC(Beta=beta)





# beta = -3
# N = 10

# market = np.load('./Markets/beta_'+str(beta)+'N_'+str(N)+'.npz')
# num_players = N
# num_arms = N
# player_ranking = market['player_rank'].tolist()
# arm_ranking = market['arm_rank'].tolist()
# player_mean = market['player_mean'].tolist()


# test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# test.run_ETC(h=150, Beta=beta)

# test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# test.run_ETC(h=100, Beta=beta)

# test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# test.run_ETC(h=200, Beta=beta)


# # test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# # test.run_CA(alg='TS', Beta = beta)


# # test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# # test.run_CA(alg='UCB', Beta = beta)


# test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# test.run_phasedETC(Beta=beta)






# beta = -3
# N = 15

# market = np.load('./Markets/beta_'+str(beta)+'N_'+str(N)+'.npz')
# num_players = N
# num_arms = N
# player_ranking = market['player_rank'].tolist()
# arm_ranking = market['arm_rank'].tolist()
# player_mean = market['player_mean'].tolist()


# test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# test.run_ETC(h=150, Beta=beta)

# test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# test.run_ETC(h=100, Beta=beta)

# test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# test.run_ETC(h=200, Beta=beta)


# # test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# # test.run_CA(alg='TS', Beta = beta)


# # test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# # test.run_CA(alg='UCB', Beta = beta)


# test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# test.run_phasedETC(Beta=beta)



# beta -5,-6,-7

# beta = -8
# N = 10

# market = np.load('./Markets/beta_'+str(beta)+'N_'+str(N)+'.npz')
# num_players = N
# num_arms = N
# player_ranking = market['player_rank'].tolist()
# arm_ranking = market['arm_rank'].tolist()
# player_mean = market['player_mean'].tolist()


# test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# test.run_ETC(h=200, Beta=beta)

# test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# test.run_phasedETC(Beta=beta)


# test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# test.run_CA(alg='TS', Beta = beta)


# test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# test.run_CA(alg='UCB', Beta = beta)









# test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# test.run_ETC(h=100, Beta=beta)

# test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# test.run_ETC(h=200, Beta=beta)

# test = Decentralized(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# test.run_ETC(h=400, Beta=beta)



# beta=-1,N=5 #指比较ETGS 和 phasedETC的 (5 player; 5 arm)
# beta=K10,N=3 #指比较ETGS, ADA, 和 phasedETC的 (3 player ; 10 arm)


beta = 'K10'
N = 3

market = np.load('./Markets/beta_'+str(beta)+'N_'+str(N)+'.npz')
# num_players = N
# num_arms = N
player_ranking = market['player_rank'].tolist()
arm_ranking = market['arm_rank'].tolist()
player_mean = market['player_mean'].tolist()



# test = DecentralizeOPT(horizon = horizon, trial=trials,  num_player=num_players, num_arm=num_arms, player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# test.run_ETGS(Beta=beta)


# test = DecentralizeOPT(horizon = horizon, trial=trials,  num_player=len(player_ranking), num_arm=len(arm_ranking), player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# test.run_phasedETC(Beta=beta)


test = DecentralizeOPTN2(horizon = horizon, trial=trials,  num_player=len(player_ranking), num_arm=len(arm_ranking), player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
test.run_MLETC(Beta=beta)
# test.run_ETGS(Beta=beta)


# test = DecentralizeOPTN2(horizon = horizon, trial=trials,  num_player=len(player_ranking), num_arm=len(arm_ranking), player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# test.run_ETGS(Beta=beta)


# test = DecentralizeOPTN2(horizon = horizon, trial=trials,  num_player=len(player_ranking), num_arm=len(arm_ranking), player_ranking=player_ranking, arm_ranking=arm_ranking, player_mean=player_mean)
# test.run_adaptiveGS(Beta=beta)