import random
import torch
import time
from flwr.common import parameters_to_ndarrays
from flwr.server.strategy.aggregate import aggregate
from datetime import datetime
from fedproto_local import local_train
from FedVTC import get_local_test_acc
from hyper_params import Z_Dim, CLASSES, DEVICE
from util import get_parameters
from resnet import build_model

# Default federation size: total number of clients ...
Num_clients = 100
# ... and how many of them are sampled to train in each round.
Num_participants = 10
# Default number of global communication rounds.
ROUNDS = 100

def run_Fedproto(M=Num_clients, P=Num_participants, R=ROUNDS, Device=DEVICE, seed=2024, lr=1e-4, local_epoch=5, Batch=16):
    """Run the FedProto training loop and write the evaluation accuracies to disk.

    Every client keeps its own model parameters. In each round ``P`` of the
    ``M`` clients are sampled and trained with ``local_train``; the per-class
    prototypes they report are combined with ``aggregate`` (weighted by the
    per-class counts the client reports) into the global prototypes that are
    handed to the clients from the second round on. Every 10th round all ``M``
    local models are evaluated with ``get_local_test_acc`` and the mean
    accuracy is recorded.

    Args:
        M: Total number of clients; client ids are ``0 .. M-1``.
        P: Number of clients sampled (without replacement) per round.
        R: Number of global rounds.
        Device: Device used for the global prototypes and forwarded to
            ``build_model`` / ``get_local_test_acc``.
        seed: Seed for Python's ``random`` module (drives client sampling).
            The torch RNG is not seeded here.
        lr: Forwarded to ``local_train`` as ``learning_rate``.
        local_epoch: Forwarded to ``local_train`` as ``E``.
        Batch: Forwarded to ``local_train`` as ``Btc``.

    Returns:
        None. The recorded mean accuracies are written, one per line, to
        ``results/Fedproto_accuracies_alpha0.1_<timestamp>.txt``.

    Raises:
        ValueError: From ``random.sample`` if ``P`` is larger than ``M``.
    """
    import os  # function-scope import: only needed to guarantee the output folder exists

    # Create the output folder up front so that a missing directory cannot
    # make the final write fail after all rounds have already been trained.
    os.makedirs('results', exist_ok=True)

    # Initialization:
    time0 = time.time()
    random.seed(seed)
    test_accuracies = []

    # One random prototype per class; these are replaced class by class as
    # soon as clients report real prototypes.
    global_protos = {
        label: torch.randn(Z_Dim, device=Device, requires_grad=False)
        for label in range(CLASSES)
    }

    # Keep only the extracted parameters of each freshly built local model;
    # the model object itself is dropped right away.
    local_params = {}
    for cid in range(M):
        local_params[cid] = get_parameters(build_model(cid, device=Device))

    # Start FL global iteration:
    for i in range(R):

        # Fit:
        print(f"Starting FL Round {i+1}......\n")

        clients = random.sample(list(range(M)), k=P)
        # label -> list of (prototype as ndarray, weight) pairs, one per reporting client
        proto_average = {}

        # The global prototypes are only passed from the second round on; in
        # round 0 local_train is called without ``proto_Z``.
        train_kwargs = {"E": local_epoch, "learning_rate": lr, "Btc": Batch}
        if i != 0:
            train_kwargs["proto_Z"] = global_protos

        for order, c in enumerate(clients, start=1):
            cid = str(c)
            training_result = local_train(cid, local_params[c], i, order, **train_kwargs)
            local_proto = training_result.metrics["proto"]
            frequencies = training_result.metrics["count"]

            # Collect every client's prototype for each class together with
            # its weight. Accumulate per label: overwriting here would leave
            # only the last client's prototype to be "averaged".
            for label, proto in local_proto.items():
                proto_average.setdefault(label, []).append(
                    (proto.cpu().numpy(), frequencies[label])
                )

            local_params[c] = parameters_to_ndarrays(training_result.parameters)

            print(f"The {order}-th local training has been completed, cid = {cid}.\n")

        # Aggregating central prototypes (classes nobody reported this round
        # keep their previous global prototype):
        for label, weighted_protos in proto_average.items():
            global_protos[label] = torch.tensor(aggregate(weighted_protos), device=Device, requires_grad=False)
        print("Global prototype updated.")

        # Evaluate mean accuracy of local models on local datasets:
        print(f"Round {i+1}, evaluating......")
        # NOTE: the timestamp is taken before evaluation, so the time printed
        # for a round excludes its own evaluation and includes the previous
        # round's evaluation (if any).
        time1 = time.time()
        if (i+1) % 10 == 0:
            total_acc = 0.0
            for cid in range(M):
                _, acc = get_local_test_acc(cid, local_params[cid], local_device=Device)
                total_acc += acc
            test_accuracies.append(total_acc / M)
            print(f"Fedproto: Round {i+1} completed, test accuracy = {total_acc / M}, time consumed = {time1-time0}")
        else:
            print("Skipping evaluation to save time...")
            print(f"Fedproto: Round {i+1} completed, time consumed = {time1-time0}")
        time0 = time1

    now = datetime.now()
    with open('results/Fedproto_accuracies_alpha0.1_' + now.strftime("%Y%m%d%H%M") + '.txt', 'w') as fp:
        for item in test_accuracies:
            # write each item on a new line
            fp.write("%f\n" % item)