from typing import List, Optional, Tuple, Union, Dict
from models import AlexNet, AlexNet_approximated, freeze_layer
import random
import torch
import time
import numpy as np
from flwr.common import EvaluateRes, Metrics, Scalar, Code
from flwr.common import FitIns, FitRes, Status
from flwr.server.client_manager import ClientManager
from flwr.server.client_proxy import ClientProxy
from flwr.common import ndarrays_to_parameters
from flwr.server.strategy.aggregate import weighted_loss_avg, aggregate
from flwr.common.logger import log
from logging import WARNING
from cifardataset import cifar10Dataset
from util import get_filters, get_updated_layers, set_filters, approximate_convolution, compute_sampling_prob
from torch.utils.data import DataLoader
from datetime import datetime
from feddrop import get_mean_test_acc
from FedLF_gpu import aggregate_updated_layer

# Experiment-wide settings shared by the functions in this module.

# Channel count handed to the AlexNet constructors as their first argument.
CHANNEL = 3
# Batch size handed to the DataLoader that feeds local training.
Batch = 128
# Value passed as ``outputs`` to the AlexNet constructors.
CLASSES = 10
# Run on the GPU whenever CUDA is usable, otherwise fall back to the CPU.
DEVICE = "cpu" if not torch.cuda.is_available() else "cuda"
# Defaults for the client population size (M) and the per-round sample (P).
Num_clients = 100
Num_participants = 10
# Default number of federated rounds.
ROUNDS = 500
# Default approximation rate used by run_LFaprox.
K = 0.5

def weighted_average(metrics: List[Tuple[int, "Metrics"]]) -> "Metrics":
    """Combine per-client accuracies into one example-weighted accuracy.

    Args:
        metrics: ``(num_examples, client_metrics)`` pairs; every
            ``client_metrics`` mapping must contain an ``"accuracy"`` entry.

    Returns:
        A mapping with a single ``"accuracy"`` key holding
        ``sum(n_i * acc_i) / sum(n_i)``. When there are no examples at all
        (empty ``metrics`` or every ``num_examples`` is 0) the accuracy is
        reported as ``0.0`` instead of raising ``ZeroDivisionError``.
    """
    total_examples = sum(num_examples for num_examples, _ in metrics)
    if total_examples == 0:
        # Nothing to average over; avoid dividing by zero.
        return {"accuracy": 0.0}

    # Weight each client's accuracy by the number of examples it used.
    weighted_sum = sum(num_examples * m["accuracy"] for num_examples, m in metrics)
    return {"accuracy": weighted_sum / total_examples}

def get_lf_number(cid):
    """Return the frozen-layer count assigned to client ``cid``.

    ``cid`` is converted with ``int`` and reduced modulo 4, so the counts
    6, 4, 2, 0 repeat cyclically over consecutive client ids.
    """
    frozen_layer_counts = (6, 4, 2, 0)
    slot = int(cid) % len(frozen_layer_counts)
    return frozen_layer_counts[slot]

'''
def get_rate(cid):
    z = [0.625, 0.75, 0.875, 1.0]
    return z[int(cid) % 4]
'''
def local_train(cid, params, server_round, client_count, lf, rate=1.0, E=5, learn_rate=0.005) -> FitRes:
    """Run local SGD for one client and wrap the updated layers in a FitRes.

    Args:
        cid: Client id; selects the CSV file the client's data is read from.
        params: Values loaded into the local model through ``set_filters``.
        server_round: Zero-based round index (printed as ``server_round + 1``).
        client_count: Position of this client within the round (log only).
        lf: Frozen-layer setting forwarded to the model constructor,
            ``freeze_layer`` and ``get_updated_layers``.
        rate: Forwarded to ``AlexNet_approximated`` as ``rate``.
        E: Number of passes over the client's data.
        learn_rate: Learning rate of the SGD optimizer.

    Returns:
        A ``FitRes`` with an OK status, the updated layers (both as
        ``parameters`` and, unserialized, under the ``"updated layer"``
        metrics key) and the client's dataset size as ``num_examples``.
    """
    print(f"Server round {server_round+1}, training on the {client_count}-th client, id = {cid}, with {lf} layers frozen.")

    # Load this client's data shard.
    client_data = cifar10Dataset("clientdata/cifar10_client_"+ str(cid) + "_ALPHA_0.1.csv")
    batches = DataLoader(client_data, Batch, shuffle=True)

    # Build the local model, load the received values, then freeze per ``lf``.
    net = AlexNet_approximated(CHANNEL, outputs=CLASSES, lf=lf, rate=rate).to(DEVICE)
    set_filters(net, params)
    freeze_layer(net, lf)

    started = time.time()
    loss_fn = torch.nn.CrossEntropyLoss()
    sgd = torch.optim.SGD(net.parameters(), lr=learn_rate)
    net.train()
    for _ in range(E):
        for inputs, targets in batches:
            inputs = inputs.to(DEVICE)
            targets = targets.to(DEVICE)
            sgd.zero_grad()
            batch_loss = loss_fn(net(inputs), targets)
            batch_loss.backward()
            sgd.step()
    finished = time.time()
    print(f"Training done, time cost = {finished-started} seconds\n")

    updated = get_updated_layers(net, lf)
    return FitRes(
        status=Status(code=Code.OK, message="Success"),
        parameters=ndarrays_to_parameters(updated),
        num_examples=len(client_data),
        metrics={"updated layer": updated},
    )

def run_LFaprox(M=Num_clients, P=Num_participants, R=ROUNDS, seed=2024, approx_rate=K, lr=0.005):
    """Run the layer-freezing + approximation FL simulation and save accuracies.

    Each round samples ``P`` client ids from ``range(M)``, trains every
    sampled client sequentially through ``local_train``, merges the returned
    layers into the global model with ``aggregate_updated_layer`` and records
    the accuracy returned by ``get_mean_test_acc``. After the last round the
    per-round accuracies are written, one per line, to a timestamped text
    file in the ``results`` directory.

    Args:
        M: Size of the client population; ids are drawn from ``range(M)``.
        P: Number of clients sampled (without replacement) per round.
        R: Number of rounds to run.
        seed: Seed for Python's ``random`` module, which drives client
            sampling. No other RNG is seeded here.
        approx_rate: Passed to ``approximate_convolution`` as ``prob`` and to
            ``local_train`` as ``rate``; also embedded in the output filename.
        lr: Learning rate forwarded to ``local_train``.

    Raises:
        ValueError: From ``random.sample`` when ``P`` exceeds ``M``.
        OSError: If the results directory cannot be created or written.
    """
    import os  # function-scope import: only needed for the output directory

    results_dir = "results"
    # Create the output directory before any training so that a missing or
    # unwritable directory fails immediately instead of discarding the
    # accuracies after all rounds have finished.
    os.makedirs(results_dir, exist_ok=True)

    global_model = AlexNet(CHANNEL, outputs=CLASSES).to(DEVICE)
    round_start = time.time()
    random.seed(seed)
    test_accuracies = []

    for i in range(R):
        # Fit:
        print(f"Starting FL Round {i+1}......\n")
        fit_results = []
        clients = random.sample(range(M), k=P)
        for client_count, c in enumerate(clients, start=1):
            cid = str(c)
            lf = get_lf_number(cid)
            # NOTE(review): global_model is not modified inside this loop, so
            # this call looks loop-invariant; it is left here because whether
            # compute_sampling_prob is deterministic/side-effect free cannot
            # be confirmed from this file.
            sampling_weights = compute_sampling_prob(global_model)
            global_parameters = approximate_convolution(global_model, sampling_probs=sampling_weights, lf=lf, prob=approx_rate)
            fitres = local_train(cid, global_parameters, i, client_count, lf, rate=approx_rate, E=5, learn_rate=lr)
            fit_results.append((fitres.metrics["updated layer"], fitres.num_examples))

        # Aggregate:
        print("Aggregating and updating global model.....\n")
        new_model_dict = aggregate_updated_layer(global_model, fit_results)
        # strict=False: the aggregated dict is allowed to omit some keys.
        global_model.load_state_dict(new_model_dict, strict=False)

        # Evaluate:
        print(f"Round {i+1}, evaluating......")
        _, acc = get_mean_test_acc(global_model)
        test_accuracies.append(acc)
        round_end = time.time()
        print(f"Round {i+1} completed, test accuracy = {acc}, time consumed = {round_end-round_start}")
        # The next round's duration is measured from the end of this one.
        round_start = round_end

    stamp = datetime.now().strftime("%Y%m%d%H%M")
    out_path = os.path.join(
        results_dir,
        'LFaprox_accuracies_alpha0.1_rate_' + str(approx_rate) + '_' + stamp + '.txt',
    )
    with open(out_path, 'w') as fp:
        # One accuracy per line, in round order.
        fp.writelines("%f\n" % item for item in test_accuracies)