
import torch
import torch.backends.cudnn
import torchvision
from torchvision import transforms
import numpy as np
from prepare_datasets import get_real_subdataset, get_full_dataset, get_transformations, extend_dataset,get_two_real_subsets
from resnet_training import train_resnet

# Let cuDNN benchmark the available convolution algorithms and pick the
# fastest one for the input shapes it encounters.
torch.backends.cudnn.benchmark = True

# --- Experiment configuration -------------------------------------------
# Passed as `subset_fraction` to get_two_real_subsets.
real_subset_fraction = 0.02
# Passed as `leak_fraction` to get_two_real_subsets.
leak_subset_fraction = 0.2
# Passed as `number_of_generated` to get_full_dataset.
n_generated = 800
# Number of times the whole sweep over all settings is repeated.
experiment_count = 10
# Forwarded as `clip` to both get_two_real_subsets and get_full_dataset.
do_clip = False

# Banner identifying this run's configuration in the log output.
print(
    "TRAIN WITH LEAK: "
    f"{real_subset_fraction},{leak_subset_fraction},{n_generated}"
)

# The element at index 2 of get_transformations' return value is used as the
# test-time transform (presumably the evaluation pipeline -- confirm against
# prepare_datasets).
transform_test = get_transformations("cifar10")[2]

# The training split is loaded with no transform attached here; it is handed
# as-is to get_two_real_subsets further down.
train_set_full = torchvision.datasets.CIFAR10(
    root='./data',
    train=True,
    download=True,
    transform=None,
)
test_set = torchvision.datasets.CIFAR10(
    root='./data',
    train=False,
    download=True,
    transform=transform_test,
)

# Labels of the full training split as a NumPy array.
targets = np.array(train_set_full.targets)

# Experiment settings, one dict per configuration:
#   "label"          -- name used as the key in `accs` and in the printed summary
#   "use_generative" -- forwarded as `use_generative` to get_full_dataset
#   "method"         -- forwarded as `method` to get_full_dataset
#   "leak"           -- whether the leak subset/features are handed to get_full_dataset
#
# The list starts with the real-only baseline; every generative method then
# appears twice in a row: first without the leak, then with it (" w/leak"
# appended to the label).
settings = [
    {"label": "real-only", "use_generative": False, "method": None, "leak": False},
] + [
    {
        "label": f"{base_label} w/leak" if with_leak else base_label,
        "use_generative": True,
        "method": method_name,
        "leak": with_leak,
    }
    for base_label, method_name in (
        ("l2-near", "l2-near"),
        ("random", "random"),
        ("greedy frobenius", "greedy-frobenius"),
        ("frobenius", "MPfast"),
        ("maxmin", "cover-maxmin-batched"),
        ("kmean", "kmeans-diverse"),
        ("l2-near pca", "l2-near-pca-32"),
    )
    for with_leak in (False, True)
]

# Accuracy history per setting label; one value is appended per run.
accs = {cfg['label']: [] for cfg in settings}
# Filled in after all runs with the per-setting summary statistics.
results = {}

for run in range(experiment_count):
    print(f"\n Run {run + 1}/{experiment_count}")

    # The real subsets and features are obtained once per run and shared by
    # every setting evaluated in that run.
    subset_leak, subset_train2, features_leak, cifar10features = get_two_real_subsets(
        "cifar10",
        train_set_full,
        targets,
        leak_fraction=leak_subset_fraction,
        subset_fraction=real_subset_fraction,
        clip=do_clip,
    )

    for config in settings:
        # Only leak-enabled settings receive the leak subset and its features.
        # A setting that omits the "leak" key is treated as leak-enabled.
        if config.get("leak", True):
            effective_subset_leak = subset_leak
            effective_features_leak = features_leak
        else:
            effective_subset_leak = None
            effective_features_leak = None
        print(f" Testing setting: {config['label']}")

        # The third return value of get_full_dataset is not used here.
        trainloader, testloader, _ = get_full_dataset(
            dataset_name="cifar10",
            subset_train=subset_train2,
            test_set=test_set,
            use_generative=config["use_generative"],
            cifar10_real_features=cifar10features,
            number_of_generated=n_generated,
            batch_size=128,
            method=config["method"],
            # NOTE(review): an earlier comment on this argument claimed the
            # value was False, but True is what is passed -- confirm which
            # one is intended.
            zero_centered=True,
            clip=do_clip,
            leak_dataset=effective_subset_leak,
            leak_features=effective_features_leak,
        )

        # Train on this setting's loaders and record the returned accuracy.
        acc = train_resnet(
            trainloader,
            testloader,
            epochs=25,
            learning_rate=0.001,
            if_resnet18=True,
            num_classes=10,
        )

        print(f"Accuracy: {acc:.4f}")
        accs[config['label']].append(acc)

# Collapse each setting's per-run accuracies into summary statistics.
for label, scores in accs.items():
    scores = np.array(scores)
    results[label] = {
        "mean": scores.mean(),
        # ndarray.std() uses ddof=0 by default, i.e. the population standard
        # deviation over the runs.
        "std": scores.std(),
        "all": scores,
    }

# Right-align labels to the longest one so the Avg/Std columns line up.
# The previous fixed width of 10 was shorter than most labels, which left the
# summary ragged; 10 is kept as the minimum width.
label_width = max([10, *(len(label) for label in results)])

print("Results:")
for key, val in results.items():
    print(f"{key:>{label_width}s} → Avg: {val['mean']:.4f}, Std: {val['std']:.4f}")