# IMAGENET

import torch
import torch.backends.cudnn
import torchvision
from torch.utils.data import Dataset
from torchvision import transforms, datasets
import numpy as np
from prepare_datasets import get_real_subdataset, get_full_dataset, get_transformations, extend_dataset,get_two_real_subsets
from resnet_training import train_resnet

# Let cuDNN benchmark and pick convolution algorithms for the input shapes seen.
torch.backends.cudnn.benchmark = True

# --- Data selection -------------------------------------------------------
real_subset_count = 100      # passed as subset_count to get_real_subdataset
leak_subset_count = 10       # not referenced elsewhere in the visible script
n_generated = 400            # passed as number_of_generated to get_full_dataset
READ_EACH_GENERATED = 2000   # passed as read_amount to get_full_dataset
DATASET_EXPANSION = 1        # passed as expand to get_full_dataset
do_clip = False              # passed as clip to both dataset helpers

# --- Training -------------------------------------------------------------
LR = 0.001                   # learning_rate for train_resnet
EPOCHS = 30                  # epochs for train_resnet
BATCH_SIZE = 128             # batch_size for get_full_dataset
# NOTE(review): this is the string "No", not a boolean; confirm how
# train_resnet interprets its pretrained argument.
PRETRAINED = "No"

# --- Experiment protocol --------------------------------------------------
experiment_count = 1         # number of repeated runs of every setting
DO_VALIDATION = False        # not referenced elsewhere in the visible script
LEAK_EXPERIMENT = False      # not referenced elsewhere in the visible script

# Training images are loaded without any transform at this stage; the class
# index of every training sample is kept as a NumPy array for the subset
# selection helper.
train_set_full = datasets.ImageFolder(
    root='../imagenet100/train/',
    transform=None,
)
targets = np.array(train_set_full.targets)

# Only element [2] of what get_transformations("imagenet") returns is used
# here; it is applied to the validation images.
transform_val = get_transformations("imagenet")[2]
test_set = datasets.ImageFolder(
    root='../imagenet100/val/',
    transform=transform_val,
)

# One entry per experimental condition. Keys read by the experiment loop:
#   label          - name used in logs and as the key of the accuracy table
#   use_generative - forwarded to get_full_dataset(use_generative=...)
#   method         - forwarded to get_full_dataset(method=...)
#   zero_centered  - forwarded to get_full_dataset(zero_centered=...)
#   leak           - whether the leak subset/features are passed along
settings = [
    dict(
        label="real-only",
        use_generative=False,
        method=None,
        zero_centered=False,
        leak=False,
    ),
    dict(
        label="random",
        use_generative=True,
        method="random",
        zero_centered=True,
        leak=False,
    ),
    dict(
        label="frobenius",
        use_generative=True,
        method="MPfast",
        zero_centered=True,
        leak=False,
    ),
    # Disabled conditions, kept for reference:
    # {"label": "random w/leak", "use_generative": True, "method": "random", "zero_centered": True, "leak":True},
    # {"label": "l2-near", "use_generative": True, "method": "l2-near", "zero_centered": True, "leak":False},
    # {"label": "maxmin", "use_generative": True, "method": "cover-maxmin-batched"},
    # {"label": "kmean", "use_generative": True, "method": "kmeans-diverse"}
]

# Echo the run configuration once before any training starts.
# Note: the "Subset Fraction" row shows the value of real_subset_count.
_banner_lines = (
    "===== Experiment Settings =====",
    f"Pretrained Model     : {PRETRAINED}",
    f"Learning Rate        : {LR}",
    f"Epochs               : {EPOCHS}",
    f"Subset Fraction      : {real_subset_count}",
    f"Generated Samples    : {n_generated}",
    f"Experiment Count     : {experiment_count}",
    f"Using CLIP Features  : {do_clip}",
    "================================",
)
for _banner_line in _banner_lines:
    print(_banner_line)

# Per-setting list of test accuracies (one entry appended per run), and the
# summary table that is filled in once all runs have finished.
accs = {config['label']: [] for config in settings}
results = {}

# Leak subset and its features. Nothing in this script builds them, so they
# stay None and only leak-free settings can run.
# TODO: populate both (get_two_real_subsets is imported, presumably for this
# purpose - confirm its signature) before enabling a "leak" setting.
subset_leak = None
features_leak = None

# Fail before any training starts instead of crashing part-way through a run
# when a setting asks for leak data that was never prepared.
_leak_labels = [config["label"] for config in settings if config.get("leak", False)]
if _leak_labels and (subset_leak is None or features_leak is None):
    raise RuntimeError(
        f"Settings {_leak_labels} request leak data, but subset_leak / "
        "features_leak have not been prepared."
    )

for run in range(experiment_count):
    print(f"\n Run {run + 1}/{experiment_count}")
    # get_real_subdataset is called once per run; the returned subset and
    # features are shared by every setting evaluated in that run.
    subset_train2, realfeatures = get_real_subdataset(
        "imagenet",
        train_set_full,
        targets,
        subset_count=real_subset_count,
        clip=do_clip,
    )

    for config in settings:
        # A setting without a "leak" key is treated as leak-free.
        use_leak = config.get("leak", False)
        effective_subset_leak = subset_leak if use_leak else None
        effective_features_leak = features_leak if use_leak else None
        print(f" Testing setting: {config['label']}")

        # The third return value of get_full_dataset is not needed here.
        trainloader, testloader, _ = get_full_dataset(
            dataset_name="imagenet",
            subset_train=subset_train2,
            test_set=test_set,
            use_generative=config["use_generative"],
            # The callee's keyword is named cifar10_*, but it receives the
            # features returned for the imagenet subset above.
            cifar10_real_features=realfeatures,
            number_of_generated=n_generated,
            batch_size=BATCH_SIZE,
            method=config["method"],
            zero_centered=config["zero_centered"],  # taken from the setting
            clip=do_clip,
            expand=DATASET_EXPANSION,
            leak_dataset=effective_subset_leak,
            leak_features=effective_features_leak,
            read_amount=READ_EACH_GENERATED,
        )

        acc = train_resnet(
            trainloader, testloader,
            epochs=EPOCHS,
            learning_rate=LR,
            if_resnet18=True,
            pretrained=PRETRAINED,
            num_classes=100,
        )

        print(f"Accuracy: {acc:.4f}")
        accs[config['label']].append(acc)

# Collapse each setting's per-run accuracies into mean / std, keeping the raw
# per-run values under "all".
for setting_label in accs:
    run_scores = np.array(accs[setting_label])
    results[setting_label] = dict(
        mean=run_scores.mean(),
        std=run_scores.std(),
        all=run_scores,
    )

print("Results:")
for setting_label, summary in results.items():
    avg, spread = summary['mean'], summary['std']
    print(f"{setting_label:>10s} → Avg: {avg:.4f}, Std: {spread:.4f}")