# # from sklearn.preprocessing import MinMaxScaler
# from kdd import *
# from Utils.data_methods import *
# from Utils.data_methods_synthetic import generate_anomalies
# from pipeline import *
# from post_processing import *
#
# path_train = '../data/kdd/KDDTrain+.txt'
# path_test = '../data/kdd/KDDTest+.txt'
# df = get_df(path_train, columns=columns, drop=False)
# test_df = get_df(path_test, columns=columns, drop=False)
#
# val_split = 0.2
#
# class_label = dict()
# for lab, num in zip(attack_labels, test_classes):
#     class_label[lab] = num
#
# features_to_encode = ['protocol_type', 'service', 'flag']
# # get numeric features, we won't worry about encoding these at this point
# # numeric_features = ['duration', 'src_bytes', 'dst_bytes']
# # Use all features
# numeric_features = sorted(list(set(df.columns[:-5]) - set(features_to_encode)))
#
# # only select normal class for training
# training_classes = [0]
# scaler = MinMaxScaler()
#
# x_training_real, y_training_real, x_test, y_test = preprocess(
#     df, test_df, features_to_encode, numeric_features, training_classes=training_classes,
#     map_attack=map_attack_kdd, raw_label_col="attack", normal_label="normal", scaler=scaler,
#     train_index_match_col='attack_map', train_label_col='normal_flag',
#     test_index_match_col='attack_map', test_label_col='attack_map')
# n_dim = x_training_real.shape[-1]
#
# # # Baselines
# # num_att_total = np.sum(y_training)
# # num_normal = len(y_training) - num_att_total
# # print("Baseline train AUPR: ", 1 - num_normal/len(y_training))
# #
# # num_att_total = np.sum(y_test)
# # num_normal = len(y_test) - num_att_total
# # print("Baseline overall AUPR: ", 1 - num_normal/len(y_test))
# #
# # val_counts = test_df['attack_map'].value_counts()[1:]
# #
# # for att in new_attacks:
# #     num_att = val_counts[att]
# #     print(f"Baseline AUPR {att}: ", num_att/(num_normal + num_att))
# # #####################################################################
#
# repeats = 3
# model_type = "SVM"
# one_class = True
# sigmoid_head = True
# classifier_layers = 3
# # change this to list instead
# rep_dim = [n_dim for i in range(classifier_layers - 1)]
# assert len(rep_dim) == classifier_layers - 1
# activation = torch.nn.LeakyReLU()
# # epochs = 20
# epochs = 200
# # weight_decay = 0
# weight_decay = 1e-2
# optimizer_params = {'lr': 1e-3}
# # from pl_bolts.optimizers.lr_scheduler import LinearWarmupCosineAnnealingLR
# # lr_scheduler = LinearWarmupCosineAnnealingLR
# # lr_scheduler_params = {"warmup_epochs": epochs//10, "max_epochs": epochs}
# # lr_scheduler = torch.optim.lr_scheduler.CosineAnnealingLR
# # lr_scheduler_params = {"T_max": epochs}
# lr_scheduler = None
# lr_scheduler_params = dict()
# use_hinge = False
# patience = 7
# batch_size = 1024
#
# theory_nn = True
# if theory_nn:
#     one_class = False
#     # classifier_layers = 3
#     # rep_dim = [n_dim, n_dim]
#     activation = torch.nn.ReLU()
#     # activation = torch.nn.LeakyReLU()
#     sigmoid_head = False
#     use_hinge = True
#     weight_decay = 1e-2
#
# if weight_decay > 0:
#     optimizer = torch.optim.AdamW   # w weight decay
#     optimizer_params['weight_decay'] = weight_decay
# else:
#     optimizer = torch.optim.Adam
# if use_hinge:
#     from torchmetrics import HingeLoss
#     loss_fn = HingeLoss(task="binary")
#     neg_labels = False
#     # loss_fn = torch.nn.HingeEmbeddingLoss(margin=1.0)
#     # neg_labels = True
# else:
#     loss_fn = torch.nn.functional.binary_cross_entropy
#     neg_labels = False
#
# synthetic_anom_ratio = 1
#
# fpr = 0.05
# eval_only = True
#
# results = []
#
# for i in range(repeats):
#     run_num = repeats - i
#     print("Run ", i+1)
#     # Resample train vs val split
#     x_train_real, y_train_real, x_val_real, y_val_real = validation_split(
#         x_training_real, y_training_real, val_split=val_split, seed=1234+i)
#
#     classifier, classifier_name = get_classifier_and_name(
#         model_type, classifier_layers=classifier_layers, rep_dim=rep_dim, activation=activation, one_class=one_class,
#         sigmoid_head=sigmoid_head, seed=i)
#     if theory_nn:
#         classifier_name = "T" + classifier_name[1:]
#
#     # generate and combine synthetic anoms w seed 23+i
#     # train eval model
#     if eval_only:
#         version_num = -run_num
#     else:
#         version_num = None
#
#     result = experiment_run(
#         classifier, classifier_name, x_train_real, y_train_real, x_val_real, y_val_real, x_test, y_test, class_label,
#         synthetic_anom_ratio, epochs=epochs, optimizer=optimizer, optimizer_params=optimizer_params,
#         lr_scheduler=lr_scheduler, lr_scheduler_params=lr_scheduler_params, patience=patience, neg_labels=neg_labels,
#         batch_size=batch_size, loss_fn=loss_fn,
#         plot=True, fpr=fpr, normal_is_positive=False, seed=i, seed_anom_generation=23+i, positive_class=0,
#         model_type=model_type, version_num=version_num)
#
#     results.append(result)
#
# results_dict = collate_results(
#     results, result_cols=["precision", "recall", "f1", "average_precision", "auroc", "df_results"])
# aggregated_results = agg_results(results_dict)
# print_exp_agg_results(
#     aggregated_results["precision"], aggregated_results["recall"], aggregated_results["f1"],
#     aggregated_results["average_precision"], aggregated_results["acc"], aggregated_results["df_results"])
