import numpy as np
import pandas as pd
from sklearn.datasets import make_classification, make_blobs
from sklearn.model_selection import train_test_split, GridSearchCV, KFold, StratifiedKFold
from sklearn.preprocessing import StandardScaler, MinMaxScaler
from sklearn.svm import SVC
from tqdm import tqdm
# from sklearn.feature_selection import mutual_info_classif, f_classif
# from skfeature.function.similarity_based import fisher_score, lap_score, reliefF, SPEC
# from skfeature.function.statistical_based import gini_index, t_score
# from skfeature.utility.construct_W import construct_W
import os
from joblib import Parallel, delayed
from itertools import product
from Functions import Kernel_matrix, LG_sym, calc_differential_vec
from ELVES import Differential_method, Shared_space, Multiple_latent_variables

# generate Hypercube dataset
n_relevant_features = 10
X, y = make_classification(
    n_samples=2000,
    n_features=200,
    n_informative=10,
    n_redundant=0,
    n_clusters_per_class=2,
    flip_y=0.01,     # control label noise ratio (default 0.01)
    class_sep=1,  # increase class separation (default 1)
    scale=1.0,    # control the variance of the data (default 1)
    shuffle=False,  # do not disrupt the order of features, and ensure that the first 10 are relevant features
    random_state=42
)

# ================== experimental parameters ==================
elves_param_grid = {
    'N': [5, 8, 10, 20, 30, 50, 80, 100],     # the number of iterations
    'K': [20, 60, 90, 100, 170, 180],      # the number of neighbors     
    'k': [10, 30, 50, 80, 100, 190],      
    'k0': [200],     
    'w1': [0.5]   
}
svm_param_grid = {
    'C': [2 ** i for i in [-5, -2, 1, 4, 7, 10, 13]],
    'gamma': [2 ** i for i in [-15, -12, -9, -6, -3, 0, 3]]
}
n_outer_iter = 50
n_inner_folds = 10
true_features = set(range(n_relevant_features))
seed_grid = {
    'seed1': [1234],
    'seed2': [3407],    
    'seed3': [42]    
}

# os.makedirs('/Hypercube', exist_ok=True)


# ELVES：Only the differential vector of the last iteration is considered
def ELVES(X1, X2, N=2, K=200, k=500, k0=400, w1=0.5):
    """ iteratively calculate the differential vector: take the larger value at the corresponding position as the final score"""
    delta1 = Multiple_latent_variables(X1, X2, N=N, K=K, k=k, k0=k0)
    delta2 = Multiple_latent_variables(X2, X1, N=N, K=K, k=k, k0=k0)

    # ===== intra-category aggregation =====
    # calculate score1 and score2
    score1 = delta1[:, -1] ** 2
    score2 = delta2[:, -1] ** 2

    # normalize score1 and score2 to 0-1
    scaler = MinMaxScaler()
    score1 = scaler.fit_transform(score1.reshape(-1, 1)).flatten()
    score2 = scaler.fit_transform(score2.reshape(-1, 1)).flatten()

    # ===== aggregation across categories =====
    # for score1 and score2, take the larger value in the corresponding position
    score = np.maximum(score1, score2)

    return delta1, delta2, score1, score2, score


def evaluate_single_param(params, X_train_sub, y_train_sub, X_temp, y_temp, seed3):
    """Evaluate individual parameter combinations in parallel"""
    N, K, k, k0, w1 = params
    try:
        # feature selection
        X1 = X_train_sub[y_train_sub == 0]
        X2 = X_train_sub[y_train_sub == 1]
        _, _, _, _, scores = ELVES(X1, X2, N=N, K=K, k=k, k0=k0)
        selected = np.argsort(scores)[-10:]
    except Exception as e:
        print(f"parameter combination {params} error: {str(e)}")
        return (params, -np.inf, [])

    # inner cross validation
    inner_scores = []
    inner_kf = StratifiedKFold(n_splits=5, shuffle=True, random_state=seed3)   
    for inner_train_idx, inner_val_idx in inner_kf.split(X_temp, y_temp):
        X_inner_train = X_temp[inner_train_idx]
        y_inner_train = y_temp[inner_train_idx]
        X_inner_val = X_temp[inner_val_idx]
        y_inner_val = y_temp[inner_val_idx]

        svm = SVC(kernel='rbf')
        svm.fit(X_inner_train[:, selected], y_inner_train)
        inner_scores.append(svm.score(X_inner_val[:, selected], y_inner_val))

    return (params, np.mean(inner_scores), selected)


# ================== Parallel task encapsulation ==================
def process_outer_iteration(seed_combo, outer_iter):
    seed1, seed2, seed3 = seed_combo
    X_temp, X_test_final, y_temp, y_test_final = train_test_split(
        X, y, test_size=500,
        random_state=seed2 + outer_iter,
        stratify=y
    )

    np.random.seed(seed1)
    sample_idx = np.random.choice(X_temp.shape[0], 50, replace=False)
    X_train_sub = X_temp[sample_idx]
    y_train_sub = y_temp[sample_idx]

    param_combinations = list(product(*elves_param_grid.values()))

    # evaluate parameter combinations in parallel
    param_results = Parallel(n_jobs=8, verbose=0)(
        delayed(evaluate_single_param)(params, X_train_sub, y_train_sub, X_temp, y_temp, seed3)
        for params in param_combinations
    )

    # choose the best parameters
    best_params = max(param_results, key=lambda x: x[1])
    N_best, K_best, k_best, k0_best, w1_best = best_params[0]
    selected_features = best_params[2]

    # SVM parameter tuning
    grid_search = GridSearchCV(
        SVC(kernel='rbf'),
        svm_param_grid,
        cv=StratifiedKFold(n_splits=10, shuffle=True, random_state=42),   
        n_jobs=1
    )
    grid_search.fit(X_temp[:, selected_features], y_temp)

    test_acc = grid_search.score(X_test_final[:, selected_features], y_test_final)
    correct = len(set(selected_features) & true_features)

    return {
        'seed1': seed1,
        'seed2': seed2,
        'seed3': seed3,
        'iteration': outer_iter,
        'test_accuracy': test_acc,
        'correct_features': correct,
        'selected_features': selected_features,
        'best_C': grid_search.best_params_['C'],
        'best_gamma': grid_search.best_params_['gamma'],
        'test_data': (X_test_final, y_test_final)
    }


def process_seed_combination(seed_combo):
    seed_results = Parallel(n_jobs=8, verbose=0)(
        delayed(process_outer_iteration)(seed_combo, outer_iter)
        for outer_iter in range(n_outer_iter)
    )
    return seed_results


# ================== Main execution process ==================
if __name__ == "__main__":
    seed_combinations = list(product(
        seed_grid['seed1'],
        seed_grid['seed2'],
        seed_grid['seed3']
    ))

    all_results = Parallel(n_jobs=8, verbose=10)(
        delayed(process_seed_combination)(seed_combo)
        for seed_combo in seed_combinations
    )

    final_results = []
    for seed_results in all_results:
        final_results.extend(seed_results)

    df = pd.DataFrame(final_results)
    df.to_csv('/Hypercube/final_results_elves.csv', index=False)  
    avg_test_accuracy = df['test_accuracy'].mean()
    avg_correct = df['correct_features'].mean()
    print(f'avg_test_accuracy: {avg_test_accuracy}')
    print(f'avg_correct: {avg_correct}')
    
    

