
import numpy as np
from itertools import combinations
from collections import Counter


from itertools import combinations
from collections import Counter
import numpy as np

def stability_analysis(feature_sets, N, k):

    sets = [set(fs) for fs in feature_sets]
    freq = Counter(f for s in sets for f in s)
    selection_freq = {f: freq[f] / len(sets) for f in range(N)}

    jaccards = []
    kunchevas = []
    for a, b in combinations(sets, 2):
        inter = len(a & b)
        union = len(a | b)
        if union > 0:
            jaccards.append(inter / union)

        kunchevas.append((inter * N - k**2) / (k * (N - k)))

    mean_jaccard = np.mean(jaccards) if jaccards else np.nan
    mean_kuncheva = np.mean(kunchevas) if kunchevas else np.nan

    return {
        "mean_jaccard": mean_jaccard,
        "mean_kuncheva": mean_kuncheva,
        "selection_freq": selection_freq
    }


from itertools import combinations
from collections import Counter


def stability_used_feature(feature_sets):
    sets = [set(fs) for fs in feature_sets]

    jaccards = []
    kunchevas = []
    for a, b in combinations(sets, 2):
        inter = len(a & b)
        union = len(a | b)
        if union > 0:
            jaccards.append(inter / union)

    mean_jaccard = np.mean(jaccards) if jaccards else np.nan

    return round(np.mean(mean_jaccard), 4)

def eval_against_truth(selected, true_set):
    try:
        selected = set(selected)
        true_set = set(true_set)

        tp = len(selected & true_set)
        precision = tp / len(selected) if selected else 0
        recall = tp / len(true_set) if true_set else 0
        f1 = 2 * precision * recall / (precision + recall) if (precision + recall) > 0 else 0

        return precision, recall, f1
    except Exception as e:
        print(f"eval_against_truth: {e}")
        return 0.0, 0.0, 0.0


def ev_truth(f_set, N, true_set):
    precisions = []
    recalls = []
    f1_scores = []

    for i in range(min(N, len(f_set))):
        try:
            precision, recall, f1 = eval_against_truth(f_set[i], true_set)
            precisions.append(precision)
            recalls.append(recall)
            f1_scores.append(f1)
        except Exception as e:

            precisions.append(0.0)
            recalls.append(0.0)
            f1_scores.append(0.0)

    mean_precision = np.mean(precisions) if precisions else 0.0
    mean_recall = np.mean(recalls) if recalls else 0.0
    mean_f1 = np.mean(f1_scores) if f1_scores else 0.0

    return mean_precision, mean_recall, mean_f1


import numpy as np
from scipy.stats import spearmanr, kendalltau


def multiple_run_consistency(importance_runs, feature_names=None):
    n_runs = len(importance_runs)
    n_features = len(importance_runs[0])

    if feature_names is None:
        feature_names = [f'Feature_{i + 1}' for i in range(n_features)]

    rankings = []
    for run in importance_runs:

        ranks = np.argsort(run)[::-1]
        rankings.append(ranks)

    rankings = np.array(rankings)

    avg_ranks = np.mean(rankings, axis=0)

    spearman_matrix = np.zeros((n_runs, n_runs))
    kendall_matrix = np.zeros((n_runs, n_runs))

    for i in range(n_runs):
        for j in range(i, n_runs):
            if i == j:
                spearman_matrix[i, j] = 1.0
                kendall_matrix[i, j] = 1.0
            else:
                spearman_corr, _ = spearmanr(rankings[i], rankings[j])
                kendall_corr, _ = kendalltau(rankings[i], rankings[j])

                spearman_matrix[i, j] = spearman_corr
                spearman_matrix[j, i] = spearman_corr
                kendall_matrix[i, j] = kendall_corr
                kendall_matrix[j, i] = kendall_corr

    spearman_values = spearman_matrix[np.triu_indices(n_runs, k=1)]
    kendall_values = kendall_matrix[np.triu_indices(n_runs, k=1)]

    mean_spearman = round(np.mean(spearman_values), 4)
    mean_kendall = round(np.mean(kendall_values), 4)
    return mean_spearman

def slope_trend_similarity(shapes, xs):
    slopes = np.diff(shapes, axis=1) / np.diff(xs)

    from sklearn.metrics.pairwise import cosine_similarity
    cos_mat = cosine_similarity(slopes)
    return np.mean(cos_mat[np.triu_indices_from(cos_mat, k=1)])