
from __future__ import annotations
from typing import Sequence, List, Dict
import numpy as np
import pandas as pd
from sklearn.metrics.pairwise import (
    rbf_kernel,
    linear_kernel,
    polynomial_kernel,
    sigmoid_kernel,
)

def cav_pairwise_mean_angle_deg(cavs: Sequence[np.ndarray]) -> float:
    if len(cavs)<2: return 0.0
    ang=[]
    for i in range(len(cavs)):
        for j in range(i+1,len(cavs)):
            u,v = cavs[i], cavs[j]
            cs = abs(float(u@v) / (np.linalg.norm(u)*np.linalg.norm(v) + 1e-8))
            cs = min(1.0, max(-1.0, cs))
            ang.append(float(np.degrees(np.arccos(cs))))
    return float(np.mean(ang))

def sensitivity_from_grad_and_cav(grad: np.ndarray, cav: np.ndarray) -> float:
    return float(grad@cav)

def tcav_score_from_grads_and_cavs(grads: np.ndarray, cavs: Sequence[np.ndarray]) -> List[float]:
    scores=[]
    for v in cavs:
        s = grads@v
        scores.append(float((s>0).mean()))
    return scores

def aggregate_variance_by_n(records: List[Dict]) -> pd.DataFrame:
    df = pd.DataFrame.from_records(records)
    if df.empty:
        return df
    keys = ['layer', 'n']
    if 'concept' in df.columns:
        keys = ['layer', 'concept', 'n']
    agg = df.groupby(keys).agg(
        mean_value=('value','mean'),
        std_value=('value','std'),
        count=('value','size')
    ).reset_index()
    return agg

def _svc_resolve_gamma(clf) -> float:
    gamma = getattr(clf, "_gamma", None)
    if gamma is None:
        gamma = clf.gamma if isinstance(clf.gamma, (int, float)) else 1.0
    return float(gamma)

def _svc_kernel_matrix(X: np.ndarray, Y: np.ndarray, *, kernel: str, gamma: float, degree: int, coef0: float) -> np.ndarray:
    if kernel == "linear":
        return linear_kernel(X, Y)
    if kernel == "rbf":
        return rbf_kernel(X, Y, gamma=gamma)
    if kernel == "poly":
        return polynomial_kernel(X, Y, gamma=gamma, degree=degree, coef0=coef0)
    if kernel == "sigmoid":
        return sigmoid_kernel(X, Y, gamma=gamma, coef0=coef0)
    raise ValueError(f"Unsupported kernel for SVC inner-product: {kernel}")

def svc_weight_inner_product(clf_a, clf_b) -> float:
    if clf_a.kernel != clf_b.kernel:
        raise ValueError(f"Kernel mismatch: {clf_a.kernel} vs {clf_b.kernel}")
    kernel = str(clf_a.kernel)
    gamma = _svc_resolve_gamma(clf_a)
    degree = int(getattr(clf_a, "degree", 3))
    coef0 = float(getattr(clf_a, "coef0", 0.0))

    coef_a = np.asarray(clf_a.dual_coef_).ravel()
    coef_b = np.asarray(clf_b.dual_coef_).ravel()
    sv_a = np.asarray(clf_a.support_vectors_, dtype=float)
    sv_b = np.asarray(clf_b.support_vectors_, dtype=float)

    K = _svc_kernel_matrix(sv_a, sv_b, kernel=kernel, gamma=gamma, degree=degree, coef0=coef0)
    return float(coef_a @ K @ coef_b.T)

def _trace_variance_from_gram(G: np.ndarray, ddof: int = 1) -> float:
    n = G.shape[0]
    if n < 2:
        return 0.0
    mean_diag = float(np.mean(np.diag(G)))
    mean_all = float(np.mean(G))
    var = mean_diag - mean_all
    if ddof == 1:
        var *= n / (n - 1)
    return float(max(var, 0.0))

def svc_weight_trace_variance(clfs: Sequence, normalize: bool = True, ddof: int = 1) -> float:
    clfs = [c for c in clfs if c is not None]
    if len(clfs) < 2:
        return 0.0
    n = len(clfs)
    G = np.zeros((n, n), dtype=float)
    for i in range(n):
        G[i, i] = max(0.0, svc_weight_inner_product(clfs[i], clfs[i]))
        for j in range(i + 1, n):
            val = svc_weight_inner_product(clfs[i], clfs[j])
            G[i, j] = val
            G[j, i] = val

    if normalize:
        norms = np.sqrt(np.maximum(np.diag(G), 0.0))
        denom = np.outer(norms, norms)
        G = np.where(denom > 0, G / denom, 0.0)

    return _trace_variance_from_gram(G, ddof=ddof)
