
from sklearn.linear_model import LinearRegression
import numpy as np
from sklearn.linear_model import lars_path
from sklearn.metrics import r2_score, mean_squared_error
from sklearn.linear_model import Ridge


def apply_centered_weights_train(X, y, sample_weight=None, eps_std=1e-12):

    X = np.asarray(X, dtype=float)
    y = np.asarray(y, dtype=float)
    n, p = X.shape

    if sample_weight is None:
        X_mean = np.mean(X, axis=0)
        X_centered = X - X_mean

        X_std = np.std(X_centered, axis=0, ddof=1)
        X_std[X_std < eps_std] = 1.0
        X_scaled = X_centered

        y_centered = y - np.mean(y)
        return X_scaled, y_centered, X_mean, np.mean(y)


    w = np.asarray(sample_weight, dtype=float)
    if w.ndim != 1 or w.shape[0] != n:
        raise ValueError("sample_weight must be a one-dimensional array with length equal to the number of samples")
    if np.any(w < 0):
        raise ValueError("sample weights must be non-negative")

    sum_w = np.sum(w)
    if sum_w <= 0:
        raise ValueError("the sum of sample weights must be positive")

    # 加权均值
    X_wmean = np.average(X, axis=0, weights=w)
    y_wmean = np.average(y, weights=w)

    X_centered = X - X_wmean
    y_centered = y - y_wmean

    X_scaled = (X_centered) * np.sqrt(w)[:, None]
    y_scaled = y_centered * np.sqrt(w)

    return X_scaled, y_scaled, X_wmean, y_wmean


def apply_centered_weights_test(X_test, y_test, X_mean, y_mean=None, sample_weight=None):
    X_test = np.asarray(X_test, dtype=float)
    n_test, p = X_test.shape

    X_scaled = (X_test - X_mean)
    y_scaled = y_test - y_mean

    if sample_weight is not None:
        w = np.asarray(sample_weight, dtype=float)
        X_scaled = X_scaled * np.sqrt(w)[:, None]
        y_scaled = y_scaled * np.sqrt(w)
    return X_scaled, y_scaled


def compute_enter_alphas(p_g,Z, r, gamma, active_set, tol=1e-12):

    p = Z.shape[1]
    enter_alphas = {}
    if not active_set:
        return enter_alphas

    j_ref = active_set[0]
    zr_ref = Z[:, j_ref].dot(r)/p_g[j_ref]
    zzg_ref = Z[:, j_ref].dot(Z.dot(gamma))/p_g[j_ref]

    for j in range(p):

        if j in active_set:
            continue

        #α_j = (Z_j^T r[k-1] - Z_j'^T r[k-1]) / (Z_j^T (Zγ) - Z_j'^T (Zγ))
        zr_j = Z[:, j].dot(r)/p_g[j]
        zzg_j = Z[:, j].dot(Z.dot(gamma))/p_g[j]
        numerator = zr_j - zr_ref
        denominator = zzg_j - zzg_ref


        if (abs(denominator) > tol) and (abs(numerator) > tol):
            if (numerator > 0 and denominator > 0) or (numerator < 0 and denominator < 0):
                alpha_j = (numerator) / (denominator)
                enter_alphas[j] = alpha_j
    return enter_alphas


def compute_zero_alphas(d, gamma, active_set, tol=1e-12):

    zero_alphas = {}
    for j in active_set:
        if gamma[j] < -tol:
            alpha_j = -d[j] / gamma[j]
            if alpha_j > tol and alpha_j <= 1.0 + tol:
                zero_alphas[j] = alpha_j
    return zero_alphas


def nonnegative_garrotte_path(p_g,
        X, y, beta_init=None, sample_weight=None,
        max_iter=1000, tol=1e-12, verbose=True):

    import numpy as np
    from sklearn.linear_model import LinearRegression


    X = np.asarray(X, dtype=float)
    y = np.asarray(y, dtype=float)
    n, p = X.shape


    if beta_init is None:
        X_w_init, y_w_init, _, _ = apply_centered_weights_train(X, y, sample_weight)
        lr_init = LinearRegression(fit_intercept=False)

        lr_init.fit(X_w_init, y_w_init)
        beta_init = lr_init.coef_
    else:
        beta_init = np.asarray(beta_init, dtype=float)


    X_weighted, y_weighted, _, _ = apply_centered_weights_train(X, y, sample_weight)


    Z = X_weighted * beta_init[np.newaxis, :]


    d = np.zeros(p)
    r = y_weighted.copy()
    k = 0

    d_path = [d.copy()]
    r_path = [r.copy()]
    actives = [[]]
    beta_hat_path = [(beta_init * d).copy()]
    cov_zr = Z.T.dot(r)/p_g
    j_star = int(np.argmax(cov_zr))

    C_new = sorted(list(set([j_star])))
    actives.append(C_new)
    removed=[]

    while k < max_iter:
        C = C_new
        gamma = np.zeros(p)
        if len(C) > 0:
            ZC = Z[:, C]
            G = ZC.T.dot(ZC)
            ztr = ZC.T.dot(r)

            try:
                gamma_C = np.linalg.solve(G, ztr)
            except np.linalg.LinAlgError:
                gamma_C = np.linalg.pinv(G).dot(ztr)

            for idx, val in zip(C, gamma_C):
                gamma[idx] = val

        if np.linalg.norm(gamma) < tol:
            if verbose:
                print(f"Iter {k + 1}: direction vector norm ({np.linalg.norm(gamma):.6f}) < tol, terminating")

            break

        enter_alphas = compute_enter_alphas(p_g,Z, r, gamma, C, tol)
        zero_alphas = compute_zero_alphas(d, gamma, C, tol)


        candidates = [('enter', a, j) for j, a in enter_alphas.items()] + \
                     [('zero', a, j) for j, a in zero_alphas.items()] + \
                     [('full', 1.0, None)]
        candidates = [c for c in candidates if c[1] > tol]

        if not candidates:
            alpha = 1.0
            kind = 'full'
            idx = None
        else:
            kind, alpha, idx = min(candidates, key=lambda x: x[1])
            alpha = min(alpha, 1.0)

        # 更新参数
        d_new = d + alpha * gamma
        d_new[d_new < 0] = 0.0

        # 更新活跃集
        if kind == 'enter':
            C_new = sorted(list(set(C + [idx])))
        elif kind == 'zero':
            C_new = sorted([j for j in C if j != idx])
            removed.append(idx)
        else:
            C_new = sorted(list(np.where(d_new > tol)[0]))


        r_new = y_weighted - Z.dot(d_new)
        d = d_new
        r = r_new
        d_path.append(d.copy())
        r_path.append(r.copy())
        actives.append(C_new)
        beta_hat_path.append((beta_init * d).copy())
        if abs(alpha - 1.0) < tol:
            if verbose:
                print("α = 1, path shrinkage completed, algorithm terminated.")
            break

        if verbose:
            print(f"Iter {k + 1}: type={kind:6s}, step size={alpha:.4g}, active set size={len(C_new)}")

        k += 1


    if k >= max_iter and verbose:
        print(f"Reached the maximum number of iterations ({max_iter}).")


    return d_path, r_path, actives, beta_hat_path, beta_init, removed


def find_steps_with_exact_k(actives, k, verbose=False):

    steps_k = [
        (t, active_set)
        for t, active_set in enumerate(actives)
        if len(active_set) == k
    ]

    is_unique = (len(steps_k) == 1)

    if verbose:
        if len(steps_k) == 0:
            print(f"[Info] |C| = {k} does not appear along the path")
        elif is_unique:
            print(f"[Info] |C| = {k} appears only once (at step {steps_k[0][0]})")
        else:
            print(f"[Warning] |C| = {k} appears {len(steps_k)} times")

    return steps_k

def select_topk_features_by_path(actives, k,removed):
    selected = []
    seen = set()

    for active_set in actives:
        for feature in active_set:
            if feature not in seen:
                seen.add(feature)
                selected.append(feature)
                if len(selected) >= k:
                    return selected
    if set(selected) & set(removed) != set():
        print("used feature removed")
    return selected


from sklearn.linear_model import lars_path

def generate_lars_path(weighted_data, weighted_labels):

    alphas, _, coefs = lars_path(weighted_data,
                                 weighted_labels,
                                 method='lasso',
                                 verbose=False)
    return alphas, coefs


def select_features_with_lasso_path(data, labels, weights, num_features):

    weighted_data = ((data - np.average(data, axis=0, weights=weights))
                     * np.sqrt(weights[:, np.newaxis]))
    weighted_labels = ((labels - np.average(labels, weights=weights))
                       * np.sqrt(weights))

    _, coefs = generate_lars_path(weighted_data, weighted_labels)

    nonzero = range(weighted_data.shape[1])
    for i in range(len(coefs.T) - 1, 0, -1):
        nonzero = coefs.T[i].nonzero()[0]
        if len(nonzero) <= num_features:
            break

    used_features = nonzero

    return used_features

def lasso_path_coef(data, labels, weights=None, num_features=30):
    if weights ==None:
        weights = np.ones(len(labels))

    _, coefs = generate_lars_path(data,labels)

    nonzero = range(data.shape[1])
    for i in range(len(coefs.T) - 1, 0, -1):
        nonzero = coefs.T[i].nonzero()[0]
        if len(nonzero) <= num_features:

            break
    selected_coef = coefs.T[i]
    return selected_coef




