
# %%
# pip install numpy powerlaw
import numpy as np
import powerlaw

def report_degree_tail(degrees, q=0.99, verbose=False):
    """Report 'not heavy-tailed' evidence for integer degree data."""
    x = np.asarray(degrees, dtype=float)
    x = x[np.isfinite(x)]
    x = x[x > 0]  # power-law fit is defined for positive support

    if x.size < 20 or x.sum() == 0:
        raise ValueError("Not enough positive degrees to analyze.")

    fit = powerlaw.Fit(x, discrete=True, verbose=False)
    alpha = fit.power_law.alpha
    xmin  = fit.power_law.xmin
    n_tail = int((x >= xmin).sum())

    # Model comparisons (LLR, p). Positive LLR favors the first model.
    R_ln,  p_ln  = fit.distribution_compare('power_law', 'lognormal',  normalized_ratio=True)
    R_exp, p_exp = fit.distribution_compare('power_law', 'exponential', normalized_ratio=True)

    # Concentration summaries
    cv = float(x.std(ddof=0) / x.mean())
    qratio = float(np.quantile(x, q) / np.median(x))

    one_liner = (
        f"Power-law vs log-normal: LLR={R_ln:.2f}, p={p_ln:.3g}; "
        f"vs exponential: LLR={R_exp:.2f}, p={p_exp:.3g}. "
        f"Concentration: CV={cv:.2f}; {int(q*100)}th/median={qratio:.2f}. "
        f"Tail fit (PL): alpha={alpha:.2f}, xmin={xmin}, n_tail={n_tail}."
    )

    if verbose:
        print(one_liner)

    return {
        "LLR_PL_vs_LN": R_ln, "p_PL_vs_LN": p_ln,
        "LLR_PL_vs_EXP": R_exp, "p_PL_vs_EXP": p_exp,
        "CV": cv, f"q{int(q*100)}/median": qratio,
        "alpha": alpha, "xmin": xmin, "n_tail": n_tail,
        "summary": one_liner
    }


for file in ["saelens_degrees.pkl", "seam_cells_degrees.pkl", "hypodermis_degrees.pkl"]:
    with open(file, "rb") as f:
        degrees = pickle.load(f)

    results = report_degree_tail(degrees)
    print(file, results["summary"])
    

# %%
