#!/usr/bin/env python3
# -*- coding: utf-8 -*-
"""
Created on Wed Oct 15 10:59:22 2025

Time comparison CFCP vs Hoyer and GSP 

Line 495   y = torch.randn or rand to set Gaussian or Uniform

Constraint l 

@author: Anonymous
"""

import time
import argparse
import numpy as np
import torch
import matplotlib.pyplot as plt
#import math

import os
os.makedirs('./Vector_Plots', exist_ok=True)

EPS = 1e-10

def l2(x):
    return torch.sqrt((x * x).sum() + EPS)

def hoyer_H(v):
    l1 = v.abs().sum()
    l2n = l2(v)
    return float((l1 / l2n) ** 2)





# ----------------------------------------------------------------
#   x = argmin ||x - v||_2  s.t. x >= 0, sum(x) = s
#   u = sort(v, desc), cs = cumsum(u)
#   rho = max { j : u_j > (cs_j - s)/j }
#   tau = (cs_rho - s)/rho
#   x = max(v - tau, 0)
# ----------------------------------------------------------------
def proj_simplex_condat_sorted(v: torch.Tensor, s: float) -> torch.Tensor:
    assert v.dim() == 1, "v must be 1D"
    device, dtype = v.device, v.dtype
    n = v.numel()
    if n == 0:
        return v
    if s <= 0:
        return torch.zeros_like(v)

    u, _ = torch.sort(v, descending=True)
    cssv = torch.cumsum(u, dim=0) - s
    j = torch.arange(1, n + 1, device=device, dtype=dtype)
    cond = u > (cssv / j)
    if not torch.any(cond):
        return torch.zeros_like(v)

    rho = torch.nonzero(cond, as_tuple=False)[-1].item() + 1  # index 1-based
    tau = cssv[rho - 1] / rho
    w = torch.clamp(v - tau, min=0.0)
    sw = w.sum()
    if sw > 0:
        w = w * (s / sw)
    return w


# ===============================================================
# Hoyer 'projfunc' (2004) — PyTorch port with Condat simplex init
# ===============================================================
def projfunc_torch(s: torch.Tensor, k1: float, k2: float, nn: bool):
    """
    PyTorch port of Patrik O. Hoyer's 'projfunc' (2004),
    modified with Condat simplex projection as initialization:

        v = proj_simplex_condat_sorted(s, k1)

    Constraints:
        sum(abs(v)) = k1
        sum(v^2)    = k2
        nn=True  -> v >= 0 (non-negativity)

    Returns:
        v (tensor), usediters (int)
    """
    assert s.dim() == 1, "s must be a 1D tensor"
    device = s.device
    dtype  = s.dtype
    N      = s.numel()

    # If non-negativity flag not set, record signs and take abs
    if not nn:
        isneg = s < 0
        s = s.abs()
    else:
        isneg = None
    v = proj_simplex_condat_sorted(s, float(k1))

    zerocoeff = torch.zeros(N, dtype=torch.bool, device=device)  # 
    j = 0

    while True:
        # Active set
        active_count = int((~zerocoeff).sum().item())
        if active_count <= 0:
            v = torch.zeros_like(v)
            if N > 0:
                idx = torch.argmax(s.abs())
                v[idx] = k1
            usediters = j + 1
            break

        midpoint_val = k1 / active_count
        midpoint = torch.where(
            zerocoeff,
            torch.zeros((), dtype=dtype, device=device),
            torch.tensor(midpoint_val, dtype=dtype, device=device)
        )

        w = v - midpoint

        a = (w * w).sum()
        b = 2.0 * (w * v).sum()
        c = (v * v).sum() - k2

        # alphap = (-b + sqrt(b^2 - 4ac)) / (2a)
        if float(a.abs()) <= 1e-20:
            alphap = torch.zeros((), dtype=dtype, device=device)
        else:
            disc = (b * b - 4.0 * a * c).clamp_min(0.0)
            sqrt_disc = torch.sqrt(disc)
            alphap = (-b + sqrt_disc) / (2.0 * a + torch.finfo(dtype).eps)

        v = alphap * w + v 

        if torch.all(v >= 0):
            usediters = j + 1
            break

        j += 1
        neg_mask = v <= 0
        zerocoeff = zerocoeff | neg_mask
        v = torch.where(neg_mask, torch.zeros_like(v), v)

        active_count = int((~zerocoeff).sum().item())
        if active_count <= 0:
            v = torch.zeros_like(v)
            if N > 0:
                idx = torch.argmax(s.abs())
                v[idx] = k1
            usediters = j
            break


        vp = proj_simplex_condat_sorted(v, float(k1))
        shift = vp / active_count
        
        #tempsum = v.sum()
        #shift = (k1 - tempsum) / active_count
        v = vp + shift
        v = torch.where(zerocoeff, torch.zeros_like(v), v)

    if not nn:
        sign = torch.where(
            isneg,
            torch.tensor(-1.0, dtype=dtype, device=device),
            torch.tensor(1.0,  dtype=dtype, device=device),
        )
        v = v * sign
        
          
             

    return v, usediters


# ----------------------------------------------------------------
# HOYER
# ----------------------------------------------------------------
def hoyer_projection(y: torch.Tensor, l: float,
                              tol: float = 1e-7, max_iter: int = 200,
                              restore_sign: bool = True):
    """Wrapper that delegates to Hoyer's 'projfunc_torch' (Matlab original)
    to match 'Bench-original-true.py'. We compute k1 = sqrt(l)*||y||_2 and
    k2 = ||y||_2^2, with nn=False to preserve/restore signs like the Matlab code.

    Returns: (x, usediters)
    """
    assert y.dim() == 1
    # Parameters per Bench-original-true.py
    k2 = float((y * y).sum().item())
    k1 = float(l**0.5) * float(l2(y).item())
    x, usediters = projfunc_torch(y.clone(), k1=k1, k2=k2, nn=False)
    return x, usediters

# ----------------------------------------------------------------
# HYBRID NEWTON-BISECTION METHOD (from GSP)
# ----------------------------------------------------------------
def hybrid_newton_bisection_with_iters(y: torch.Tensor, l: float, precision: float = 1e-6, linrat: float = 0.9, max_iter: int = 100):
    """
    Hybrid Newton-Bisection method for Hoyer sparsity projection.
    
    Uses Newton's method with bisection fallback to solve for the Lagrange multiplier mu
    that enforces the sparsity constraint.
    
    Args:
        y: Input vector (1D tensor)
        l: Target Hoyer sparsity level (1 = maximally sparse, n = dense)
        precision: Convergence tolerance
        linrat: Linear rate guarantee parameter
        max_iter: Maximum iterations
        
    Returns:
        (x, iters): Projected vector and number of iterations
    """
    assert y.dim() == 1
    device, dtype = y.device, y.dtype
    n = float(y.numel())
    
    epsilon = 1e-15
    
    # Handle signs
    sgn = torch.sign(y)
    pos_vector = y.abs()
    
    # Clamp l to valid range [1, n)
    l = max(1.0, min(float(l), n - 1.0))
    
    # Convert Hoyer level l to GSP sparsity parameter sps
    # GSP: sps = (sqrt(n) - L1/L2) / (sqrt(n) - 1), where 0=dense, 1=sparse
    # Hoyer: H = (L1/L2)^2, where 1=sparse, n=dense
    # Target L1/L2 = sqrt(l)
    # Therefore: sps = (sqrt(n) - sqrt(l)) / (sqrt(n) - 1)
    sqrt_n = np.sqrt(n)
    sqrt_l = np.sqrt(float(l))
    sps = (sqrt_n - sqrt_l) / (sqrt_n - 1.0)
    
    # GSP formulation parameters
    betai = 1.0 / (sqrt_n - 1.0)
    r = 1  # Single vector
    
    # Target k for GSP method
    k = r * sqrt_n / (sqrt_n - 1.0) - r * sps
    
    # Check critical values
    max_val = pos_vector.max()
    muup0 = float(max_val * (sqrt_n - 1.0))
    
    # Define gmu function (compute sparsity measure as in GSP)
    def gmu_1d(vec, mu):
        # Project: x = [vec - mu*beta]+
        xp = torch.clamp(vec - mu * betai, min=0.0)
        
        # L2 norm
        norm_xp = torch.norm(xp, p=2)
        
        if norm_xp > epsilon:
            # Normalized vector
            xp_normalized = xp / norm_xp
            nip = (xp > 0).sum().float()
            
            # Gradient computation
            sum_xp_norm = xp_normalized.sum()
            term1 = -nip / norm_xp
            term2 = (xp.sum()) ** 2 / (norm_xp ** 3)
            gradg = (betai ** 2) * (term1 + term2)
            
            # Sparsity measure vgmu = beta * sum(xp_normalized)
            vgmu = betai * sum_xp_norm
        else:
            # If all zeros, set max element to 1
            xp_normalized = torch.zeros_like(xp)
            max_idx = torch.argmax(vec)
            xp_normalized[max_idx] = 1.0
            xp = xp_normalized.clone()
            
            vgmu = betai
            gradg = torch.tensor(0.0, device=device, dtype=dtype)
        
        return vgmu, xp, gradg
    
    # Initial evaluation at mu=0
    vgmu, xp, gradg = gmu_1d(pos_vector, 0.0)
    
    # Check if already at target sparsity
    if vgmu < k:
        # Already sparse enough - no projection needed
        return y.clone(), 0
    
    # Initialize bisection bounds
    mulow = 0.0
    muup = muup0
    glow = vgmu
    
    # Start with mu=0
    newmu = 0.0
    gnew = glow
    gpnew = gradg
    delta = muup - mulow
    
    numiter = 0
    
    # Main iteration loop
    while abs(gnew - k) > precision * r and numiter < max_iter:
        oldmu = newmu
        
        # Newton step
        newmu = oldmu + (k - gnew) / (gpnew + epsilon)
        
        # If Newton goes out of bounds, use bisection
        if newmu >= muup or newmu <= mulow:
            newmu = (mulow + muup) / 2.0
            
        # Evaluate at new mu
        gnew, xnew, gpnew = gmu_1d(pos_vector, newmu)
        
        # Update bounds
        if gnew < k:
            muup = newmu
        else:
            mulow = newmu
            
        # Guarantee linear convergence
        if (muup - mulow) > linrat * delta and abs(oldmu - newmu) < (1 - linrat) * delta:
            newmu = (mulow + muup) / 2.0
            gnew, xnew, gpnew = gmu_1d(pos_vector, newmu)
            
            if gnew < k:
                muup = newmu
            else:
                mulow = newmu
                
            numiter += 1
            
        numiter += 1
    
    # Final projection at converged mu
    _, xp_final, _ = gmu_1d(pos_vector, newmu)
    
    # Normalize the projected vector
    norm_xp_final = torch.norm(xp_final, p=2)
    if norm_xp_final > epsilon:
        xp_normalized = xp_final / norm_xp_final
    else:
        xp_normalized = xp_final
    
    # Scale to match original norm
    orig_norm = torch.norm(pos_vector, p=2)
    xp_scaled = xp_normalized * orig_norm
    
    # Restore signs
    x = xp_scaled * sgn
    
    # Final rescaling using inner product (as in GSP alpha calculation)
    alpha = (x * y).sum() / ((x * x).sum() + epsilon)
    x = alpha * x
    
    return x, numiter

# ----------------------------------------------------------------
# CFCP 
# ----------------------------------------------------------------
def cfcp(y: torch.Tensor, l: float, max_iter: int = 4, track_alpha: bool = False, track_active: bool = False):
    assert y.dim() == 1
    n = y.numel()
    sgn = torch.sign(y)
    x = y.abs().clone()
    
    l1 = x.sum()
    alpha = (l1 / n)
    
    #alpha = torch.tensor(1.0, device=y.device, dtype=y.dtype)
    
    x = torch.where(x >= alpha, x, torch.zeros_like(x))
    l_eff = float(max(1.0, min(float(l), float(n))))

    nu_prev = int((x > 0).sum().item())
    nu = nu_prev + 1
    loops = 0
    
    
    alpha_history = [] if track_alpha else None
    active_history = [] if track_active else None

    #while nu != nu_prev and loops < max_iter:
    while loops < max_iter:    
        loops += 1
        nu_prev = nu
        mask = (x > 0)
        nu = int(mask.sum().item())
        #nu=torch.count_nonzero(x)
        if track_active:
            active_history.append(nu)
        if nu == 0:
            return torch.zeros_like(y), loops

        x_active = x

        l1a = x_active.sum()
        
        l2a = (x_active * x_active).sum()
        
       
        Hx = (l1a*l1a / l2a)
        num = l_eff * (nu - Hx)
        den = Hx * (nu - l_eff) + EPS
        frac = (num / den)
        root = torch.sqrt(frac)

        alpha = (l1a / nu*(1.0 - root))
        #alpha = (l1a / nu)
        
        # Track alpha if requested
        if track_alpha:
            alpha_history.append(float(alpha.item()))

        x = torch.where(x >= alpha, x, torch.zeros_like(x))

    mask = (x > 0)
    nu = int(mask.sum().item())
    #nu=torch.count_nonzero(x)
    if track_active and (len(active_history) == 0 or active_history[-1] != nu):
        active_history.append(nu)
    
    
    
    if nu == 0:
        return torch.zeros_like(y), loops

    #x_active = x[mask]
    
    x_active=x
    l1a = x_active.sum()

    denom = (1.0 - (alpha * nu) / (l1a + EPS))
    #lam = 1.0 / denom if abs(float(denom)) > 1e-15 else torch.tensor(1.0, device=y.device, dtype=y.dtype)

    
    lam = 1.0 / denom
    
    d = torch.zeros_like(x)
    d_val = (l1a / max(nu, 1))
    d[mask] = d_val


    x = lam * x + (1.0 - lam) * d
    x = x * sgn
   
    
    if track_alpha or track_active:
        return x, loops, (alpha_history if track_alpha else None), (active_history if track_active else None), float(lam)
    return x, loops, float(lam)

# ----------------------------------------------------------------
# Plot alpha vs loop number
# ----------------------------------------------------------------
def plot_alpha_vs_loops(alpha_history, loops: int, l, n, save_path: str = None):
    
    print(30*'-')

    plt.figure(figsize=(10, 6))
    plt.plot(range(1, len(alpha_history) + 1), alpha_history, 'o-', linewidth=2, markersize=8)
    plt.xlabel('Loop Number', fontsize=14)
    plt.ylabel('Alpha Value', fontsize=14)
    plt.title(f'Alpha vs Loop Number (l={l}, n={n})', fontsize=16)
    plt.grid(True, alpha=0.3)
    plt.tight_layout()
    
    if save_path:
        plt.savefig(save_path, dpi=300, bbox_inches='tight')
        print(f"Plot saved to {save_path}")
    
    plt.show()
    
    print(f"Total loops: {loops}")
    print(f"Alpha values: {alpha_history}")
    print(30*'-')
    
    return alpha_history

# ----------------------------------------------------------------
# Benchmark vs CFCP
# ----------------------------------------------------------------
def bench_one_setting(n: int, l: float, rep: int, device: torch.device):
    t_hoyer, t_cfcp, t_hybrid = [], [], []
    it_hoyer, it_cfcploops, it_hybrid = [], [], []
    diff_hoyer_vs_cfcp, diff_hybrid_vs_cfcp = [], []
    rel_hoyer_vs_cfcp, rel_hybrid_vs_cfcp = [], []
    lambda_val = None

    for rep_idx in range(rep):
        y = torch.randn(n, device=device)

        # CFCP
        if device.type == "cuda": torch.cuda.synchronize()
        t0 = time.perf_counter()
        x_cfcp, itF, alpha_history, active_history, lambda_val = cfcp(y.clone(), l, track_alpha=True, track_active=True)
        if device.type == "cuda": torch.cuda.synchronize()
        t1 = time.perf_counter()
        t_cfcp.append((t1 - t0) * 1000.0)
        it_cfcploops.append(itF)
        norm_cfcp = torch.norm(x_cfcp, p=2).item() + EPS


        # Hoyer
        if device.type == "cuda": torch.cuda.synchronize()
        t0 = time.perf_counter()
        x_hoyer, itO = hoyer_projection(y.clone(), l)
        if device.type == "cuda": torch.cuda.synchronize()
        t1 = time.perf_counter()
        t_hoyer.append((t1 - t0) * 1000.0)
        it_hoyer.append(itO)

        # Hybrid Newton-Bisection
        if device.type == "cuda": torch.cuda.synchronize()
        t0 = time.perf_counter()
        x_hybrid, itH = hybrid_newton_bisection_with_iters(y.clone(), l)
        if device.type == "cuda": torch.cuda.synchronize()
        t1 = time.perf_counter()
        t_hybrid.append((t1 - t0) * 1000.0)
        it_hybrid.append(itH)

        # Erreurs vs CFCP
        dO = torch.norm(x_hoyer - x_cfcp, p=2).item()
        dH = torch.norm(x_hybrid - x_cfcp, p=2).item()
        diff_hoyer_vs_cfcp.append(dO)
        diff_hybrid_vs_cfcp.append(dH)
        rel_hoyer_vs_cfcp.append(dO / norm_cfcp)
        rel_hybrid_vs_cfcp.append(dH / norm_cfcp)

    def mean_std(a):
        a = np.asarray(a, dtype=float)
        mu = a.mean() if a.size else 0.0
        sd = a.std(ddof=1) if a.size > 1 else 0.0
        return float(mu), float(sd)

    out = {
        "time_hoyer": mean_std(t_hoyer),
        "time_cfcp": mean_std(t_cfcp),
        "time_hybrid": mean_std(t_hybrid),
        "iters_hoyer": float(np.mean(it_hoyer)),
        "loops_cfcp": float(np.mean(it_cfcploops)),
        "iters_hybrid": float(np.mean(it_hybrid)),
        "diff_hoyer_vs_cfcp": float(np.mean(diff_hoyer_vs_cfcp)),
        "diff_hybrid_vs_cfcp": float(np.mean(diff_hybrid_vs_cfcp)),
        "rel_hoyer_vs_cfcp": float(np.mean(rel_hoyer_vs_cfcp)),
        "rel_hybrid_vs_cfcp": float(np.mean(rel_hybrid_vs_cfcp)),
        # Histories from last repetition
        "alpha_history": alpha_history,
        "active_history": active_history,
        "lambda": lambda_val,
    }
    return out

def main():
    parser = argparse.ArgumentParser(description="Benchmark (Hoyer/Hybrid/CFCP) with Condat-simplex (sorted); errors vs CFCP.")
    parser.add_argument("--ns", type=int, nargs="+", default=[1000,2000,3000,4000,5000], help="Vector sizes.")
    parser.add_argument("--ls", type=float, nargs="+", default=[100,200], help="Hoyer levels l to test.")
    parser.add_argument("--rep", type=int, default=100, help="Repetitions per (n,l).")
    parser.add_argument("--seed", type=int, default=0, help="Random seed.")

    args = parser.parse_args()

    torch.manual_seed(args.seed)
    if torch.cuda.is_available():
        torch.cuda.manual_seed_all(args.seed)

    # device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
    device = torch.device("cpu")  # Force CPU for consistency
    print(f"Device: {device}\nns={args.ns}\nls={args.ls}\nrep={args.rep}\n")

    all_results = {}
    for l in args.ls:
        print(f"=== l = {l} ===")
        rows = []
        for n in args.ns:
            res = bench_one_setting(n, l, args.rep, device)
            rows.append((n, res))
            print(
                f"\nn={n:5d} | "
                f"\nHoyer {res['time_hoyer'][0]:.2f}±{res['time_hoyer'][1]:.2f} ms | "
                f"\nCFCP {res['time_cfcp'][0]:.2f}±{res['time_cfcp'][1]:.2f} ms | "
                f"\nHybrid {res['time_hybrid'][0]:.2f}±{res['time_hybrid'][1]:.2f} ms | "
                f"\nIters: Hoyer={res['iters_hoyer']:.2f}, CFCPLoops={res['loops_cfcp']:.2f}, Hybrid={res['iters_hybrid']:.2f} | "
                f"\nErr vs CFCP: diff(Hoyer)={res['diff_hoyer_vs_cfcp']:.3e}, diff(Hybrid)={res['diff_hybrid_vs_cfcp']:.3e}, "
                f"\nrel(Hoyer)={res['rel_hoyer_vs_cfcp']:.3e}, rel(Hybrid)={res['rel_hybrid_vs_cfcp']:.3e} | "
                f"\nLambda: {res['lambda']:.6f}"
            )
        all_results[l] = rows
        
        # Generate combined alpha vs loops plot for this l value
        plt.figure()
        for n, res in rows:
            alpha_hist = res.get('alpha_history', [])
            if alpha_hist:
                plt.plot(range(1, len(alpha_hist) + 1), alpha_hist, 'o-', linewidth=2, markersize=6, label=f'n={n}')
        plt.xlabel('Loop Number', fontsize=14)
        plt.ylabel('alpha ', fontsize=14)
        plt.title(f'Threshold vs Loop Number for l={l} (all n values)', fontsize=16)
        plt.grid(True, alpha=0.3)
        plt.legend()
        plt.tight_layout()
        
        save_path = f"./Vector_Plots/alpha_vs_loops_l{int(l)}_combined.png"
        plt.savefig(save_path, dpi=300, bbox_inches='tight')
        print(f"Combined alpha plot saved to {save_path}")
        plt.show()
        plt.close()
        
        # Generate combined active-set size vs loops plot for this l value
        plt.figure()
        for n, res in rows:
            active_hist = res.get('active_history', [])
            if active_hist:
                plt.plot(range(1, len(active_hist) + 1), active_hist, 's-', linewidth=2, markersize=6, label=f'n={n}')
        plt.xlabel('Loop Number', fontsize=14)
        plt.ylabel('Active set size (nu)', fontsize=14)
        plt.title(f'Active Set Size vs Loop Number for l={l} (all n values)', fontsize=16)
        plt.grid(True, alpha=0.3)
        plt.legend()
        plt.tight_layout()
        save_path = f"./Vector_Plots/active_vs_loops_l{int(l)}_combined.png"
        plt.savefig(save_path, dpi=300, bbox_inches='tight')
        print(f"Combined active-set plot saved to {save_path}")
        plt.show()
        plt.close()

        print()
    for l, rows in all_results.items():
        ns = [r[0] for r in rows]
        th = [r[1]["time_hoyer"][0] for r in rows]
        tc = [r[1]["time_cfcp"][0] for r in rows]
        thy = [r[1]["time_hybrid"][0] for r in rows]
        plt.plot(ns, th, marker="^", label=f"Hoyer (l={int(l)})")
        plt.plot(ns, tc, marker="o", label=f"CFCP (l={int(l)})")
        plt.plot(ns, thy, marker="d", label=f"Hybrid (l={int(l)})")
    plt.xlabel("Vector length n"); plt.ylabel("Avg time (ms)")
    plt.title("Time vs n (Gaussian Distribution)")
    plt.grid(True, linestyle="--", linewidth=0.5); plt.legend(); plt.tight_layout(); plt.show(); plt.savefig('./Vector_Plots/time_vs_n.png')

    plt.figure()
    for l, rows in all_results.items():
        ns = [r[0] for r in rows]
        ih = [r[1]["iters_hoyer"] for r in rows]
        lc = [r[1]["loops_cfcp"] for r in rows]
        ihy = [r[1]["iters_hybrid"] for r in rows]
        plt.plot(ns, ih, marker="^", label=f"Hoyer iters (l={int(l)})")
        plt.plot(ns, lc, marker="o", label=f"CFCP loops (l={int(l)})")
        plt.plot(ns, ihy, marker="d", label=f"Hybrid iters (l={int(l)})")
    plt.xlabel("Vector length n"); plt.ylabel("Avg iterations / loops")
    plt.title("Iteration and loops counts vs n (Uniform distribution)")
    plt.grid(True, linestyle="--", linewidth=0.5); plt.legend(); plt.tight_layout(); plt.show(); plt.savefig('./Vector_Plots/iters_loops_vs_n.png')

    plt.figure(figsize=(8,6))
    for l, rows in all_results.items():
        ns = [r[0] for r in rows]
        dH = [r[1]["diff_hoyer_vs_cfcp"] for r in rows]
        dHy = [r[1]["diff_hybrid_vs_cfcp"] for r in rows]
        plt.plot(ns, dH, marker="^", label=f"‖Hoyer − CFCP‖₂ (l={int(l)})")
        plt.plot(ns, dHy, marker="d", label=f"‖Hybrid − CFCP‖₂ (l={int(l)})")
    plt.xlabel("Vector length n"); plt.ylabel("L2 difference")
    plt.title(f"L2 Difference vs CFCP (rep={args.rep})")
    plt.grid(True, linestyle="--", linewidth=0.5); plt.legend(); plt.tight_layout(); plt.show(); plt.savefig('./Vector_Plots/l2_diff_vs_n.png')

    plt.figure()
    for l, rows in all_results.items():
        ns = [r[0] for r in rows]
        rH = [r[1]["rel_hoyer_vs_cfcp"] for r in rows]
        rHy = [r[1]["rel_hybrid_vs_cfcp"] for r in rows]
        plt.plot(ns, rH, marker="^", label=f"RelErr(Hoyer vs CFCP) (l={int(l)})")
        plt.plot(ns, rHy, marker="d", label=f"RelErr(Hybrid vs CFCP) (l={int(l)})")
    plt.xlabel("Vector length n"); plt.ylabel("Relative $ \ell_2$ error $ \%$")
    plt.title(f"Relative Error CFCP vs Hoyer (rep={args.rep})")
    plt.grid(True, linestyle="--", linewidth=0.5); plt.legend(); plt.tight_layout(); plt.show(); plt.savefig('./Vector_Plots/rel_err_vs_n.png')


if __name__ == "__main__":
    
    main()
