# -*- coding: utf-8 -*-

!pip install kaggle

#@title Authentication on Kaggle
import os
from google.colab import files

# 1. This will create a button. Click it and select 'kaggle.json' from your Downloads.
print("Please upload the kaggle.json file from your Downloads folder...")
uploaded = files.upload()

# 2. Move the file to the correct directory
!mkdir -p ~/.kaggle
!cp kaggle.json ~/.kaggle/
!chmod 600 ~/.kaggle/kaggle.json

# 3. Now the download command should work
print("\nAuthentication successful. Downloading dataset...")

#@title Data Load

!kaggle competitions download -c pkdd-15-predict-taxi-service-trajectory-i
!unzip -o pkdd-15-predict-taxi-service-trajectory-i.zip

#@title Uncompress

!unzip -o train.csv.zip
!unzip -o test.csv.zip

#@title Conformal Check -- Setup

import pandas as pd
import ast
import numpy as np
import random
from scipy.cluster.vq import kmeans2
from scipy.optimize import linprog
from scipy.sparse import coo_matrix, vstack
from collections import Counter

# ==========================================
# 1. Config & Data Loading
# ==========================================
AIRPORT = (41.242, -8.678)
CENTER = (41.147, -8.611)
N_GRID = 100
MIN_LON, MAX_LON = -8.69, -8.57
MIN_LAT, MAX_LAT = 41.14, 41.25

def to_grid(lon, lat):
    x = int((lon - MIN_LON) / (MAX_LON - MIN_LON) * N_GRID)
    y = int((lat - MIN_LAT) / (MAX_LAT - MIN_LAT) * N_GRID)
    return x, y

def get_airport_trip(polyline_str):
    try:
        # Quick string check
        if "41.24" not in polyline_str: return None
        points = ast.literal_eval(polyline_str)
        if len(points) < 20: return None
        # Start: Airport
        if (points[0][1] - AIRPORT[0])**2 + (points[0][0] - AIRPORT[1])**2 > 0.02**2: return None
        # End: Center
        if (points[-1][1] - CENTER[0])**2 + (points[-1][0] - CENTER[1])**2 > 0.02**2: return None
        return points
    except: return None

print("Scanning for Airport->Center traces...")
raw_traces = []
target_load = 1000  # Need enough for train/test splitting

# Note: Assuming train.csv is present in the environment
try:
    for chunk in pd.read_csv('train.csv', usecols=['POLYLINE'], chunksize=50000):
        for poly in chunk['POLYLINE']:
            trace = get_airport_trip(poly)
            if trace: raw_traces.append(trace)
        if len(raw_traces) >= target_load: break
except FileNotFoundError:
    print("Error: 'train.csv' not found. Please ensure the dataset is downloaded.")
    # Create dummy data for code verification if file missing
    raw_traces = [[(AIRPORT[1], AIRPORT[0]), (CENTER[1], CENTER[0])] for _ in range(100)]

print(f"Loaded {len(raw_traces)} traces.")

# ==========================================
# 2. Mode Separation & Splitting
# ==========================================
midpoints = np.array([t[len(t)//2] for t in raw_traces])
if len(midpoints) > 2:
    centroids, labels = kmeans2(midpoints, 2, minit='points')

    # Identify Highway vs Urban
    p1, p2 = np.array([AIRPORT[1], AIRPORT[0]]), np.array([CENTER[1], CENTER[0]])
    dists = [np.abs(np.cross(p2-p1, p1-c))/np.linalg.norm(p2-p1) for c in centroids]
    idx_hwy = np.argmax(dists)
    idx_urb = 1 - idx_hwy

    highway_pool = [raw_traces[i] for i in range(len(raw_traces)) if labels[i] == idx_hwy]
    urban_pool = [raw_traces[i] for i in range(len(raw_traces)) if labels[i] == idx_urb]
else:
    # Fallback for dummy data
    highway_pool = raw_traces[:len(raw_traces)//2]
    urban_pool = raw_traces[len(raw_traces)//2:]

# Setup: 40/60 Split for Train and Test
n_hwy = 40
n_urb = 60

# Duplicate if insufficient data
if len(highway_pool) < 2*n_hwy: highway_pool = highway_pool * (2*n_hwy // len(highway_pool) + 1)
if len(urban_pool) < 2*n_urb: urban_pool = urban_pool * (2*n_urb // len(urban_pool) + 1)

random.seed(42)
# Sample Train
train_hwy = random.sample(highway_pool, n_hwy)
train_urb = random.sample(urban_pool, n_urb)
train_traces = train_hwy + train_urb

# Remove selected to ensure disjoint test set
rem_hwy = [t for t in highway_pool if t not in train_hwy]
rem_urb = [t for t in urban_pool if t not in train_urb]

# Sample Test (Duplicating remainder if needed to fill test set)
if len(rem_hwy) < n_hwy: rem_hwy = rem_hwy * (n_hwy // len(rem_hwy) + 1)
if len(rem_urb) < n_urb: rem_urb = rem_urb * (n_urb // len(rem_urb) + 1)

test_hwy = random.sample(rem_hwy, n_hwy)
test_urb = random.sample(rem_urb, n_urb)
test_traces = test_hwy + test_urb

print(f"Train Set: {len(train_traces)} (40 Hwy / 60 Urb)")
print(f"Test Set:  {len(test_traces)}  (40 Hwy / 60 Urb)")


# ==========================================
# 3. Discretization
# ==========================================
def discretize(traces):
    hedges = []
    for t in traces:
        pset = set()
        for lon, lat in t:
            gx, gy = to_grid(lon, lat)
            if 0<=gx<N_GRID and 0<=gy<N_GRID: pset.add((gx,gy))
        if len(pset)>0: hedges.append(list(pset))
    return hedges

train_hyperedges = discretize(train_traces)
test_hyperedges = discretize(test_traces)

# ==========================================
# 4. Solvers & Pre-computation
# ==========================================

# LP Solver Definition
def solve_lp(hyperedges, tau_con):
    unique = set(c for h in hyperedges for c in h)
    items = list(unique)
    imap = {c: i for i, c in enumerate(items)}
    n_i, n_p = len(items), len(hyperedges)

    c = np.concatenate([np.ones(n_i), np.zeros(n_p)])

    rows, cols, data = [0]*n_p, list(range(n_i, n_i+n_p)), [-1.0]*n_p
    A_cov = coo_matrix((data, (rows, cols)), shape=(1, n_i+n_p))
    b_cov = [-tau_con * n_p]

    p_rows, p_cols, p_data = [], [], []
    curr = 0
    for pid, h in enumerate(hyperedges):
        for item in h:
            p_rows.extend([curr, curr])
            p_cols.extend([n_i+pid, imap[item]])
            p_data.extend([1.0, -1.0])
            curr += 1

    A_path = coo_matrix((p_data, (p_rows, p_cols)), shape=(curr, n_i+n_p))
    b_path = np.zeros(curr)

    A_ub = vstack([A_cov, A_path])
    b_ub = np.concatenate([b_cov, b_path])

    # Solve
    res = linprog(c, A_ub=A_ub, b_ub=b_ub, bounds=(0,1), method='highs')

    # Return just the z variables (the last n_p variables)
    # The x variables (n_i) are the first ones.
    if res.success:
        return res.x[n_i:]
    else:
        return np.zeros(n_p)

# Pre-calculate Greedy Ranking (Frequency on Train Set)
train_counts = Counter(c for h in train_hyperedges for c in h)
greedy_order = [c for c, _ in train_counts.most_common()]

#@title Conformal Check Run

import matplotlib.pyplot as plt
import numpy as np
from collections import Counter, defaultdict
from scipy.optimize import linprog
from scipy.sparse import coo_matrix, vstack

# ==========================================
# 1. New Solver: Returns x (Cell Weights)
# ==========================================

def solve_lp2(hyperedges, tau_con):
    """
    Solves the LP relaxation and returns the x variables (cell weights).
    Returns: dict {cell: weight}
    """
    # 1. Identify Universe
    unique = set(c for h in hyperedges for c in h)
    items = sorted(list(unique)) # Sort for determinism
    imap = {c: i for i, c in enumerate(items)}

    n_i = len(items)       # Number of items (cells)
    n_p = len(hyperedges)  # Number of paths (hyperedges)

    # 2. Setup LP
    # Variables: [x_0 ... x_{ni-1}, z_0 ... z_{np-1}]
    # Objective: Minimize sum(x)
    c = np.concatenate([np.ones(n_i), np.zeros(n_p)])

    # Constraint 1: Coverage -> sum(z) >= tau * N  => -sum(z) <= -tau * N
    rows = [0] * n_p
    cols = list(range(n_i, n_i + n_p)) # Indices of z variables
    data = [-1.0] * n_p
    A_cov = coo_matrix((data, (rows, cols)), shape=(1, n_i + n_p))
    b_cov = [-tau_con * n_p]

    # Constraint 2: Consistency -> z_j <= x_i  =>  z_j - x_i <= 0
    p_rows, p_cols, p_data = [], [], []
    curr_row = 0

    for pid, h in enumerate(hyperedges):
        for item in h:
            # z_pid - x_item <= 0
            p_rows.append(curr_row)
            p_cols.append(n_i + pid)
            p_data.append(1.0)

            p_rows.append(curr_row)
            p_cols.append(imap[item])
            p_data.append(-1.0)

            curr_row += 1

    A_path = coo_matrix((p_data, (p_rows, p_cols)), shape=(curr_row, n_i + n_p))
    b_path = np.zeros(curr_row)

    # Stack constraints
    A_ub = vstack([A_cov, A_path])
    b_ub = np.concatenate([b_cov, b_path])

    # 3. Solve
    res = linprog(c, A_ub=A_ub, b_ub=b_ub, bounds=(0, 1), method='highs')

    # 4. Extract Results
    weights = {}
    if res.success:
        x_vals = res.x[:n_i]
        for idx, val in enumerate(x_vals):
            weights[items[idx]] = val
    else:
        for item in items: weights[item] = 0.0

    return weights

# ==========================================
# 2. Helper Functions
# ==========================================

def calc_coverage_cells(selected_cells, hyperedges):
    if not hyperedges: return 0.0
    selected_set = set(selected_cells)
    covered = 0
    for h in hyperedges:
        if set(h).issubset(selected_set):
            covered += 1
    return covered / len(hyperedges)

def get_cells_for_target_coverage(sorted_cells, hyperedges_to_cover, target_tau):
    """
    Greedy addition: Adds cells from sorted list until target_tau is reached.
    """
    selected = set()
    if target_tau <= 0: return 0

    # Optimization: Pre-convert hyperedges to sets
    hyperedges_sets = [set(h) for h in hyperedges_to_cover]
    total_h = len(hyperedges_to_cover)

    for i, cell in enumerate(sorted_cells):
        selected.add(cell)

        # Check coverage
        covered = 0
        for h_set in hyperedges_sets:
            if h_set.issubset(selected):
                covered += 1

        if (covered / total_h) >= target_tau:
            return i + 1

    return len(sorted_cells)

# ==========================================
# 3. Setup Universe & Greedy Order
# ==========================================

all_cells_list = sorted(list(set(cell for h in train_hyperedges for cell in h)))

train_counts = Counter(cell for h in train_hyperedges for cell in h)
greedy_order = sorted(all_cells_list, key=lambda x: train_counts[x], reverse=True)

# ==========================================
# 4. Pre-calculate LP Subgraphs (tau_p)
# ==========================================
tau_ps = np.arange(0.1, 1.01, 0.1)
lp_cache = []

print("Pre-calculating LP solutions for tau_p range...")

for tp in tau_ps:
    # 1. Solve LP (Get x weights directly)
    cell_weights = solve_lp2(train_hyperedges, tp)

    # 2. Filter non-zero cells for the subgraph
    subgraph_cells_weighted = []
    for cell, w in cell_weights.items():
        if w > 1e-5:
            subgraph_cells_weighted.append((cell, w))

    # 3. Calculate max possible Test coverage for this subgraph
    if subgraph_cells_weighted:
        full_set = {c for c, w in subgraph_cells_weighted}
        test_cov_max = calc_coverage_cells(full_set, test_hyperedges)
    else:
        test_cov_max = 0.0

    lp_cache.append({
        'tau_p': tp,
        'weighted_cells': subgraph_cells_weighted,
        'max_test_coverage': test_cov_max
    })

# ==========================================
# 5. Main Evaluation Loop
# ==========================================
eval_taus = [0.1, 0.15, 0.2, 0.25, 0.3, 0.35,0.4,0.45,0.5]

greedy_budgets = []
lp_budgets = []

print(f"{'Target Tau':<12} | {'Greedy':<10} | {'LP':<10} | {'Chosen Tp':<10}")
print("-" * 50)

test_h_sets = [set(h) for h in test_hyperedges]
total_test = len(test_h_sets)

for tau in eval_taus:
    # --- A. Greedy Strategy ---
    n_greedy = get_cells_for_target_coverage(greedy_order, test_hyperedges, tau)
    greedy_budgets.append(n_greedy)

    # --- B. LP Strategy (with Pruning and Expansion) ---

    # 1. Find smallest tau_p with sufficient coverage potential
    selected_candidate = None
    for candidate in lp_cache:
        if candidate['max_test_coverage'] >= tau:
            selected_candidate = candidate
            break

    if selected_candidate is None:
        # CASE B: Even the max LP subgraph is not enough.
        # Strategy: Take the biggest LP subgraph (tau_p=1.0) and fill gaps with Greedy.

        # Use the last candidate (usually tau_p=1.0)
        best_lp = lp_cache[-1]
        tp_str = f"{best_lp['tau_p']:.1f}+"

        # Start with all LP cells
        active_set = {c for c, w in best_lp['weighted_cells']}
        base_count = len(active_set)

        # Identify missing cells from the universe
        missing_cells = [c for c in greedy_order if c not in active_set]

        # Greedily add missing cells until coverage met
        needed_extra = 0
        current_cov = calc_coverage_cells(active_set, test_hyperedges)

        # If even base set < tau (which it is, since we are in this block)
        for cell in missing_cells:
            active_set.add(cell)
            needed_extra += 1
            if calc_coverage_cells(active_set, test_hyperedges) >= tau:
                break

        n_lp = base_count + needed_extra

    else:
        # CASE A: We found a tau_p that covers enough.
        # Strategy: Prune the smallest x values.
        tp_str = f"{selected_candidate['tau_p']:.1f}"

        cells_to_process = list(selected_candidate['weighted_cells'])

        # Sort by Weight ASCENDING (Remove smallest x first)
        cells_to_process.sort(key=lambda x: x[1])

        active_set = {c for c, w in cells_to_process}

        # Pruning Loop
        for cell, weight in cells_to_process:
            # Temporarily remove
            active_set.remove(cell)

            # Efficient Coverage Check
            covered = 0
            for h_set in test_h_sets:
                if h_set.issubset(active_set):
                    covered += 1

            # If coverage drops below target, put it back
            if (covered / total_test) < tau:
                active_set.add(cell)

        n_lp = len(active_set)

    lp_budgets.append(n_lp)
    print(f"{tau:<12.2f} | {n_greedy:<10} | {n_lp:<10} | {tp_str:<10}")

# ==========================================
# 6. Visualization
# ==========================================
fig, ax = plt.subplots(figsize=(8, 5))

ax.plot(eval_taus, lp_budgets, marker='o', markersize=8, linewidth=2.5,
        label='LP (Adaptive)', color='royalblue', linestyle='-')

ax.plot(eval_taus, greedy_budgets, marker='s', markersize=8, linewidth=2.5,
        label='Greedy (Static)', color='firebrick', linestyle='--')

ax.set_xlabel(r'Target Test Coverage ($\phi$)', fontsize=12)
ax.set_ylabel('Number of Edges Required', fontsize=12)
ax.set_title('Efficiency: Edges Required for Target Coverage', fontsize=14)

ax.set_xticks(eval_taus)
ax.grid(True, linestyle='--', alpha=0.6)
ax.legend(fontsize=11)

plt.tight_layout()
plt.show()

#@title Multiple Runs + Reverse Greedy

# ==========================================
# 3. Main Experiment Loop (Multiple Runs)
# ==========================================

import numpy as np
import matplotlib.pyplot as plt
import random
from collections import Counter

# Helper for coverage calculation
def calc_cov_simple(active_set, target_sets):
    if not target_sets: return 0.0
    count = sum(1 for h in target_sets if h.issubset(active_set))
    return count / len(target_sets)

N_RUNS = 10
eval_taus = [0.1, 0.15, 0.2, 0.25, 0.3, 0.35, 0.4, 0.45, 0.5]
tau_ps = np.arange(0.1, 1.01, 0.1)

# Storage: (run, tau_index)
all_greedy_budgets = np.zeros((N_RUNS, len(eval_taus)))
all_rev_greedy_budgets = np.zeros((N_RUNS, len(eval_taus))) # New
all_lp_budgets = np.zeros((N_RUNS, len(eval_taus)))

print(f"Starting {N_RUNS} runs...")

for run_idx in range(N_RUNS):
    # Determine seed
    current_seed = 42 + run_idx
    random.seed(current_seed)
    np.random.seed(current_seed)

    # --- Split Data (Safe) ---
    # Sampling Train
    # Ensure pools are sufficient
    def safe_sample(pool, k):
        if not pool: return []
        if len(pool) < k: pool = pool * (k // len(pool) + 1)
        return random.sample(pool, k)

    train_hwy = safe_sample(highway_pool, n_hwy)
    train_urb = safe_sample(urban_pool, n_urb)
    train_traces = train_hwy + train_urb

    # Remove selected to ensure disjoint test set
    # Using object identity/string repr to filter
    train_ids = {str(t) for t in train_traces}
    rem_hwy = [t for t in highway_pool if str(t) not in train_ids]
    rem_urb = [t for t in urban_pool if str(t) not in train_ids]

    # Safety check for empty remainder (Fixes Division by Zero)
    if not rem_hwy: rem_hwy = list(highway_pool)
    if not rem_urb: rem_urb = list(urban_pool)

    test_hwy = safe_sample(rem_hwy, n_hwy)
    test_urb = safe_sample(rem_urb, n_urb)
    test_traces = test_hwy + test_urb

    # Discretize
    train_hyperedges = discretize(train_traces)
    test_hyperedges = discretize(test_traces)

    # Pre-compute Sets for fast coverage check
    train_h_sets = [set(h) for h in train_hyperedges]
    test_h_sets = [set(h) for h in test_hyperedges]
    total_test = len(test_h_sets)

    # Setup Universe & Greedy Order (Train Only)
    all_cells_list = sorted(list(set(cell for h in train_hyperedges for cell in h)))
    train_counts = Counter(cell for h in train_hyperedges for cell in h)
    greedy_order = sorted(all_cells_list, key=lambda x: train_counts[x], reverse=True)

    # --- Pre-calculate LP Subgraphs (tau_p) ---
    lp_cache = []

    for tp in tau_ps:
        cell_weights = solve_lp2(train_hyperedges, tp)

        subgraph_cells_weighted = []
        for cell, w in cell_weights.items():
            if w > 1e-5:
                subgraph_cells_weighted.append((cell, w))

        if subgraph_cells_weighted:
            full_set = {c for c, w in subgraph_cells_weighted}
            test_cov_max = calc_cov_simple(full_set, test_h_sets)
        else:
            test_cov_max = 0.0

        lp_cache.append({
            'tau_p': tp,
            'weighted_cells': subgraph_cells_weighted,
            'max_test_coverage': test_cov_max
        })

    # --- Evaluate Taus ---
    run_greedy = []
    run_rev = []
    run_lp = []

    print(f"Run {run_idx+1}/{N_RUNS} processing...", end='\r')

    for tau in eval_taus:
        # A. Forward Greedy
        # Re-implement inline for safety/speed
        sel = set()
        for c in greedy_order:
            sel.add(c)
            if calc_cov_simple(sel, test_h_sets) >= tau: break
        run_greedy.append(len(sel))

        # B. Reverse Greedy (Adaptive)
        active = set(all_cells_list)
        locked = set()

        while True:
            # 1. Identify currently covered TRAIN paths
            covered_indices = [i for i, h in enumerate(train_h_sets) if h.issubset(active)]

            # 2. Count usage in covered TRAIN paths
            counts = Counter()
            for i in covered_indices:
                for c in train_h_sets[i]:
                    if c in active: counts[c] += 1

            # 3. Sort Candidates ASC (Least used in Train)
            candidates = [c for c in active if c not in locked]
            if not candidates: break

            # Optimization: batch remove 0-counts
            zero_counts = [c for c in candidates if counts[c] == 0]
            if zero_counts:
                for c in zero_counts: active.remove(c)
                # Must re-check constraint after batch removal?
                # Yes, but 0-count edges don't support TRAIN paths. They might support TEST paths.
                # To be safe, we check test constraint.
                ncov = sum(1 for h in test_h_sets if h.issubset(active))
                if ncov/total_test < tau:
                    # Revert is hard for batch. Let's do standard loop for safety.
                    for c in zero_counts: active.add(c)
                else:
                    continue # Valid batch removal, recalculate

            candidates.sort(key=lambda c: counts[c])

            removed_any = False
            for c in candidates:
                active.remove(c)

                # Check TEST Constraint
                ncov = sum(1 for h in test_h_sets if h.issubset(active))

                if (ncov / total_test) >= tau:
                    removed_any = True
                    if counts[c] > 0: break # Recalculate
                else:
                    active.add(c)
                    locked.add(c)

            if not removed_any: break

        run_rev.append(len(active))

        # C. LP
        cand = next((c for c in lp_cache if c['max_test_coverage'] >= tau), None)

        if cand is None:
            # Fallback
            best = lp_cache[-1]
            active = {c for c, w in best['weighted_cells']}
            for c in greedy_order:
                if calc_cov_simple(active, test_h_sets) >= tau: break
                active.add(c)
            n_lp = len(active)
        else:
            # Pruning
            lst = list(cand['weighted_cells'])
            lst.sort(key=lambda x: x[1]) # Sort ASC weight

            active = {c for c, w in lst}
            for c, w in lst:
                active.remove(c)
                if calc_cov_simple(active, test_h_sets) < tau:
                    active.add(c)
            n_lp = len(active)

        run_lp.append(n_lp)

    all_greedy_budgets[run_idx, :] = run_greedy
    all_rev_greedy_budgets[run_idx, :] = run_rev
    all_lp_budgets[run_idx, :] = run_lp

print(f"\nDone.")

# ==========================================
# 4. Aggregation & Plotting
# ==========================================
mean_greedy = np.mean(all_greedy_budgets, axis=0)
std_greedy = np.std(all_greedy_budgets, axis=0)

mean_rev = np.mean(all_rev_greedy_budgets, axis=0)
std_rev = np.std(all_rev_greedy_budgets, axis=0)

mean_lp = np.mean(all_lp_budgets, axis=0)
std_lp = np.std(all_lp_budgets, axis=0)

fig, ax = plt.subplots(figsize=(10, 6))

ax.errorbar(eval_taus, mean_lp, yerr=std_lp,
            fmt='o-', linewidth=2.5, markersize=8, capsize=5,
            label='Nested LP', color='royalblue', ecolor='royalblue', alpha=0.9)

ax.errorbar(eval_taus, mean_greedy, yerr=std_greedy,
            fmt='s--', linewidth=2.5, markersize=8, capsize=5,
            label='Forward Greedy', color='firebrick', ecolor='firebrick', alpha=0.9)

ax.errorbar(eval_taus, mean_rev, yerr=std_rev,
            fmt='^-', linewidth=2.5, markersize=8, capsize=5,
            label='Reverse Greedy', color='forestgreen', ecolor='forestgreen', alpha=0.9)

ax.set_xlabel(r'Target Test Coverage ($\phi$)', fontsize=14)
ax.set_ylabel('Number of Cells (Edges) Required', fontsize=14)
ax.set_title(f'Efficiency vs Coverage ({N_RUNS} Runs)', fontsize=16)

ax.set_xticks(eval_taus)
ax.grid(True, linestyle='--', alpha=0.5)
ax.legend(fontsize=12)

plt.tight_layout()
plt.show()

#@title Visualization

import matplotlib.pyplot as plt
import matplotlib.colors as mcolors
import matplotlib.patheffects as pe
from collections import Counter

# ==========================================
# Visualization for Tau=0.8, V2 Set
# ==========================================

# 1. Solve LP for Tau = 0.8
target_tau = 0.8
z_scores = solve_lp(train_hyperedges, target_tau)

# 2. Extract V2 Set (Hyperedges with z > 0.001)
v2_indices = [i for i, z in enumerate(z_scores) if z > 0.001]

# 3. Form LP Subgraph (Union of cells)
lp_cells = set()
for idx in v2_indices:
    lp_cells.update(train_hyperedges[idx])

budget = len(lp_cells)

# 4. Form Greedy Subgraph (Same budget)
greedy_cells = set(greedy_order[:budget])

# 5. Compute Coverage on TEST set (to match the visualization of test traffic)
cov_lp = sum(1 for h in test_hyperedges if set(h).issubset(lp_cells)) / len(test_hyperedges)
cov_greedy = sum(1 for h in test_hyperedges if set(h).issubset(greedy_cells)) / len(test_hyperedges)

print(f"Visualization Config: Tau={target_tau}, Threshold=0.001 (V2)")
print(f"Budget: {budget} edges")
print(f"Test Coverage -> LP: {cov_lp:.2f} | Greedy: {cov_greedy:.2f}")

# ==========================================
# Plotting Logic
# ==========================================
def draw_landmarks(ax):
    lax, lay = to_grid(-8.678, 41.242)
    lcx, lcy = to_grid(-8.611, 41.147)

    ax.scatter([lax], [lay], c='blue', marker='^', s=100, zorder=10, edgecolors='white')
    ax.scatter([lcx], [lcy], c='black', marker='*', s=150, zorder=10, edgecolors='white')

    for x, y, txt in [(lax, lay-6, "Airport"), (lcx, lcy+4, "Center")]:
        t = ax.text(x, y, txt, ha='center', fontsize=9, fontweight='bold', color='black', zorder=11)
        t.set_path_effects([pe.withStroke(linewidth=2, foreground='white')])

def plot_map(ax, cells, title, color):
    if cells:
        xs, ys = zip(*cells)
        ax.scatter(xs, ys, s=15, c=color, marker='s', edgecolors='none', alpha=0.8)
    draw_landmarks(ax)
    ax.set_title(title, fontsize=12, fontweight='bold')
    ax.set_xticks([]); ax.set_yticks([])
    ax.set_xlim(0, N_GRID); ax.set_ylim(0, N_GRID)

fig, axes = plt.subplots(1, 3, figsize=(18, 6))

# Panel 1: Test Traffic Heatmap
counts = Counter(c for h in test_hyperedges for c in h)
xs, ys = zip(*counts.keys())
vals = list(counts.values())
sc = axes[0].scatter(xs, ys, c=vals, s=15,
                norm=mcolors.LogNorm(vmin=1, vmax=max(vals)),
                cmap='inferno_r', marker='s', edgecolors='none', alpha=0.9)
plt.colorbar(sc, ax=axes[0], label='Test Traffic (Log Scale)')
draw_landmarks(axes[0])
axes[0].set_title("A. Test Traffic Intensity", fontsize=12, fontweight='bold')
axes[0].set_xticks([]); axes[0].set_yticks([])
axes[0].set_xlim(0, N_GRID); axes[0].set_ylim(0, N_GRID)

# Panel 2: Greedy Selection
plot_map(axes[1], greedy_cells, f"B. Greedy Selection\n(Budget={budget}, Test Cov={cov_greedy:.2f})", 'firebrick')

# Panel 3: LP Selection
plot_map(axes[2], lp_cells, f"C. Conformal LP \n(Budget={budget}, Test Cov={cov_lp:.2f})", 'blue')

plt.tight_layout()
plt.show()