import numpy as np
from codes.data.dataset import ECGDatasetWithDemographics


demos = []
splits = ["train", "val", "test"]
for sp in splits:
    dset = ECGDatasetWithDemographics(
        datatype=sp,
        seed=1,
        neg="PTBXL-NORM",
        pos="PTBXL-AFIB",
        data_lim=None,
        transform=None,
    )
    demo = dset.demo
    lb = dset.label
    neg_demo = demo[lb == 0]
    demos.append(neg_demo)
demos = np.concatenate(demos, axis=0)[:, 0] # Extract ages.
# Filter none.
demos = demos[~np.isnan(demos)]

# Get 25percentile, 50percentile, 75percentile
percentiles = np.percentile(demos, [25, 50, 75])
print("25th percentile:", percentiles[0])
print("50th percentile:", percentiles[1])
print("75th percentile:", percentiles[2])