"""Data loading utilities."""
from __future__ import annotations
from dataclasses import dataclass
from pathlib import Path
import pandas as pd

from .config import DEFAULT_FILES, resolve

@dataclass
class RealData:
    runs: pd.DataFrame           # metadataset_Risk.csv
    curves: pd.DataFrame         # risk_curve_by_dataset.csv

@dataclass
class SyntheticData:
    task_specs: pd.DataFrame     # synthetic_task_specs.csv
    run_logs: pd.DataFrame       # synthetic_run_logs.csv
    risk_curves: pd.DataFrame    # synthetic_risk_curves.csv

def load_real(data_dir: str | Path) -> RealData:
    runs = pd.read_csv(resolve(data_dir, DEFAULT_FILES.metadataset_risk))
    curves = pd.read_csv(resolve(data_dir, DEFAULT_FILES.risk_curve_by_dataset))
    return RealData(runs=runs, curves=curves)

def load_synthetic(data_dir: str | Path) -> SyntheticData:
    task_specs = pd.read_csv(resolve(data_dir, DEFAULT_FILES.synthetic_task_specs))
    run_logs = pd.read_csv(resolve(data_dir, DEFAULT_FILES.synthetic_run_logs))
    risk_curves = pd.read_csv(resolve(data_dir, DEFAULT_FILES.synthetic_risk_curves))
    return SyntheticData(task_specs=task_specs, run_logs=run_logs, risk_curves=risk_curves)
