# complements/myhooks.py
import pandas as pd
import numpy as np
from sklearn.model_selection import train_test_split

def load_data(path="data/uganda_tile_dataset.csv"):
    """
    Load LSMS/Uganda tile dataset.
    Expected format: features in columns, last column 'electrified' as label.
    Adjust path/column names to match your repo.
    """
    df = pd.read_csv(path)
    # drop rows with missing labels
    df = df.dropna(subset=['electrified'])
    y = df['electrified'].astype(int).values
    # use all other columns as features
    X = df.drop(columns=['electrified']).fillna(0).values
    X_train, X_test, y_train, y_test = train_test_split(
        X, y, test_size=0.2, random_state=0, stratify=y
    )
    return X_train, y_train, X_test, y_test

# Optional: plug in your generator + acceptance function

def sample_synthetics(n, mode="naive"):
    """
    Example: random recombination of households/villages.
    Replace with your AWML generator call if available.
    """
    # Placeholder: return None (script will fall back to naive)
    return None, None

def accept_synthetics(X_syn, y_syn, meta=None):
    """
    Your calibrated acceptance function goes here.
    Return a boolean mask of same length as X_syn.
    """
    # Placeholder: accept all
    return np.ones(len(X_syn), dtype=bool)
