"""
low_resource_languages.py
Low-resource language dataset loader (e.g., Masakhane).
"""

# Dynamically import the `<pkg>.datasets` module so the package directory name
# is spelled in exactly one place (`pkg`). These statements run at import time.
# NOTE(review): the previous comment here read "At top of experiment file",
# which suggests this snippet was copied from an experiment script; neither
# looked-up name is used in the part of the file visible here — confirm that
# this module actually needs them.
import importlib
pkg = "Code"  # package directory name in this repo; adjust if you rename the folder
datasets = importlib.import_module(f"{pkg}.datasets")
# getattr() is called without a default, so a name that `datasets` does not
# expose raises AttributeError as soon as this module is imported.
climate_agriculture = getattr(datasets, "climate_agriculture")
healthcare_sparse   = getattr(datasets, "healthcare_sparse")


import torch


def toy_translation_pairs(n_samples=100):
    """
    Build a toy parallel corpus of (English, Hausa) word pairs.

    A fixed five-word vocabulary is repeated in order until ``n_samples``
    pairs have been produced; the pairs are placeholders, not real
    translation data.

    Args:
        n_samples: Number of pairs to generate. Zero or a negative value
            yields an empty list.

    Returns:
        A list of ``(source_word, target_word)`` string tuples.
    """
    english = ("hello", "world", "good", "day", "friend")
    hausa = ("sannu", "duniya", "lafiya", "rana", "aboki")  # Hausa (example)

    # Both word lists have the same length, so cycling through the aligned
    # pairs is the same as indexing each list modulo its own length.
    vocabulary = list(zip(english, hausa))
    vocab_size = len(vocabulary)

    samples = []
    for index in range(n_samples):
        samples.append(vocabulary[index % vocab_size])
    return samples
