# tests/test_training_loop.py
"""
Sanity test for training loop: train on a few small episodes to ensure no crash.
"""
import pytest
from configs import Config
from train.train_agent import train
from data.dataset_builder import generate_random_taskset

def test_train_sanity():
    """Smoke-test ``train`` using a default ``Config`` with three overrides.

    The test only verifies that ``train`` returns a non-``None`` policy and
    a diagnostics container exposing the ``"losses"`` and ``"rewards"``
    entries; it makes no claim about the values stored under those keys.
    """
    cfg = Config()

    # Overrides applied on top of the defaults, in this order.
    # NOTE(review): presumably chosen to keep the run short -- confirm
    # against the Config definition.
    overrides = (
        ("n_tasksets_train", 2),
        ("update_target_every", 10),
        ("memory_size", 100),
    )
    for field_name, field_value in overrides:
        setattr(cfg, field_name, field_value)

    outcome = train(cfg, n_tasks=3)
    policy, diag = outcome  # train is expected to yield exactly two items

    assert policy is not None
    # Checked one key at a time, "losses" first, as in the combined check.
    for expected_key in ("losses", "rewards"):
        assert expected_key in diag
