#!/usr/bin/env python3
# -*- coding: utf-8 -*-
"""ocr_datasets.builder

Single entry point:
    build_ctc_dataloaders(args, logger=None)

Returns:
    train_loader, val_loader, charset_mapper, blank_id, num_classes
"""

from __future__ import annotations

from typing import Any, Optional, Tuple

from .iam_line import build_iam_line_dataloaders
from .read2016 import build_read2016_dataloaders
from .lam import build_lam_line_dataloaders


def build_ctc_dataloaders(args: Any, logger=None):
    name = (getattr(args, "dataset", "") or "").lower().strip()

    if name in ("iam", "iam_line", "iam-line", "tekla/iam-line", "teklia/iam-line"):
        return build_iam_line_dataloaders(args, logger)

    if name in ("read2016", "read", "icfhr2016", "read-2016"):
        return build_read2016_dataloaders(args, logger)

    # allow protocol embedded in dataset spec: lam | lam:basic | lam:leave_decade_out/leave_decade_4_out
    if name.startswith("lam"):
        return build_lam_line_dataloaders(args, logger)

    raise ValueError(
        f"Unsupported dataset='{getattr(args, 'dataset', None)}'. "
        "Supported: iam_line / rimes / read2016 / lam"
    )
