# src/data/llm_eval_datasets.py

import csv
from pathlib import Path
from typing import Dict, List


def read_generations_csv(path: str) -> List[dict]:
    rows = []
    with open(path, newline="", encoding="utf-8") as f:
        r = csv.DictReader(f)
        for row in r:
            rows.append(row)
    return rows


def load_truthfulqa_csv(path: str | Path, limit: int = 0) -> List[Dict]:
    """
    Load TruthfulQA from the official CSV.
    Returns a list of dicts with a unified interface:
      - id: int
      - question: str
      - type, category, source: str (may be empty for other datasets)
    """
    rows = []
    path = Path(path)
    with path.open(newline="", encoding="utf-8") as f:
        reader = csv.DictReader(f)
        for idx, row in enumerate(reader):
            rows.append(
                {
                    "id": idx,
                    "question": row.get("Question", ""),
                    "type": row.get("Type", ""),
                    "category": row.get("Category", ""),
                    "source": row.get("Source", ""),
                    "best_answer": row.get("Best Answer", ""),
                }
            )
            if limit > 0 and len(rows) >= limit:
                break
    return rows
