from __future__ import annotations

import json
from collections import deque
from dataclasses import dataclass
from datetime import datetime, timezone
from pathlib import Path
from typing import Any


def _utc_now_iso() -> str:
    return datetime.now(timezone.utc).isoformat()


def _truncate(text: str | None, *, max_chars: int) -> str | None:
    if text is None:
        return None
    if len(text) <= max_chars:
        return text
    return text[:max_chars] + "... [truncated]"


@dataclass(frozen=True, slots=True)
class HistoryRecord:
    ts: str
    pipeline: str
    run_id: str
    lean_file: str
    task_id: str | None
    kind: str
    summary: str | None
    log_path: str | None
    payload: dict[str, Any]

    def to_json(self) -> dict[str, Any]:
        return {
            "ts": self.ts,
            "pipeline": self.pipeline,
            "run_id": self.run_id,
            "lean_file": self.lean_file,
            "task_id": self.task_id,
            "kind": self.kind,
            "summary": self.summary,
            "log_path": self.log_path,
            "payload": self.payload,
        }


def append_history(
    history_file: Path,
    *,
    pipeline: str,
    run_id: str,
    lean_file: str,
    kind: str,
    payload: dict[str, Any] | None = None,
    task_id: str | None = None,
    summary: str | None = None,
    log_path: str | None = None,
    max_payload_chars: int = 20000,
) -> None:
    """
    Append a compact JSONL history record, meant for human/operator debugging and resume.
    """
    history_file.parent.mkdir(parents=True, exist_ok=True)
    raw_payload = dict(payload or {})
    for k, v in list(raw_payload.items()):
        if isinstance(v, str):
            raw_payload[k] = _truncate(v, max_chars=max_payload_chars)

    record = HistoryRecord(
        ts=_utc_now_iso(),
        pipeline=pipeline,
        run_id=run_id,
        lean_file=lean_file,
        task_id=task_id,
        kind=kind,
        summary=_truncate(summary, max_chars=2000) if summary else None,
        log_path=log_path,
        payload=raw_payload,
    )
    with history_file.open("a", encoding="utf-8") as f:
        f.write(json.dumps(record.to_json(), ensure_ascii=False) + "\n")


def load_recent_history(
    history_file: Path,
    *,
    lean_file: str,
    max_records: int = 30,
    kinds: set[str] | None = None,
    task_id: str | None = None,
    item_index: int | None = None,
    label: str | None = None,
) -> list[dict[str, Any]]:
    """
    Load the last `max_records` matching records for `lean_file` and optional item-level filters.
    This is a best-effort helper (does not throw on partial/corrupt lines).
    """
    if not history_file.exists():
        return []

    want_task_id = str(task_id) if task_id is not None else None
    want_item_index = int(item_index) if item_index is not None else None
    want_label = label.strip() if isinstance(label, str) and label.strip() else None

    buf: deque[dict[str, Any]] = deque(maxlen=max_records)
    for line in history_file.read_text(encoding="utf-8").splitlines():
        line = line.strip()
        if not line:
            continue
        try:
            rec = json.loads(line)
        except json.JSONDecodeError:
            continue
        if not isinstance(rec, dict):
            continue
        if rec.get("lean_file") != lean_file:
            continue
        if kinds is not None and rec.get("kind") not in kinds:
            continue
        if want_task_id is not None and str(rec.get("task_id")) != want_task_id:
            continue

        payload = rec.get("payload")
        payload_dict = payload if isinstance(payload, dict) else {}
        if want_item_index is not None:
            raw_idx = payload_dict.get("index")
            idx_value: int | None = None
            if isinstance(raw_idx, int):
                idx_value = raw_idx
            elif isinstance(raw_idx, str):
                raw_idx = raw_idx.strip()
                if raw_idx.isdigit():
                    idx_value = int(raw_idx)
            if idx_value != want_item_index:
                continue

        if want_label is not None:
            raw_label = payload_dict.get("label")
            label_value = raw_label.strip() if isinstance(raw_label, str) else None
            if label_value != want_label:
                continue

        buf.append(rec)

    return list(buf)
