"""field.py — the operational reasoning field + apply_delta + D projection.

supplement copy of the deterministic typed-field reducer used for the reported runs.
"""
from __future__ import annotations
from dataclasses import dataclass, field, replace
from copy import deepcopy
from typing import Any

HARD_SOURCES = {"formal", "calc", "world", "explicit"}
SOFT_SOURCES = {"model", "heuristic", "analogy"}
PATH_STATUS = {"alive", "soft_dead", "hard_dead", "suspended", "merged", "resurrected"}


@dataclass
class Constraint:
    pred: str
    source: str           # HARD_SOURCES | SOFT_SOURCES
    active: bool = True


@dataclass
class Path:
    id: str
    status: str = "alive"
    resurrection_cond: str | None = None


@dataclass
class Field:
    beliefs: set[str] = field(default_factory=set)
    constraints: list[Constraint] = field(default_factory=list)
    paths: list[Path] = field(default_factory=list)
    frame_id: str = "phi0"
    frame_desc: str = ""
    subgoals: set[str] = field(default_factory=set)
    determined: dict[str, Any] | None = None

    def path(self, pid: str) -> Path | None:
        return next((p for p in self.paths if p.id == pid), None)


def _canon(s: str) -> str:
    return " ".join(str(s).split())


def D(F: Field):
    """Intensional decision projection — hashable signature of decision-relevant
    content. Used for: decorative-ΔF detection (D unchanged ⇒ inert), merge
    detection (shared D), structural region change."""
    hard = frozenset(
        _canon(c.pred) for c in F.constraints if c.active and c.source in HARD_SOURCES
    )
    det = tuple(sorted((k, _canon(v)) for k, v in (F.determined or {}).items()))
    pfate = frozenset((p.id, p.status) for p in F.paths)
    return (hard, det, pfate, frozenset(F.subgoals))


def _gold_leak(op: dict, gold_norm: str | None) -> bool:
    """Gold-substring guard used in the reported control run.
    Returns True iff any STRING-valued field of `op` contains the normalised
    gold answer as a verbatim substring (case-insensitive, ≥2 chars).
    Numeric `gold` is normalised to its digit/char-stripped canonical form;
    op string fields are scanned the same way before comparison."""
    if not gold_norm or len(gold_norm) < 2:
        return False
    for v in op.values():
        if isinstance(v, str) and gold_norm in v.lower():
            return True
    return False


def apply_delta(F: Field, ops: list[dict], *,
                gold: str | None = None) -> tuple[Field, list[str]]:
    """Deterministic typed reducer. Returns (F', rejections). Malformed/invalid
    ops are auto-rejected (NOT silently applied) — the validity column of the
    design-note op table is enforced here.
    If `gold` is passed, operations whose string fields contain the gold answer verbatim are rejected as a leakage guard."""
    G = deepcopy(F)
    rej: list[str] = []
    gold_norm = gold.strip().lower() if gold else None
    for op in ops:
        if _gold_leak(op, gold_norm):
            rej.append(f"{op.get('op')}:gold-substring leak (R2 guard, gold={gold!r})")
            continue
        k = op.get("op")
        try:
            if k == "add_constraint":
                src = op["source"]
                if src not in HARD_SOURCES | SOFT_SOURCES:
                    rej.append(f"add_constraint:bad source {src!r}"); continue
                if not str(op.get("pred", "")).strip():
                    rej.append("add_constraint:empty pred"); continue
                G.constraints.append(Constraint(op["pred"], src, True))
            elif k == "retire_constraint":
                cs = [c for c in G.constraints if _canon(c.pred) == _canon(op["pred"])]
                if not cs: rej.append(f"retire:no constraint {op['pred']!r}"); continue
                for c in cs: c.active = False
            elif k in ("weaken", "strengthen"):
                if not any(_canon(c.pred) == _canon(op["pred"]) for c in G.constraints):
                    rej.append(f"{k}:no constraint"); continue
            elif k == "add_path":
                if G.path(op["pid"]): rej.append(f"add_path:dup {op['pid']}"); continue
                G.paths.append(Path(op["pid"], "alive"))
            elif k == "kill_path":
                p = G.path(op["pid"])
                if not p: rej.append(f"kill_path:no path {op['pid']}"); continue
                kind = op.get("kind", "soft")
                if kind == "soft" and not op.get("cond"):
                    rej.append("kill_path:soft requires cond"); continue
                if kind == "hard" and op.get("cond"):
                    rej.append("kill_path:hard forbids cond"); continue
                p.status = "soft_dead" if kind == "soft" else "hard_dead"
                p.resurrection_cond = op.get("cond")
            elif k == "suspend_path":
                p = G.path(op["pid"])
                if not p: rej.append(f"suspend:no path {op['pid']}"); continue
                p.status = "suspended"
                p.resurrection_cond = op.get("cond")
            elif k == "resurrect_path":
                p = G.path(op["pid"])
                if not p: rej.append(f"resurrect:no path {op['pid']}"); continue
                if p.status not in ("soft_dead", "suspended"):
                    rej.append(f"resurrect:path {op['pid']} not soft_dead/suspended "
                               f"(is {p.status}) — invariant violated"); continue
                p.status = "resurrected"
            elif k == "merge_paths":
                p1, p2 = G.path(op["p1"]), G.path(op["p2"])
                if not (p1 and p2): rej.append("merge:missing path"); continue
                if not str(op.get("shared", "")).strip():
                    rej.append("merge:no shared_state"); continue
                p1.status = p2.status = "merged"
                G.beliefs.add("merged@" + _canon(op["shared"]))
            elif k == "transform_construct":
                # must yield a constraint, else rejected (design-note validity)
                if not str(op.get("to_pred", "")).strip():
                    rej.append("transform:must yield a constraint"); continue
                G.constraints.append(Constraint(op["to_pred"], op.get("source", "calc"), True))
            elif k == "reframe_field":
                if op.get("new_id", G.frame_id) == G.frame_id:
                    rej.append("reframe:new_id == old"); continue
                G.frame_id, G.frame_desc = op["new_id"], op.get("new_desc", "")
            elif k == "close_subgoal":
                sg = op["sg"]
                G.subgoals.discard(sg)
                G.determined = dict(G.determined or {})
                G.determined[sg] = op.get("value")
            elif k == "open_subgoal":
                G.subgoals.add(op["sg"])
            elif k == "record_warning":
                if not str(op.get("text", "")).strip():
                    rej.append("warning:empty"); continue
                G.beliefs.add("⚠ " + op["text"])
            else:
                rej.append(f"unknown op {k!r}")
        except KeyError as e:
            rej.append(f"{k}:missing arg {e}")
    return G, rej


def serialize(F: Field) -> str:
    """Machine rendering (terse, structured). Kept for D-debug / StandIn leak
    detection. NOT recommended as the solver prompt — see render_nl()."""
    L = [f"FRAME[{F.frame_id}] {F.frame_desc}".rstrip()]
    if F.beliefs:
        L.append("BELIEFS: " + "; ".join(sorted(F.beliefs)))
    act = [f"{c.pred} ({c.source})" for c in F.constraints if c.active]
    if act:
        L.append("CONSTRAINTS: " + "; ".join(act))
    if F.paths:
        L.append("PATHS: " + "; ".join(f"{p.id}:{p.status}" for p in F.paths))
    if F.subgoals:
        L.append("OPEN: " + "; ".join(sorted(F.subgoals)))
    if F.determined:
        L.append("DETERMINED: " + "; ".join(f"{k}={v}" for k, v in F.determined.items()))
    return "\n".join(L)


def render_nl(F: Field) -> str:
    """Natural-language rendering of the field AS A PROBLEM a small solver can
    consume. The thesis is that the field-after *information* helps a downstream
    solver — it must be delivered in usable form, else we test the serializer,
    not the field. Beliefs = the problem; active constraints = established facts
    to use; frame = the recommended approach; determined IS deliberately included
    (answer-leak conditions rely on it; honest conditions never set it).
    """
    parts = []
    facts = sorted(F.beliefs)
    if facts:
        parts.append("Problem facts:\n" + "\n".join(f"- {b}" for b in facts))
    act = [c.pred for c in F.constraints if c.active]
    if act:
        parts.append("Established (already derived, you may rely on these):\n"
                     + "\n".join(f"- {p}" for p in act))
    if F.frame_desc:
        parts.append(f"Recommended approach: {F.frame_desc}.")
    live = [p.id for p in F.paths if p.status in ("alive", "resurrected")]
    dead = [(p.id, p.status, p.resurrection_cond) for p in F.paths
            if p.status in ("soft_dead", "hard_dead", "suspended")]
    if dead:
        parts.append("Notes on approaches: " + "; ".join(
            f"{i} is {s}" + (f" (revisit if: {c})" if c else "") for i, s, c in dead))
    if F.subgoals:
        parts.append("Still to determine: " + ", ".join(sorted(F.subgoals)) + ".")
    if F.determined:
        parts.append("Given results: "
                     + "; ".join(f"{k} = {v}" for k, v in F.determined.items()))
    parts.append("Using the above, solve the original problem.")
    return "\n\n".join(parts)
