from __future__ import annotations

import json
import os
import subprocess
from dataclasses import dataclass
from datetime import datetime, timezone
from pathlib import Path
from typing import Any

from .stage_agents import StageAgentsError, ensure_stage_agents
from .config import (
    CODEX_FINAL_CWD,
    CODEX_PROOF_CWD,
    CODEX_STATEMENT_CWD,
    CODEX_CMD,
    FINAL_LOGS_DIR,
    FINAL_PROMPTS_DIR,
    INFRA_LOGS_DIR,
    INFRA_PROMPTS_DIR,
    LEAN_ROOT,
    get_final_agent_a_model,
    get_final_agent_a_reasoning_effort,
    get_final_agent_b_model,
    get_final_agent_b_reasoning_effort,
    get_final_agent_c_model,
    get_final_agent_c_reasoning_effort,
    PROOF_LOGS_DIR,
    PROOF_PROMPTS_DIR,
    ROOT,
    STATEMENT_LOGS_DIR,
    STATEMENT_PROMPTS_DIR,
    resolve_item_target_file,
)
from .loader import NLItem
from .log_utils import build_log_filename, parse_tokens_used, slugify

AGENT_A_PROMPT = (STATEMENT_PROMPTS_DIR / "agent_a_prompt.txt").read_text(encoding="utf-8")
AGENT_B_PROMPT = (STATEMENT_PROMPTS_DIR / "agent_b_prompt.txt").read_text(encoding="utf-8")
_STATEMENT_AGENT_C_SEMANTIC_CHECK_PROMPT_PATH = STATEMENT_PROMPTS_DIR / "agent_c_semantic_check_prompt.txt"
STATEMENT_AGENT_C_SEMANTIC_CHECK_PROMPT = (
    _STATEMENT_AGENT_C_SEMANTIC_CHECK_PROMPT_PATH.read_text(encoding="utf-8")
    if _STATEMENT_AGENT_C_SEMANTIC_CHECK_PROMPT_PATH.exists()
    else ""
)
_ITEM_STATEMENT_AGENT_A_ADDENDUM_PATH = STATEMENT_PROMPTS_DIR / "item_addendum_agent_a.txt"
_ITEM_STATEMENT_AGENT_B_ADDENDUM_PATH = STATEMENT_PROMPTS_DIR / "item_addendum_agent_b.txt"
_ITEM_STATEMENT_AGENT_C_SEMANTIC_CHECK_ADDENDUM_PATH = (
    STATEMENT_PROMPTS_DIR / "item_addendum_agent_c_semantic_check.txt"
)
ITEM_STATEMENT_AGENT_A_ADDENDUM = (
    _ITEM_STATEMENT_AGENT_A_ADDENDUM_PATH.read_text(encoding="utf-8")
    if _ITEM_STATEMENT_AGENT_A_ADDENDUM_PATH.exists()
    else ""
)
ITEM_STATEMENT_AGENT_B_ADDENDUM = (
    _ITEM_STATEMENT_AGENT_B_ADDENDUM_PATH.read_text(encoding="utf-8")
    if _ITEM_STATEMENT_AGENT_B_ADDENDUM_PATH.exists()
    else ""
)
ITEM_STATEMENT_AGENT_C_SEMANTIC_CHECK_ADDENDUM = (
    _ITEM_STATEMENT_AGENT_C_SEMANTIC_CHECK_ADDENDUM_PATH.read_text(encoding="utf-8")
    if _ITEM_STATEMENT_AGENT_C_SEMANTIC_CHECK_ADDENDUM_PATH.exists()
    else ""
)
ITEM_STATEMENT_AGENT_A_PROMPT = (
    AGENT_A_PROMPT + ("\n\n" + ITEM_STATEMENT_AGENT_A_ADDENDUM.strip() if ITEM_STATEMENT_AGENT_A_ADDENDUM.strip() else "")
)
ITEM_STATEMENT_AGENT_B_PROMPT = (
    AGENT_B_PROMPT + ("\n\n" + ITEM_STATEMENT_AGENT_B_ADDENDUM.strip() if ITEM_STATEMENT_AGENT_B_ADDENDUM.strip() else "")
)
ITEM_STATEMENT_AGENT_C_SEMANTIC_CHECK_PROMPT = (
    STATEMENT_AGENT_C_SEMANTIC_CHECK_PROMPT
    + (
        "\n\n" + ITEM_STATEMENT_AGENT_C_SEMANTIC_CHECK_ADDENDUM.strip()
        if ITEM_STATEMENT_AGENT_C_SEMANTIC_CHECK_ADDENDUM.strip()
        else ""
    )
)
AGENT_B_BOOKCHECK_PROMPT = (STATEMENT_PROMPTS_DIR / "agent_b_bookcheck_prompt.txt").read_text(
    encoding="utf-8"
)
PROOF_AGENT_A_PROMPT = (PROOF_PROMPTS_DIR / "agent_a_prompt.txt").read_text(encoding="utf-8")
PROOF_AGENT_B_PROMPT = (PROOF_PROMPTS_DIR / "agent_b_prompt.txt").read_text(encoding="utf-8")
PROOF_AGENT_B_BOOKCHECK_PROMPT = (PROOF_PROMPTS_DIR / "agent_b_bookcheck_prompt.txt").read_text(
    encoding="utf-8"
)
PROOF_AGENT_C_PROMPT = (PROOF_PROMPTS_DIR / "agent_c_prompt.txt").read_text(encoding="utf-8")
_ITEM_PROOF_AGENT_A_ADDENDUM_PATH = PROOF_PROMPTS_DIR / "item_addendum_agent_a.txt"
_ITEM_PROOF_AGENT_B_ADDENDUM_PATH = PROOF_PROMPTS_DIR / "item_addendum_agent_b.txt"
_ITEM_PROOF_AGENT_C_ADDENDUM_PATH = PROOF_PROMPTS_DIR / "item_addendum_agent_c.txt"
ITEM_PROOF_AGENT_A_ADDENDUM = (
    _ITEM_PROOF_AGENT_A_ADDENDUM_PATH.read_text(encoding="utf-8") if _ITEM_PROOF_AGENT_A_ADDENDUM_PATH.exists() else ""
)
ITEM_PROOF_AGENT_B_ADDENDUM = (
    _ITEM_PROOF_AGENT_B_ADDENDUM_PATH.read_text(encoding="utf-8") if _ITEM_PROOF_AGENT_B_ADDENDUM_PATH.exists() else ""
)
ITEM_PROOF_AGENT_C_ADDENDUM = (
    _ITEM_PROOF_AGENT_C_ADDENDUM_PATH.read_text(encoding="utf-8") if _ITEM_PROOF_AGENT_C_ADDENDUM_PATH.exists() else ""
)
ITEM_PROOF_AGENT_A_PROMPT = (
    PROOF_AGENT_A_PROMPT + ("\n\n" + ITEM_PROOF_AGENT_A_ADDENDUM.strip() if ITEM_PROOF_AGENT_A_ADDENDUM.strip() else "")
)
ITEM_PROOF_AGENT_B_PROMPT = (
    PROOF_AGENT_B_PROMPT + ("\n\n" + ITEM_PROOF_AGENT_B_ADDENDUM.strip() if ITEM_PROOF_AGENT_B_ADDENDUM.strip() else "")
)
ITEM_PROOF_AGENT_C_PROMPT = (
    PROOF_AGENT_C_PROMPT + ("\n\n" + ITEM_PROOF_AGENT_C_ADDENDUM.strip() if ITEM_PROOF_AGENT_C_ADDENDUM.strip() else "")
)
_PROOF_AGENT_D_PROMPT_PATH = PROOF_PROMPTS_DIR / "agent_d_prompt.txt"
PROOF_AGENT_D_PROMPT = (
    _PROOF_AGENT_D_PROMPT_PATH.read_text(encoding="utf-8") if _PROOF_AGENT_D_PROMPT_PATH.exists() else ""
)
FINAL_AGENT_A_PROMPT = (FINAL_PROMPTS_DIR / "agent_a_prompt.txt").read_text(encoding="utf-8")
FINAL_AGENT_B_PROMPT = (FINAL_PROMPTS_DIR / "agent_b_prompt.txt").read_text(encoding="utf-8")
FINAL_AGENT_B_BOOK_PROMPT = (FINAL_PROMPTS_DIR / "agent_b_book_prompt.txt").read_text(encoding="utf-8")
FINAL_AGENT_C_PROMPT = (FINAL_PROMPTS_DIR / "agent_c_prompt.txt").read_text(encoding="utf-8")
_INFRA_PLAN_PROMPT_PATH = INFRA_PROMPTS_DIR / "agent_plan_prompt.txt"
INFRA_PLAN_PROMPT = _INFRA_PLAN_PROMPT_PATH.read_text(encoding="utf-8") if _INFRA_PLAN_PROMPT_PATH.exists() else ""
_INFRA_PLAN_CHECK_PROMPT_PATH = INFRA_PROMPTS_DIR / "agent_plan_check_prompt.txt"
INFRA_PLAN_CHECK_PROMPT = (
    _INFRA_PLAN_CHECK_PROMPT_PATH.read_text(encoding="utf-8")
    if _INFRA_PLAN_CHECK_PROMPT_PATH.exists()
    else ""
)


def _agent_logs_dir(base: Path, agent: str) -> Path:
    """
    Place codex call logs under per-agent subfolders for easier navigation:
    - log/<project>/<stage>_logs/agent_a/
    - log/<project>/<stage>_logs/agent_b/
    - ...
    """
    safe = (agent or "").strip().lower() or "unknown"
    return base / f"agent_{safe}"


def _print_agent_start(
    *,
    pipeline: str,
    agent: str,
    task: str,
    target_file: str | None = None,
    mode: str | None = None,
    model: str | None = None,
    reasoning_effort: str | None = None,
) -> None:
    parts = [f"[Agent {agent}]", f"[{pipeline}] start", task]
    if mode:
        parts.append(f"(mode={mode})")
    if target_file:
        parts.append(f"target={target_file}")
    if model or reasoning_effort:
        parts.append(f"model={model or 'default'}/{reasoning_effort or 'default'}")
    print(" ".join(parts))


def _preview_text(text: str, *, max_lines: int = 2, max_chars: int = 320) -> str | None:
    if not text:
        return None
    lines = [line.strip() for line in text.splitlines() if line.strip()]
    if not lines:
        return None
    preview = " | ".join(lines[-max_lines:])
    preview = " ".join(preview.split())
    if len(preview) > max_chars:
        return preview[: max_chars - 3] + "..."
    return preview


def _print_agent_result(
    *,
    meta: dict[str, Any],
    return_code: int,
    tokens_used: int | None,
    log_path: Path | None,
    stdout: str,
    stderr: str,
) -> None:
    """
    Print a concise terminal summary for each agent call so pipeline progress is debuggable live.
    """
    if os.getenv("ORCH_PRINT_AGENT_INTERACTIONS", "1").strip().lower() in {"0", "false", "no", "off"}:
        return
    agent = str(meta.get("agent") or "").strip()
    pipeline = str(meta.get("pipeline") or "").strip()
    if not agent or not pipeline:
        return

    parts = [f"[Agent {agent}]", f"[{pipeline}] done", f"code={return_code}"]
    for key in ("task_id", "item_index", "label", "plan_round", "attempt", "progress_attempt", "mode"):
        value = meta.get(key)
        if value is None:
            continue
        parts.append(f"{key}={value}")
    if tokens_used is not None:
        parts.append(f"tokens={tokens_used}")
    if log_path:
        parts.append(f"log={log_path}")
    print(" ".join(parts))

    stdout_preview = _preview_text(stdout)
    if stdout_preview:
        print(f"[Agent {agent}] [{pipeline}] stdout_tail: {stdout_preview}")
    stderr_preview = _preview_text(stderr)
    if stderr_preview:
        print(f"[Agent {agent}] [{pipeline}] stderr_tail: {stderr_preview}")


@dataclass(frozen=True, slots=True)
class CodexCallResult:
    code: int
    stdout: str
    stderr: str
    tokens_used: int | None
    log_path: Path | None


def _assemble_prompt(
    base_prompt: str, meta: dict[str, Any], extra_instructions: str | None = None
) -> str:
    if extra_instructions and extra_instructions.strip():
        return (
            base_prompt
            + "\n\n"
            + extra_instructions.strip()
            + "\n\n"
            + json.dumps(meta, ensure_ascii=False, indent=2)
        )
    return base_prompt + "\n\n" + json.dumps(meta, ensure_ascii=False, indent=2)


def _extract_tokens(stdout: str, stderr: str) -> int | None:
    return parse_tokens_used(stderr) or parse_tokens_used(stdout)


def _has_model_arg(args: list[str]) -> bool:
    for i, a in enumerate(args):
        if a in {"--model", "-m"} and i + 1 < len(args):
            return True
    return False


def _strip_model_args(args: list[str]) -> list[str]:
    """
    Remove `--model <...>` / `-m <...>` pairs from a flat argv list.
    """
    cleaned: list[str] = []
    i = 0
    while i < len(args):
        a = args[i]
        if a in {"--model", "-m"}:
            i += 2
            continue
        cleaned.append(a)
        i += 1
    return cleaned


def run_codex(
    prompt: str,
    *,
    extra_args: list[str] | None = None,
    log_name: str | None = None,
    log_dir: Path = STATEMENT_LOGS_DIR,
    log_meta: dict[str, Any] | None = None,
    cwd: Path | None = None,
    stage: str | None = None,
) -> CodexCallResult:
    """
    Execute a codex CLI call in the Lean project root.
    Codex runs from `M2F/` so its default sandbox (`workspace-write`) can write target Lean files.
    Stage rules are enforced by swapping `M2F/AGENTS.md` before each call (see `stage_agents.py`).
    输入内容 = CODEX_CMD（["codex","exec","--full-auto"]） + prompt 字符串。
    """
    cmd = list(CODEX_CMD)
    if extra_args:
        # Users often set a global model via `CODEX_EXTRA_ARGS`. If we also pass an agent-specific
        # `--model`, Codex CLI rejects duplicate `--model` flags. Prefer the per-agent override.
        if _has_model_arg(extra_args):
            cmd = _strip_model_args(cmd)
        cmd.extend(extra_args)
    effective_cwd = cwd or LEAN_ROOT

    if stage:
        try:
            ensure_stage_agents(lean_root=LEAN_ROOT, stage=stage)
        except StageAgentsError as e:
            return CodexCallResult(
                code=2,
                stdout="",
                stderr=str(e),
                tokens_used=None,
                log_path=None,
            )

    result = subprocess.run(
        cmd + [prompt],
        cwd=effective_cwd,
        text=True,
        stdout=subprocess.PIPE,
        stderr=subprocess.PIPE,
    )

    tokens_used = _extract_tokens(result.stdout, result.stderr)
    return_code = result.returncode

    meta = dict(log_meta or {})
    log_path: Path | None = None
    if log_name:
        log_dir.mkdir(parents=True, exist_ok=True)
        log_path = log_dir / log_name
        meta.setdefault("ts_utc", datetime.now(timezone.utc).isoformat())
        meta.setdefault("cwd", str(effective_cwd))
        meta.setdefault("cmd", cmd)
        log_content = (
            "META:\n"
            + json.dumps(meta, ensure_ascii=False, indent=2)
            + "\n\nSTDOUT:\n"
            + result.stdout
            + "\n\nSTDERR:\n"
            + result.stderr
        )
        log_path.write_text(log_content, encoding="utf-8")

    _print_agent_result(
        meta=meta,
        return_code=return_code,
        tokens_used=tokens_used,
        log_path=log_path,
        stdout=result.stdout,
        stderr=result.stderr,
    )

    return CodexCallResult(
        code=return_code,
        stdout=result.stdout,
        stderr=result.stderr,
        tokens_used=tokens_used,
        log_path=log_path,
    )


def _agent_extra_args(*, model: str | None, reasoning_effort: str | None) -> list[str]:
    args: list[str] = []
    if model:
        args += ["--model", model]
    if reasoning_effort:
        # Codex CLI uses `model_reasoning_effort` in config.toml; override via `-c`.
        # Value is parsed as TOML; quote to force string.
        args += ["-c", f'model_reasoning_effort="{reasoning_effort}"']
    return args


def build_agent_a_prompt(item: NLItem, *, extra_instructions: str | None = None) -> str:
    """
    Build the prompt for Agent A by attaching metadata for the current item.
    输入组成：agent_a_prompt.txt 的文本 + JSON 元信息：
      - item 原始字段（index/label/env/number_components/content/context）
      - target_file：章节 Lean 文件的相对路径
    """
    lean_path = resolve_item_target_file(
        item.chapter, item.section, label=item.label, target_file=getattr(item, "target_file", None)
    )
    meta = {
        "item": {
            "index": item.index,
            "label": item.label,
            "env": item.env,
            "number_components": item.number_components,
            "content": item.content,
            "context": item.context,
            "dependencies": item.dependencies,
            "nl_answer": item.nl_answer,
        },
        "target_file": str(lean_path),
    }
    return _assemble_prompt(AGENT_A_PROMPT, meta, extra_instructions)


def _build_statement_agent_b_prompt(
    base_prompt: str,
    lean_file: Path,
    error_log: str,
    *,
    item_index: int | None = None,
    label: str | None = None,
    item_context: dict[str, Any] | None = None,
    item_dependencies: list[Any] | None = None,
    item_notes: Any | None = None,
    extra_instructions: str | None = None,
) -> str:
    """
    Build the prompt for Agent B with the lean file context and recent errors.
    输入组成：agent_b_prompt.txt 的文本 + JSON 元信息：
      - lean_file：相对 LEAN_ROOT 的路径
      - error_log：上一次 lean 编译的 stderr
      - context：数据条目中的上下文信息（若提供）
    """
    meta = {
        "item_index": item_index,
        "label": label,
        "target_file": str(lean_file),
        "lean_file": str(lean_file),
        "error_log": error_log,
        "dependencies": item_dependencies,
        "context": item_context,
        "notes": item_notes,
    }
    return _assemble_prompt(base_prompt, meta, extra_instructions)


def build_agent_b_prompt(
    lean_file: Path,
    error_log: str,
    *,
    item_index: int | None = None,
    label: str | None = None,
    item_context: dict[str, Any] | None = None,
    item_dependencies: list[Any] | None = None,
    item_notes: Any | None = None,
    extra_instructions: str | None = None,
) -> str:
    return _build_statement_agent_b_prompt(
        AGENT_B_PROMPT,
        lean_file,
        error_log,
        item_index=item_index,
        label=label,
        item_context=item_context,
        item_dependencies=item_dependencies,
        item_notes=item_notes,
        extra_instructions=extra_instructions,
    )


def build_item_statement_agent_b_prompt(
    lean_file: Path,
    error_log: str,
    *,
    item_index: int | None = None,
    label: str | None = None,
    item_context: dict[str, Any] | None = None,
    item_dependencies: list[Any] | None = None,
    item_notes: Any | None = None,
    extra_instructions: str | None = None,
) -> str:
    return _build_statement_agent_b_prompt(
        ITEM_STATEMENT_AGENT_B_PROMPT,
        lean_file,
        error_log,
        item_index=item_index,
        label=label,
        item_context=item_context,
        item_dependencies=item_dependencies,
        item_notes=item_notes,
        extra_instructions=extra_instructions,
    )


def build_agent_b_bookcheck_prompt(
    lean_file: Path,
    error_log: str,
    *,
    item_index: int | None = None,
    label: str | None = None,
    item_context: dict[str, Any] | None = None,
    item_dependencies: list[Any] | None = None,
    item_notes: Any | None = None,
    extra_instructions: str | None = None,
) -> str:
    return _build_statement_agent_b_prompt(
        AGENT_B_BOOKCHECK_PROMPT,
        lean_file,
        error_log,
        item_index=item_index,
        label=label,
        item_context=item_context,
        item_dependencies=item_dependencies,
        item_notes=item_notes,
        extra_instructions=extra_instructions,
    )


def build_statement_semantic_check_prompt(
    *,
    label: str,
    env: str | None,
    content: str,
    target_file: Path,
    formal_snippet: str,
    decl_info: dict[str, Any] | None,
    dependencies: list[Any] | None,
    context: dict[str, Any] | None,
) -> str:
    """
    Build the prompt for the statement semantic-check Agent C.
    """
    if not STATEMENT_AGENT_C_SEMANTIC_CHECK_PROMPT.strip():
        raise RuntimeError("Missing prompts/statement/agent_c_semantic_check_prompt.txt")
    meta = {
        "label": label,
        "env": env,
        "content": content,
        "target_file": str(target_file),
        "formal_snippet": formal_snippet,
        "decl_info": decl_info,
        "dependencies": dependencies or [],
        "context": context or {},
    }
    return _assemble_prompt(STATEMENT_AGENT_C_SEMANTIC_CHECK_PROMPT, meta, extra_instructions=None)


def run_statement_agent_c_semantic_check(
    *,
    label: str,
    env: str | None,
    content: str,
    target_file: Path,
    formal_snippet: str,
    decl_info: dict[str, Any] | None,
    dependencies: list[Any] | None = None,
    context: dict[str, Any] | None = None,
    model: str | None = None,
    reasoning_effort: str | None = None,
) -> CodexCallResult:
    """
    Run statement semantic-check Agent C (read-only; returns a JSON report in stdout).
    """
    _print_agent_start(
        pipeline="statement",
        agent="C",
        task=f"label={label}",
        target_file=str(target_file),
        mode="semantic_check",
        model=model,
        reasoning_effort=reasoning_effort,
    )
    prompt = build_statement_semantic_check_prompt(
        label=label,
        env=env,
        content=content,
        target_file=target_file,
        formal_snippet=formal_snippet,
        decl_info=decl_info,
        dependencies=dependencies,
        context=context,
    )
    log_name = build_log_filename("statement", "agent_c_semantic_check", slugify(label), target_file.as_posix())
    extra_args = _agent_extra_args(model=model, reasoning_effort=reasoning_effort)
    return run_codex(
        prompt,
        extra_args=extra_args or None,
        log_name=log_name,
        log_dir=_agent_logs_dir(STATEMENT_LOGS_DIR, "c"),
        cwd=CODEX_STATEMENT_CWD,
        stage="statement",
        log_meta={
            "pipeline": "statement",
            "agent": "C",
            "mode": "semantic_check",
            "label": label,
            "target_file": str(target_file),
            "model": model,
            "reasoning_effort": reasoning_effort,
        },
    )


def run_agent_a(
    item: NLItem,
    *,
    model: str | None = None,
    reasoning_effort: str | None = None,
    extra_instructions: str | None = None,
    log_name: str | None = None,
) -> CodexCallResult:
    target_file = resolve_item_target_file(
        item.chapter, item.section, label=item.label, target_file=getattr(item, "target_file", None)
    )
    _print_agent_start(
        pipeline="statement",
        agent="A",
        task=f"idx={item.index} label={item.label}",
        target_file=str(target_file),
        model=model,
        reasoning_effort=reasoning_effort,
    )
    prompt = build_agent_a_prompt(item, extra_instructions=extra_instructions)
    log_name = log_name or build_log_filename("statement", "agent_a", f"idx{item.index}", item.label)
    extra_args = _agent_extra_args(model=model, reasoning_effort=reasoning_effort)
    return run_codex(
        prompt,
        extra_args=extra_args or None,
        log_name=log_name,
        log_dir=_agent_logs_dir(STATEMENT_LOGS_DIR, "a"),
        cwd=CODEX_STATEMENT_CWD,
        stage="statement",
        log_meta={
            "pipeline": "statement",
            "agent": "A",
            "item_index": item.index,
            "label": item.label,
            "model": model,
            "reasoning_effort": reasoning_effort,
        },
    )


def run_agent_b(
    lean_file: Path,
    error_log: str,
    item_index: int,
    item_context: dict[str, Any] | None = None,
    item_dependencies: list[Any] | None = None,
    label: str | None = None,
    *,
    model: str | None = None,
    reasoning_effort: str | None = None,
    extra_instructions: str | None = None,
) -> CodexCallResult:
    _print_agent_start(
        pipeline="statement",
        agent="B",
        task=f"idx={item_index}" + (f" label={label}" if label else ""),
        target_file=str(lean_file),
        model=model,
        reasoning_effort=reasoning_effort,
    )
    prompt = build_agent_b_prompt(
        lean_file,
        error_log,
        item_index=item_index,
        label=label,
        item_context=item_context,
        item_dependencies=item_dependencies,
        extra_instructions=extra_instructions,
    )
    log_name = build_log_filename("statement", "agent_b", f"idx{item_index}", lean_file.as_posix())
    extra_args = _agent_extra_args(model=model, reasoning_effort=reasoning_effort)
    return run_codex(
        prompt,
        extra_args=extra_args or None,
        log_name=log_name,
        log_dir=_agent_logs_dir(STATEMENT_LOGS_DIR, "b"),
        cwd=CODEX_STATEMENT_CWD,
        stage="statement",
        log_meta={
            "pipeline": "statement",
            "agent": "B",
            "item_index": item_index,
            "lean_file": str(lean_file),
            "model": model,
            "reasoning_effort": reasoning_effort,
        },
    )


def run_agent_b_bookcheck(
    lean_file: Path,
    error_log: str,
    item_index: int,
    item_context: dict[str, Any] | None = None,
    item_dependencies: list[Any] | None = None,
    label: str | None = None,
    *,
    model: str | None = None,
    reasoning_effort: str | None = None,
    extra_instructions: str | None = None,
) -> CodexCallResult:
    _print_agent_start(
        pipeline="statement",
        agent="B",
        task=f"idx={item_index}" + (f" label={label}" if label else ""),
        target_file=str(lean_file),
        mode="bookcheck",
        model=model,
        reasoning_effort=reasoning_effort,
    )
    prompt = build_agent_b_bookcheck_prompt(
        lean_file,
        error_log,
        item_index=item_index,
        label=label,
        item_context=item_context,
        item_dependencies=item_dependencies,
        extra_instructions=extra_instructions,
    )
    log_name = build_log_filename("statement", "agent_b_bookcheck", f"idx{item_index}", lean_file.as_posix())
    extra_args = _agent_extra_args(model=model, reasoning_effort=reasoning_effort)
    return run_codex(
        prompt,
        extra_args=extra_args or None,
        log_name=log_name,
        log_dir=_agent_logs_dir(STATEMENT_LOGS_DIR, "b"),
        cwd=CODEX_STATEMENT_CWD,
        stage="statement",
        log_meta={
            "pipeline": "statement",
            "agent": "B",
            "mode": "bookcheck",
            "item_index": item_index,
            "lean_file": str(lean_file),
            "model": model,
            "reasoning_effort": reasoning_effort,
        },
    )


def build_proof_agent_a_prompt(
    item: NLItem,
    plan: dict[str, Any] | None = None,
    plan_raw: str | None = None,
    attempt: int = 1,
    *,
    extra_instructions: str | None = None,
) -> str:
    """
    Build the prompt for proof Agent A by attaching metadata for the current item.
    输入组成：proof agent_a_prompt.txt 的文本 + JSON 元信息：
      - item 原始字段（index/label/env/number_components/content/context）
      - target_file：章节 Lean 文件的相对路径
      - plan_from_agent_c：Agent C 输出的结构化拆题计划（可为 null）
      - plan_raw_from_agent_c：未解析的计划文本片段（可为 null，用于 fallback）
      - agent_a_attempt：同一题目下当前是第几次 Agent A 尝试（含 re-plan）
    """
    lean_path = resolve_item_target_file(
        item.chapter, item.section, label=item.label, target_file=getattr(item, "target_file", None)
    )
    meta = {
        "item": {
            "index": item.index,
            "label": item.label,
            "env": item.env,
            "number_components": item.number_components,
            "content": item.content,
            "context": item.context,
            "dependencies": item.dependencies,
            "nl_answer": item.nl_answer,
            "notes": getattr(item, "notes", None),
        },
        "target_file": str(lean_path),
        "plan_from_agent_c": plan,
        "plan_raw_from_agent_c": plan_raw,
        "agent_a_attempt": attempt,
    }
    return _assemble_prompt(PROOF_AGENT_A_PROMPT, meta, extra_instructions)


def _build_proof_agent_b_prompt(
    base_prompt: str,
    lean_file: Path,
    error_log: str,
    item_context: dict[str, Any] | None = None,
    item_content: str | None = None,
    item_dependencies: list[Any] | None = None,
    item_notes: Any | None = None,
    *,
    item_index: int | None = None,
    label: str | None = None,
    extra_instructions: str | None = None,
) -> str:
    """
    Build the prompt for proof Agent B with the lean file context and recent errors.
    输入组成：proof agent_b_prompt.txt 的文本 + JSON 元信息：
      - lean_file：相对 LEAN_ROOT 的路径
      - error_log：上一次 lean 编译的 stderr
      - content：当前证明对应的原始文本内容（若提供）
      - context：数据条目中的上下文信息（若提供）
    """
    meta = {
        "item_index": item_index,
        "label": label,
        "target_file": str(lean_file),
        "lean_file": str(lean_file),
        "error_log": error_log,
        "content": item_content,
        "dependencies": item_dependencies,
        "context": item_context,
        "notes": item_notes,
    }
    return _assemble_prompt(base_prompt, meta, extra_instructions)


def build_proof_agent_b_prompt(
    lean_file: Path,
    error_log: str,
    item_context: dict[str, Any] | None = None,
    item_content: str | None = None,
    item_dependencies: list[Any] | None = None,
    item_notes: Any | None = None,
    *,
    item_index: int | None = None,
    label: str | None = None,
    extra_instructions: str | None = None,
) -> str:
    return _build_proof_agent_b_prompt(
        PROOF_AGENT_B_PROMPT,
        lean_file,
        error_log,
        item_context=item_context,
        item_content=item_content,
        item_dependencies=item_dependencies,
        item_notes=item_notes,
        item_index=item_index,
        label=label,
        extra_instructions=extra_instructions,
    )


def build_proof_agent_b_bookcheck_prompt(
    lean_file: Path,
    error_log: str,
    item_context: dict[str, Any] | None = None,
    item_content: str | None = None,
    item_dependencies: list[Any] | None = None,
    item_notes: Any | None = None,
    *,
    item_index: int | None = None,
    label: str | None = None,
    extra_instructions: str | None = None,
) -> str:
    return _build_proof_agent_b_prompt(
        PROOF_AGENT_B_BOOKCHECK_PROMPT,
        lean_file,
        error_log,
        item_context=item_context,
        item_content=item_content,
        item_dependencies=item_dependencies,
        item_notes=item_notes,
        item_index=item_index,
        label=label,
        extra_instructions=extra_instructions,
    )


def build_proof_agent_c_prompt(
    item: NLItem,
    feedback_from_agent_a: dict[str, Any] | None = None,
    prior_plan: dict[str, Any] | None = None,
    *,
    extra_instructions: str | None = None,
) -> str:
    """
    Build the prompt for proof Agent C (decomposer/planner).
    输入组成：proof agent_c_prompt.txt 的文本 + JSON 元信息：
      - item 原始字段（index/label/env/number_components/content/context）
      - target_file：章节 Lean 文件的相对路径
      - feedback_from_agent_a：Agent A 发出的结构化反馈（若有 re-plan 请求）
      - prior_plan：上一轮 Agent C 输出的 plan（若存在）
    """
    lean_path = resolve_item_target_file(
        item.chapter, item.section, label=item.label, target_file=getattr(item, "target_file", None)
    )
    meta = {
        "item": {
            "index": item.index,
            "label": item.label,
            "env": item.env,
            "number_components": item.number_components,
            "content": item.content,
            "context": item.context,
            "dependencies": item.dependencies,
            "nl_answer": item.nl_answer,
            "notes": getattr(item, "notes", None),
        },
        "target_file": str(lean_path),
        "feedback_from_agent_a": feedback_from_agent_a,
        "prior_plan": prior_plan,
    }
    return _assemble_prompt(PROOF_AGENT_C_PROMPT, meta, extra_instructions)


def run_proof_agent_a(
    item: NLItem,
    plan: dict[str, Any] | None = None,
    plan_raw: str | None = None,
    attempt: int = 1,
    *,
    model: str | None = None,
    reasoning_effort: str | None = None,
    extra_instructions: str | None = None,
    log_name: str | None = None,
) -> CodexCallResult:
    target_file = resolve_item_target_file(
        item.chapter, item.section, label=item.label, target_file=getattr(item, "target_file", None)
    )
    _print_agent_start(
        pipeline="proof",
        agent="A",
        task=f"idx={item.index} attempt={attempt} label={item.label}",
        target_file=str(target_file),
        model=model,
        reasoning_effort=reasoning_effort,
    )
    prompt = build_proof_agent_a_prompt(
        item,
        plan=plan,
        plan_raw=plan_raw,
        attempt=attempt,
        extra_instructions=extra_instructions,
    )
    log_name = log_name or build_log_filename(
        "proof", "agent_a", f"idx{item.index}", item.label, f"attempt{attempt}"
    )
    extra_args = _agent_extra_args(model=model, reasoning_effort=reasoning_effort)
    return run_codex(
        prompt,
        extra_args=extra_args or None,
        log_name=log_name,
        log_dir=_agent_logs_dir(PROOF_LOGS_DIR, "a"),
        cwd=CODEX_PROOF_CWD,
        stage="proof",
        log_meta={
            "pipeline": "proof",
            "agent": "A",
            "item_index": item.index,
            "label": item.label,
            "attempt": attempt,
            "model": model,
            "reasoning_effort": reasoning_effort,
        },
    )


def run_proof_agent_b(
    lean_file: Path,
    error_log: str,
    item_index: int,
    item_context: dict[str, Any] | None = None,
    item_content: str | None = None,
    item_dependencies: list[Any] | None = None,
    item_notes: Any | None = None,
    label: str | None = None,
    *,
    model: str | None = None,
    reasoning_effort: str | None = None,
    extra_instructions: str | None = None,
) -> CodexCallResult:
    _print_agent_start(
        pipeline="proof",
        agent="B",
        task=f"idx={item_index}" + (f" label={label}" if label else ""),
        target_file=str(lean_file),
        model=model,
        reasoning_effort=reasoning_effort,
    )
    prompt = build_proof_agent_b_prompt(
        lean_file,
        error_log,
        item_context=item_context,
        item_content=item_content,
        item_dependencies=item_dependencies,
        item_notes=item_notes,
        item_index=item_index,
        label=label,
        extra_instructions=extra_instructions,
    )
    log_name = build_log_filename("proof", "agent_b", f"idx{item_index}", lean_file.as_posix())
    extra_args = _agent_extra_args(model=model, reasoning_effort=reasoning_effort)
    return run_codex(
        prompt,
        extra_args=extra_args or None,
        log_name=log_name,
        log_dir=_agent_logs_dir(PROOF_LOGS_DIR, "b"),
        cwd=CODEX_PROOF_CWD,
        stage="proof",
        log_meta={
            "pipeline": "proof",
            "agent": "B",
            "item_index": item_index,
            "lean_file": str(lean_file),
            "model": model,
            "reasoning_effort": reasoning_effort,
        },
    )


def run_proof_agent_b_bookcheck(
    lean_file: Path,
    error_log: str,
    item_index: int,
    item_context: dict[str, Any] | None = None,
    item_content: str | None = None,
    item_dependencies: list[Any] | None = None,
    item_notes: Any | None = None,
    label: str | None = None,
    *,
    model: str | None = None,
    reasoning_effort: str | None = None,
    extra_instructions: str | None = None,
) -> CodexCallResult:
    _print_agent_start(
        pipeline="proof",
        agent="B",
        task=f"idx={item_index}" + (f" label={label}" if label else ""),
        target_file=str(lean_file),
        mode="bookcheck",
        model=model,
        reasoning_effort=reasoning_effort,
    )
    prompt = build_proof_agent_b_bookcheck_prompt(
        lean_file,
        error_log,
        item_context=item_context,
        item_content=item_content,
        item_dependencies=item_dependencies,
        item_notes=item_notes,
        item_index=item_index,
        label=label,
        extra_instructions=extra_instructions,
    )
    log_name = build_log_filename("proof", "agent_b_bookcheck", f"idx{item_index}", lean_file.as_posix())
    extra_args = _agent_extra_args(model=model, reasoning_effort=reasoning_effort)
    return run_codex(
        prompt,
        extra_args=extra_args or None,
        log_name=log_name,
        log_dir=_agent_logs_dir(PROOF_LOGS_DIR, "b"),
        cwd=CODEX_PROOF_CWD,
        stage="proof",
        log_meta={
            "pipeline": "proof",
            "agent": "B",
            "mode": "bookcheck",
            "item_index": item_index,
            "lean_file": str(lean_file),
            "model": model,
            "reasoning_effort": reasoning_effort,
        },
    )


def run_proof_agent_c(
    item: NLItem,
    feedback_from_agent_a: dict[str, Any] | None = None,
    prior_plan: dict[str, Any] | None = None,
    *,
    model: str | None = None,
    reasoning_effort: str | None = None,
    extra_instructions: str | None = None,
) -> CodexCallResult:
    target_file = resolve_item_target_file(
        item.chapter, item.section, label=item.label, target_file=getattr(item, "target_file", None)
    )
    _print_agent_start(
        pipeline="proof",
        agent="C",
        task=f"idx={item.index} label={item.label}",
        target_file=str(target_file),
        model=model,
        reasoning_effort=reasoning_effort,
    )
    prompt = build_proof_agent_c_prompt(
        item,
        feedback_from_agent_a=feedback_from_agent_a,
        prior_plan=prior_plan,
        extra_instructions=extra_instructions,
    )
    log_name = build_log_filename("proof", "agent_c", f"idx{item.index}", item.label)
    extra_args = _agent_extra_args(model=model, reasoning_effort=reasoning_effort)
    return run_codex(
        prompt,
        extra_args=extra_args or None,
        log_name=log_name,
        log_dir=_agent_logs_dir(PROOF_LOGS_DIR, "c"),
        cwd=CODEX_PROOF_CWD,
        stage="proof",
        log_meta={
            "pipeline": "proof",
            "agent": "C",
            "item_index": item.index,
            "label": item.label,
            "model": model,
            "reasoning_effort": reasoning_effort,
        },
    )


def build_proof_agent_d_prompt(
    *,
    lean_file: Path,
    max_lines: int,
    extra_instructions: str | None = None,
) -> str:
    """
    Agent D is a "section splitter": split oversized Lean files into `sectionXX_partYY.lean` files,
    update the aggregate `sectionXX.lean`, and preserve declarations/comments.
    """
    meta = {"lean_file": str(lean_file), "max_lines": max_lines}
    return _assemble_prompt(PROOF_AGENT_D_PROMPT, meta, extra_instructions)


def run_proof_agent_d(
    *,
    lean_file: Path,
    max_lines: int,
    task_id: str,
    model: str | None = None,
    reasoning_effort: str | None = None,
    extra_instructions: str | None = None,
) -> CodexCallResult:
    if not PROOF_AGENT_D_PROMPT.strip():
        return CodexCallResult(
            code=2,
            stdout="",
            stderr="Missing prompts/proof/agent_d_prompt.txt; cannot run Agent D splitter.",
            tokens_used=None,
            log_path=None,
        )
    _print_agent_start(
        pipeline="proof",
        agent="D",
        task=f"task_id={task_id} max_lines={max_lines}",
        target_file=str(lean_file),
        model=model,
        reasoning_effort=reasoning_effort,
    )
    prompt = build_proof_agent_d_prompt(
        lean_file=lean_file,
        max_lines=max_lines,
        extra_instructions=extra_instructions,
    )
    log_name = build_log_filename("proof", "agent_d", task_id, lean_file.as_posix())
    extra_args = _agent_extra_args(model=model, reasoning_effort=reasoning_effort)
    return run_codex(
        prompt,
        extra_args=extra_args or None,
        log_name=log_name,
        log_dir=_agent_logs_dir(PROOF_LOGS_DIR, "d"),
        cwd=CODEX_PROOF_CWD,
        stage="proof",
        log_meta={
            "pipeline": "proof",
            "agent": "D",
            "task_id": task_id,
            "lean_file": str(lean_file),
            "max_lines": max_lines,
            "model": model,
            "reasoning_effort": reasoning_effort,
        },
    )


def run_final_agent_d(
    *,
    lean_file: Path,
    max_lines: int,
    task_id: str,
    model: str | None = None,
    reasoning_effort: str | None = None,
    extra_instructions: str | None = None,
) -> CodexCallResult:
    """
    Final-stage Agent D is a section splitter for oversized chapter files.
    Reuses the same prompt text as the proof-stage splitter, but writes logs under `log/<project>/final_logs/agent_d/`.
    """
    if not PROOF_AGENT_D_PROMPT.strip():
        return CodexCallResult(
            code=2,
            stdout="",
            stderr="Missing prompts/proof/agent_d_prompt.txt; cannot run Agent D splitter.",
            tokens_used=None,
            log_path=None,
        )
    _print_agent_start(
        pipeline="final",
        agent="D",
        task=f"task_id={task_id} max_lines={max_lines}",
        target_file=str(lean_file),
        model=model,
        reasoning_effort=reasoning_effort,
    )
    prompt = build_proof_agent_d_prompt(
        lean_file=lean_file,
        max_lines=max_lines,
        extra_instructions=extra_instructions,
    )
    log_name = build_log_filename("final", "agent_d", task_id, lean_file.as_posix())
    extra_args = _agent_extra_args(model=model, reasoning_effort=reasoning_effort)
    return run_codex(
        prompt,
        extra_args=extra_args or None,
        log_name=log_name,
        log_dir=_agent_logs_dir(FINAL_LOGS_DIR, "d"),
        cwd=CODEX_FINAL_CWD,
        stage="final",
        log_meta={
            "pipeline": "final",
            "agent": "D",
            "task_id": task_id,
            "lean_file": str(lean_file),
            "max_lines": max_lines,
            "model": model,
            "reasoning_effort": reasoning_effort,
        },
    )


def build_final_agent_c_prompt(
    *,
    lean_file: Path,
    target: dict[str, Any],
    feedback_from_agent_a: dict[str, Any] | None = None,
    prior_plan: dict[str, Any] | None = None,
    nl_hint: str | None = None,
    nl_answer: str | None = None,
    extra_instructions: str | None = None,
) -> str:
    meta = {
        "lean_file": str(lean_file),
        "target": target,
        "feedback_from_agent_a": feedback_from_agent_a,
        "prior_plan": prior_plan,
        "nl_hint": nl_hint,
        "nl_answer": nl_answer,
    }
    return _assemble_prompt(FINAL_AGENT_C_PROMPT, meta, extra_instructions)


def build_final_agent_a_prompt(
    *,
    lean_file: Path,
    target: dict[str, Any],
    plan: dict[str, Any] | None = None,
    plan_raw: str | None = None,
    attempt: int = 1,
    extra_instructions: str | None = None,
    nl_hint: str | None = None,
    nl_answer: str | None = None,
) -> str:
    meta = {
        "lean_file": str(lean_file),
        "target": target,
        "plan_from_agent_c": plan,
        "plan_raw_from_agent_c": plan_raw,
        "agent_a_attempt": attempt,
        "nl_hint": nl_hint,
        "nl_answer": nl_answer,
    }
    return _assemble_prompt(FINAL_AGENT_A_PROMPT, meta, extra_instructions)


def build_final_agent_b_prompt(
    *,
    lean_file: Path,
    error_log: str,
    target: dict[str, Any] | None = None,
    history: list[str] | None = None,
    extra_instructions: str | None = None,
    nl_hint: str | None = None,
    nl_answer: str | None = None,
) -> str:
    meta = {
        "lean_file": str(lean_file),
        "error_log": error_log,
        "target": target,
        "agent_b_history": history,
        "nl_hint": nl_hint,
        "nl_answer": nl_answer,
    }
    return _assemble_prompt(FINAL_AGENT_B_PROMPT, meta, extra_instructions)


def build_final_agent_b_book_prompt(
    lean_file: Path,
    error_log: str,
    *,
    extra_instructions: str | None = None,
    target: dict[str, Any] | None = None,
    nl_hint: str | None = None,
    nl_answer: str | None = None,
) -> str:
    meta = {
        "lean_file": str(lean_file),
        "error_log": error_log,
        "target": target,
        "nl_hint": nl_hint,
        "nl_answer": nl_answer,
    }
    return _assemble_prompt(FINAL_AGENT_B_BOOK_PROMPT, meta, extra_instructions)


def build_infra_plan_prompt(
    *,
    bench_file: Path,
    missing_theory_signal: dict[str, Any],
    extra_instructions: str | None = None,
) -> str:
    meta = {
        "bench_file": str(bench_file),
        "missing_theory_signal": missing_theory_signal,
    }
    return _assemble_prompt(INFRA_PLAN_PROMPT, meta, extra_instructions)


def build_infra_plan_check_prompt(
    *,
    bench_file: Path,
    missing_theory_signal: dict[str, Any],
    infra_plan: list[dict[str, Any]],
    public_api_cap: int,
    extra_instructions: str | None = None,
) -> str:
    meta = {
        "bench_file": str(bench_file),
        "missing_theory_signal": missing_theory_signal,
        "public_api_cap": int(public_api_cap),
        "infra_plan": infra_plan,
    }
    return _assemble_prompt(INFRA_PLAN_CHECK_PROMPT, meta, extra_instructions)


def run_infra_plan_agent(
    *,
    bench_file: Path,
    missing_theory_signal: dict[str, Any],
    task_id: str,
    model: str | None = None,
    reasoning_effort: str | None = None,
    extra_instructions: str | None = None,
) -> CodexCallResult:
    used_model = model if model is not None else (
        os.getenv("INFRA_AGENT_PLAN_MODEL")
        or os.getenv("INFRA_PLAN_AGENT_MODEL")
        or "gpt-5.3-codex"
    )
    used_effort = reasoning_effort if reasoning_effort is not None else (
        os.getenv("INFRA_AGENT_PLAN_REASONING_EFFORT")
        or os.getenv("INFRA_PLAN_AGENT_REASONING_EFFORT")
        or "xhigh"
    )
    _print_agent_start(
        pipeline="infra",
        agent="P",
        task=f"task_id={task_id}",
        target_file=str(bench_file),
        model=used_model,
        reasoning_effort=used_effort,
    )
    prompt = build_infra_plan_prompt(
        bench_file=bench_file,
        missing_theory_signal=missing_theory_signal,
        extra_instructions=extra_instructions,
    )
    log_name = build_log_filename("infra", "agent_plan", task_id, bench_file.as_posix())
    extra_args = _agent_extra_args(model=used_model, reasoning_effort=used_effort)
    return run_codex(
        prompt,
        extra_args=extra_args or None,
        log_name=log_name,
        log_dir=_agent_logs_dir(INFRA_LOGS_DIR, "plan"),
        cwd=CODEX_FINAL_CWD,
        stage="infra",
        log_meta={
            "pipeline": "infra",
            "agent": "plan",
            "task_id": task_id,
            "bench_file": str(bench_file),
            "model": used_model,
            "reasoning_effort": used_effort,
        },
    )


def run_infra_plan_check_agent(
    *,
    bench_file: Path,
    missing_theory_signal: dict[str, Any],
    infra_plan: list[dict[str, Any]],
    public_api_cap: int,
    task_id: str,
    attempt: int,
    model: str | None = None,
    reasoning_effort: str | None = None,
    extra_instructions: str | None = None,
) -> CodexCallResult:
    used_model = model if model is not None else (
        os.getenv("INFRA_AGENT_CHECK_MODEL")
        or os.getenv("INFRA_PLAN_CHECK_AGENT_MODEL")
        or "gpt-5.3-codex"
    )
    used_effort = reasoning_effort if reasoning_effort is not None else (
        os.getenv("INFRA_AGENT_CHECK_REASONING_EFFORT")
        or os.getenv("INFRA_PLAN_CHECK_AGENT_REASONING_EFFORT")
        or "xhigh"
    )
    _print_agent_start(
        pipeline="infra",
        agent="PC",
        task=f"task_id={task_id} attempt={attempt}",
        target_file=str(bench_file),
        model=used_model,
        reasoning_effort=used_effort,
    )
    prompt = build_infra_plan_check_prompt(
        bench_file=bench_file,
        missing_theory_signal=missing_theory_signal,
        infra_plan=infra_plan,
        public_api_cap=public_api_cap,
        extra_instructions=extra_instructions,
    )
    log_name = build_log_filename("infra", "agent_plan_check", task_id, bench_file.as_posix(), f"attempt{attempt}")
    extra_args = _agent_extra_args(model=used_model, reasoning_effort=used_effort)
    return run_codex(
        prompt,
        extra_args=extra_args or None,
        log_name=log_name,
        log_dir=_agent_logs_dir(INFRA_LOGS_DIR, "plan_check"),
        cwd=CODEX_FINAL_CWD,
        stage="infra",
        log_meta={
            "pipeline": "infra",
            "agent": "plan_check",
            "task_id": task_id,
            "bench_file": str(bench_file),
            "attempt": attempt,
            "model": used_model,
            "reasoning_effort": used_effort,
        },
    )


def run_final_agent_c(
    *,
    lean_file: Path,
    target: dict[str, Any],
    task_id: str,
    feedback_from_agent_a: dict[str, Any] | None = None,
    prior_plan: dict[str, Any] | None = None,
    nl_hint: str | None = None,
    nl_answer: str | None = None,
    extra_instructions: str | None = None,
    model: str | None = None,
    reasoning_effort: str | None = None,
    stage: str = "final",
) -> CodexCallResult:
    _print_agent_start(
        pipeline="final",
        agent="C",
        task=f"task_id={task_id}",
        target_file=str(lean_file),
        model=model,
        reasoning_effort=reasoning_effort,
    )
    prompt = build_final_agent_c_prompt(
        lean_file=lean_file,
        target=target,
        feedback_from_agent_a=feedback_from_agent_a,
        prior_plan=prior_plan,
        nl_hint=nl_hint,
        nl_answer=nl_answer,
        extra_instructions=extra_instructions,
    )
    used_model = model if model is not None else get_final_agent_c_model()
    used_effort = reasoning_effort if reasoning_effort is not None else get_final_agent_c_reasoning_effort()
    log_name = build_log_filename("final", "agent_c", task_id, lean_file.as_posix())
    return run_codex(
        prompt,
        extra_args=_agent_extra_args(model=used_model, reasoning_effort=used_effort),
        log_name=log_name,
        log_dir=_agent_logs_dir(FINAL_LOGS_DIR, "c"),
        cwd=CODEX_FINAL_CWD,
        stage=stage,
        log_meta={
            "pipeline": "final",
            "agent": "C",
            "task_id": task_id,
            "lean_file": str(lean_file),
            "model": used_model,
            "reasoning_effort": used_effort,
        },
    )


def run_final_agent_a(
    *,
    lean_file: Path,
    target: dict[str, Any],
    task_id: str,
    plan: dict[str, Any] | None = None,
    plan_raw: str | None = None,
    attempt: int = 1,
    extra_instructions: str | None = None,
    log_name: str | None = None,
    nl_hint: str | None = None,
    nl_answer: str | None = None,
    echo_prompt: bool = False,
    prompt_preview_chars: int = 2000,
    model: str | None = None,
    reasoning_effort: str | None = None,
    stage: str = "final",
) -> CodexCallResult:
    _print_agent_start(
        pipeline="final",
        agent="A",
        task=f"task_id={task_id} attempt={attempt}",
        target_file=str(lean_file),
        model=model,
        reasoning_effort=reasoning_effort,
    )
    prompt = build_final_agent_a_prompt(
        lean_file=lean_file,
        target=target,
        plan=plan,
        plan_raw=plan_raw,
        attempt=attempt,
        extra_instructions=extra_instructions,
        nl_hint=nl_hint,
        nl_answer=nl_answer,
    )
    if echo_prompt:
        if len(prompt) > prompt_preview_chars:
            display = prompt[:prompt_preview_chars] + "... [truncated]"
        else:
            display = prompt
        print("[Final Agent A prompt]\n" + display)
    used_model = model if model is not None else get_final_agent_a_model()
    used_effort = reasoning_effort if reasoning_effort is not None else get_final_agent_a_reasoning_effort()
    log_name = log_name or build_log_filename(
        "final", "agent_a", task_id, lean_file.as_posix(), f"attempt{attempt}"
    )
    return run_codex(
        prompt,
        extra_args=_agent_extra_args(model=used_model, reasoning_effort=used_effort),
        log_name=log_name,
        log_dir=_agent_logs_dir(FINAL_LOGS_DIR, "a"),
        cwd=CODEX_FINAL_CWD,
        stage=stage,
        log_meta={
            "pipeline": "final",
            "agent": "A",
            "task_id": task_id,
            "lean_file": str(lean_file),
            "attempt": attempt,
            "model": used_model,
            "reasoning_effort": used_effort,
        },
    )


def run_final_agent_b(
    *,
    lean_file: Path,
    error_log: str,
    task_id: str,
    target: dict[str, Any] | None = None,
    history: list[str] | None = None,
    extra_instructions: str | None = None,
    nl_hint: str | None = None,
    nl_answer: str | None = None,
    model: str | None = None,
    reasoning_effort: str | None = None,
    stage: str = "final",
) -> CodexCallResult:
    _print_agent_start(
        pipeline="final",
        agent="B",
        task=f"task_id={task_id}",
        target_file=str(lean_file),
        model=model,
        reasoning_effort=reasoning_effort,
    )
    prompt = build_final_agent_b_prompt(
        lean_file=lean_file,
        error_log=error_log,
        target=target,
        history=history,
        extra_instructions=extra_instructions,
        nl_hint=nl_hint,
        nl_answer=nl_answer,
    )
    used_model = model if model is not None else get_final_agent_b_model()
    used_effort = reasoning_effort if reasoning_effort is not None else get_final_agent_b_reasoning_effort()
    log_name = build_log_filename("final", "agent_b", task_id, lean_file.as_posix())
    return run_codex(
        prompt,
        extra_args=_agent_extra_args(model=used_model, reasoning_effort=used_effort),
        log_name=log_name,
        log_dir=_agent_logs_dir(FINAL_LOGS_DIR, "b"),
        cwd=CODEX_FINAL_CWD,
        stage=stage,
        log_meta={
            "pipeline": "final",
            "agent": "B",
            "task_id": task_id,
            "lean_file": str(lean_file),
            "model": used_model,
            "reasoning_effort": used_effort,
        },
    )


def run_final_agent_b_book(
    lean_file: Path,
    error_log: str,
    task_id: str,
    *,
    model: str | None = None,
    reasoning_effort: str | None = None,
    extra_instructions: str | None = None,
) -> CodexCallResult:
    _print_agent_start(
        pipeline="final",
        agent="B",
        task=f"task_id={task_id}",
        target_file=str(lean_file),
        mode="bookcheck",
        model=model,
        reasoning_effort=reasoning_effort,
    )
    prompt = build_final_agent_b_book_prompt(
        lean_file=lean_file,
        error_log=error_log,
        extra_instructions=extra_instructions,
    )
    log_name = build_log_filename("final", "agent_b_book", task_id, lean_file.as_posix())
    extra_args = _agent_extra_args(model=model, reasoning_effort=reasoning_effort)
    return run_codex(
        prompt,
        extra_args=extra_args or None,
        log_name=log_name,
        log_dir=_agent_logs_dir(FINAL_LOGS_DIR, "b"),
        cwd=CODEX_FINAL_CWD,
        stage="final",
        log_meta={
            "pipeline": "final",
            "agent": "B",
            "mode": "book",
            "task_id": task_id,
            "lean_file": str(lean_file),
            "model": model,
            "reasoning_effort": reasoning_effort,
        },
    )
