#!/usr/bin/env python3
from __future__ import annotations

import json
from pathlib import Path

from reportlab.lib import colors
from reportlab.lib.pagesizes import letter
from reportlab.lib.styles import ParagraphStyle, getSampleStyleSheet
from reportlab.lib.units import inch
from reportlab.platypus import Image, PageBreak, Paragraph, SimpleDocTemplate, Spacer, Table, TableStyle


ROOT = Path(__file__).resolve().parents[1]
FIGURES = ROOT / "figures"
JSON_PATH = ROOT / "SOURCE_STRUCTURE_ANALYSIS.json"
LOCAL_REFERENCE_JSON_PATH = ROOT / "LOCAL_REFERENCE_GRAPH_ANALYSIS.json"
OUT = ROOT / "SUPPLEMENTARY_EVIDENCE_APPENDIX.pdf"


def p(text: str, style: ParagraphStyle) -> Paragraph:
    return Paragraph(text.replace("&", "&amp;"), style)


def figure(path: Path, width: float = 6.6 * inch) -> Image:
    img = Image(str(path))
    scale = width / img.imageWidth
    img.drawWidth = width
    img.drawHeight = img.imageHeight * scale
    return img


def main() -> None:
    data = json.loads(JSON_PATH.read_text())
    local_reference_data = json.loads(LOCAL_REFERENCE_JSON_PATH.read_text())
    totals = data["totals"]
    by_chain = data["by_chain"]
    local_reference_totals = local_reference_data["totals"]

    styles = getSampleStyleSheet()
    title = ParagraphStyle("Title", parent=styles["Title"], fontSize=18, leading=22, spaceAfter=12)
    h2 = ParagraphStyle("H2", parent=styles["Heading2"], fontSize=12, leading=15, spaceBefore=10, spaceAfter=6)
    body = ParagraphStyle("Body", parent=styles["BodyText"], fontSize=9, leading=12, spaceAfter=6)
    small = ParagraphStyle("Small", parent=styles["BodyText"], fontSize=8, leading=10, spaceAfter=4)

    doc = SimpleDocTemplate(
        str(OUT),
        pagesize=letter,
        rightMargin=0.55 * inch,
        leftMargin=0.55 * inch,
        topMargin=0.55 * inch,
        bottomMargin=0.55 * inch,
        title="Supplementary Evidence Appendix",
        author="Anonymous Authors",
    )

    story = [
        p("Supplementary Evidence Appendix", title),
        p(
            "This appendix collects extra plots and source-structure checks for the AI4Math submission. "
            "The core reproducibility claim remains the Lean build plus the 107-trace axiom audit; these pages add reviewer-facing context.",
            body,
        ),
        p("Static Source-Structure Proxy", h2),
        p(
            f"The analyzed snapshot has {totals['files']} Lean source files, {totals['source_lines']:,} source lines, "
            f"and {totals['theorem_lemma_decls']} theorem/lemma declarations. It has {totals['mathlib_imports']} Mathlib import lines "
            f"and {totals['internal_imports']} internal FormalSLT import lines. "
            f"{totals['decls_with_local_refs']} theorem/lemma spans ({totals['decls_with_local_refs_pct']:.1%}) textually reference another local "
            "FormalSLT theorem/lemma name after short/common names are excluded.",
            body,
        ),
        p(
            "This is a source-structure proxy. It does not count every Mathlib lemma call, and it is not a theorem-difficulty or novelty metric.",
            small,
        ),
    ]

    rows = [["Chain", "Files", "LoC", "Decls", "Mathlib imports", "FormalSLT imports", "Local-ref decls"]]
    for chain, row in sorted(by_chain.items(), key=lambda item: int(item[1]["source_lines"]), reverse=True):
        decls = int(row["theorems"]) + int(row["lemmas"])
        pct = int(row["decls_with_local_refs"]) / decls if decls else 0.0
        rows.append(
            [
                chain,
                str(row["files"]),
                f"{int(row['source_lines']):,}",
                str(decls),
                str(row["mathlib_imports"]),
                str(row["internal_imports"]),
                f"{pct:.1%}",
            ]
        )
    table = Table(rows, repeatRows=1, colWidths=[1.25 * inch, 0.45 * inch, 0.7 * inch, 0.55 * inch, 0.85 * inch, 0.95 * inch, 0.9 * inch])
    table.setStyle(
        TableStyle(
            [
                ("BACKGROUND", (0, 0), (-1, 0), colors.HexColor("#E9EEF8")),
                ("TEXTCOLOR", (0, 0), (-1, 0), colors.HexColor("#1A202C")),
                ("FONTNAME", (0, 0), (-1, 0), "Helvetica-Bold"),
                ("FONTSIZE", (0, 0), (-1, -1), 7),
                ("GRID", (0, 0), (-1, -1), 0.25, colors.HexColor("#CBD5E0")),
                ("VALIGN", (0, 0), (-1, -1), "MIDDLE"),
                ("ALIGN", (1, 1), (-1, -1), "RIGHT"),
            ]
        )
    )
    story.extend(
        [
            table,
            PageBreak(),
            p("Static Declaration Local-Reference Graph", title),
            p(
                "This source-level graph adds an edge A -> B when theorem/lemma declaration A textually references the unique local "
                "theorem/lemma name for B. Duplicate, short, and common names are ignored. This is not Lean kernel dependency extraction.",
                body,
            ),
            p(
                f"The graph has {local_reference_totals['edges']} static local-reference edges, "
                f"{local_reference_totals['declarations_with_textual_local_reference_edges']} declarations with at least one textual local-reference edge, "
                f"{local_reference_totals['declarations_textually_referenced_by_others']} declarations textually referenced by at least one other declaration, "
                f"a largest weak component of {local_reference_totals['largest_weak_component']} declarations, and maximum static local-reference depth "
                f"{local_reference_totals['max_static_local_reference_depth']}.",
                body,
            ),
            p("Chain-to-chain local-reference matrix. Rows are source declarations; columns are referenced declarations.", small),
            figure(FIGURES / "local_reference_chain_matrix.png"),
            Spacer(1, 0.15 * inch),
            p("Static local-reference depth proxy by chain. Dots show median depth; bars show maximum depth.", small),
            figure(FIGURES / "local_reference_depth_by_chain.png"),
            PageBreak(),
        ]
    )

    story.extend(
        [
            p("Ledger and Axiom-Audit Figures", title),
            p("Ledger-derived PR throughput. This supports feasibility and parallel queue pressure, not causal speedup.", small),
            figure(FIGURES / "cumulative_pr_curve.png"),
            Spacer(1, 0.15 * inch),
            p("Axiom-audit funnel. This shows the audit outcome, not statement adequacy.", small),
            figure(FIGURES / "axiom_funnel.png"),
            PageBreak(),
            p("Artifact Structure Figures", title),
            p("Source lines by proof chain. This is source mass by area, not theorem difficulty.", small),
            figure(FIGURES / "loc_by_chain_bar.png"),
            Spacer(1, 0.15 * inch),
            p("Headline theorem proof-block source lengths. This is a source-span proxy only.", small),
            figure(FIGURES / "proof_length_strip.png"),
            PageBreak(),
            p("Timing and Poster Figures", title),
            p("Merged-PR lifetime distribution. The current ledger does not separate CI time, human review time, and idle time.", small),
            figure(FIGURES / "time_to_merge_histogram.png"),
            Spacer(1, 0.15 * inch),
            p("Poster-ready metric strip. Counts match the submitted snapshot.", small),
            figure(FIGURES / "metrics_strip.png"),
            p("Current ledger limitations", h2),
            p(
                "The anonymized ledger does not encode CI start/end, human-review start/end, failed local attempts before PR creation, or line-level human/agent authorship. "
                "Therefore the submission does not claim Claude-vs-Codex performance, agent-vs-human line attribution, CI-vs-review time, gate-specific rejection counts, or a single-agent baseline speedup.",
                body,
            ),
        ]
    )

    doc.build(story)
    print(OUT)


if __name__ == "__main__":
    main()
