"""Build a v6 puzzle + v5 math combined silver file.

Joins the v6 puzzle JUDGMENTS with the existing puzzle SPANS (text +
preceding context) and writes a single jsonl in the format expected by
the train script (silver_combined_v3.jsonl shape).
"""
from __future__ import annotations

import argparse
import json
from pathlib import Path


def main() -> None:
    ap = argparse.ArgumentParser()
    ap.add_argument(
        "--puzzle-spans", type=Path, required=True,
        help="Existing puzzle silver containing span_text + preceding_context",
    )
    ap.add_argument(
        "--puzzle-judgments-v6", type=Path, required=True,
        help="V3-SC v6 judgments minted on the puzzle spans",
    )
    ap.add_argument("--out", type=Path, required=True)
    args = ap.parse_args()

    judgments = {}
    with open(args.puzzle_judgments_v6) as f:
        for line in f:
            r = json.loads(line)
            if r["llm_label"] in ("PARSE_ERROR", "API_FAILURE"):
                continue
            judgments[r["span_id"]] = r

    n_kept = 0
    n_dropped = 0
    with open(args.puzzle_spans) as f, open(args.out, "w") as g:
        for line in f:
            r = json.loads(line)
            sid = r["span_id"]
            if sid not in judgments:
                n_dropped += 1
                continue
            j = judgments[sid]
            r["llm_label"] = j["llm_label"]
            r["vote_count"] = j.get("vote_count")
            r["all_labels"] = j.get("llm_labels", [])
            r["domain"] = "puzzle"
            g.write(json.dumps(r) + "\n")
            n_kept += 1

    print(f"Wrote {n_kept} puzzle silver rows -> {args.out}")
    if n_dropped:
        print(f"Dropped {n_dropped} spans without v6 judgment")


if __name__ == "__main__":
    main()
