"""Build the math silver v2 = existing 2400 + scaleup 3390."""
from __future__ import annotations

import argparse
import json
from pathlib import Path


def main() -> None:
    ap = argparse.ArgumentParser()
    ap.add_argument(
        "--existing", type=Path, required=True,
        help="Existing silver_math_combined_v5.jsonl (2400 spans, has llm_label).",
    )
    ap.add_argument(
        "--new-spans", type=Path, required=True,
        help="silver_math_scaleup_spans.jsonl (3390 spans, no llm_label).",
    )
    ap.add_argument(
        "--new-judgments", type=Path, required=True,
        help="silver_math_scaleup_judgments.jsonl (V3-SC v5 labels).",
    )
    ap.add_argument("--out", type=Path, required=True)
    args = ap.parse_args()

    judgments = {}
    with open(args.new_judgments) as f:
        for line in f:
            r = json.loads(line)
            if r["llm_label"] in ("PARSE_ERROR", "API_FAILURE"):
                continue
            judgments[r["span_id"]] = r

    out_rows: list[dict] = []
    with open(args.existing) as f:
        for line in f:
            out_rows.append(json.loads(line))
    seen = {r["span_id"] for r in out_rows}

    n_added = 0
    n_dropped = 0
    with open(args.new_spans) as f:
        for line in f:
            sp = json.loads(line)
            sid = sp["span_id"]
            if sid in seen:
                continue
            if sid not in judgments:
                n_dropped += 1
                continue
            j = judgments[sid]
            sp["llm_label"] = j["llm_label"]
            sp["vote_count"] = j.get("vote_count")
            sp["all_labels"] = j.get("llm_labels", [])
            sp["domain"] = "math"
            out_rows.append(sp)
            seen.add(sid)
            n_added += 1

    with open(args.out, "w") as g:
        for r in out_rows:
            g.write(json.dumps(r) + "\n")

    print(f"Wrote {len(out_rows)} math silver rows -> {args.out}")
    print(f"  existing: {len(out_rows) - n_added}, added: {n_added}, dropped (no label): {n_dropped}")


if __name__ == "__main__":
    main()
