#!/usr/bin/env python3
from __future__ import annotations
import argparse, csv, json, random
from pathlib import Path

ROOT = Path(__file__).resolve().parents[1]

def read_rows(path: Path):
    with path.open(newline='', encoding='utf-8') as f:
        return list(csv.DictReader(f))

def paired_bootstrap(deltas, seed=20260517, B=10000):
    if not deltas:
        return 0.0, 0.0, 0.0
    rng = random.Random(seed)
    n = len(deltas)
    vals=[]
    for _ in range(B):
        vals.append(sum(deltas[rng.randrange(n)] for _ in range(n))/n)
    vals.sort()
    lo = vals[int(0.025*B)]
    hi = vals[int(0.975*B)-1]
    return sum(deltas)/n, lo, hi

def cumulative_lift(rows, turn=2):
    per={}
    for r in rows:
        if r.get('included', 'True') != 'True':
            continue
        item=r['item_id']; t=int(r['turn']); m=int(r['match'])
        per.setdefault(item,{})[t]=max(per.setdefault(item,{}).get(t,0),m)
    deltas=[]
    for td in per.values():
        t0=1 if td.get(0,0) else 0
        tt=1 if any(td.get(k,0) for k in range(turn+1)) else 0
        deltas.append(tt-t0)
    return paired_bootstrap(deltas), len(deltas), sum(1 for td in per.values() if td.get(0,0)), sum(1 for td in per.values() if any(td.get(k,0) for k in range(turn+1)))

def write_csv(path, rows):
    path.parent.mkdir(parents=True, exist_ok=True)
    keys=list(rows[0]) if rows else []
    with path.open('w', newline='', encoding='utf-8') as f:
        w=csv.DictWriter(f, fieldnames=keys); w.writeheader(); w.writerows(rows)

def main():
    ap=argparse.ArgumentParser()
    ap.add_argument('--check', action='store_true')
    args=ap.parse_args()
    all_rows=read_rows(ROOT/'data/headline_turns.csv')
    out=[]
    for run in sorted(set((r.get('run_id') or r['run']) for r in all_rows if r.get('included', 'True') == 'True')):
        rr=[r for r in all_rows if (r.get('run_id') or r['run'])==run]
        (mean,lo,hi),n,c0,c2=cumulative_lift(rr,2)
        out.append({'run':run,'n_items':n,'turn0_correct':c0,'turn2_cum_correct':c2,'lift':round(mean,4),'ci95_low':round(lo,4),'ci95_high':round(hi,4)})
    write_csv(ROOT/'reproduced_tables/turn2_lifts_from_rows.csv', out)
    adapters=json.loads((ROOT/'data/adapter_evals.json').read_text(encoding='utf-8'))['adapter_evals']
    write_csv(ROOT/'reproduced_tables/adapter_summary.csv', adapters)
    if args.check:
        by={r['run']:r for r in out}
        checks={
            'm500_c2_lift': abs(float(by['slotG-m500l5-full-c2']['lift'])-0.1343) <= 0.0002,
            'm500_c3_lift': abs(float(by['slotG-m500l5-full-c3']['lift'])-0.1716) <= 0.0002,
            'olympiad_c3_lift': abs(float(by['slotG-olympiad-real-c3']['lift'])-0.2414) <= 0.0002,
            'aime_c3_null': abs(float(by['slotG-aime-real-c3']['lift'])-0.0) <= 0.0002,
            'best_lora': any(a['run']=='lora-7b-field-r64-enriched' and int(a['pass_count'])==33 for a in adapters),
        }
        failed=[k for k,v in checks.items() if not v]
        if failed:
            raise SystemExit('failed checks: '+', '.join(failed))
        print('all supplement reproduction checks passed')
    else:
        print('wrote reproduced tables')
if __name__ == '__main__':
    main()
