#!/usr/bin/env python3
import json, glob, os, sys
import numpy as np
from collections import OrderedDict
from itertools import islice

def eval_file(path):
    with open(path, encoding='utf-8') as f:
        data = json.load(f)
    # if len(data) == 3:
    #     data = dict(islice(data.items(), 2))
    k_max = len(data)   
    # if k_max == 3:
    #     k_max =2# 最大 attempt 数
    print(k_max)
    problem_ids = list(next(iter(data.values())).keys())  # 所有问题 id
    
    n_prob = len(problem_ids)

    # 二维数组：每行是一个问题的 k_max 次结果
    arr = np.zeros((n_prob, k_max), dtype=np.uint8)
    for j, attempt in enumerate(data.values()):  # j = attempt 索引
        for i, pid in enumerate(problem_ids):
            correct = attempt[pid].get("is_correct_this_attempt", False)
            arr[i, j] = 1 if correct else 0

    # 向量化计算
    pass_k = np.any(arr, axis=1).mean()   # 至少对一次
    avg_k  = arr.mean()                   # 所有样本平均
    return pass_k, avg_k, k_max

def main():
    if len(sys.argv) != 2:
        print("用法: python eval_max_k_np.py  /path/to/json_dir")
        sys.exit(1)

    root = sys.argv[1]
    out  = os.path.join(root, "result_max_k.txt")
    files = glob.glob(os.path.join(root, "**", "*.json"), recursive=True)

    with open(out, 'w', encoding='utf-8') as f:
        for fp in files:
            pass_k, avg_k, k_max = eval_file(fp)
            name = os.path.relpath(fp, root)
            f.write(f"{name}\tk={k_max}\tpass@k={pass_k:.4f}\tavg@k={avg_k:.4f}\n")

    print(f"完成！结果写入 {out}")

if __name__ == '__main__':
    main()