import json
from collections import Counter
import sys
# Number of samples per record the report assumes; the report is only widened
# beyond this when some record actually carries more samples.
DEFAULT_SAMPLES_PER_ITEM = 8


def tally_accuracies(lines):
    """Count, per record, how many entries of its ``accuracies`` list are truthy.

    Args:
        lines: Iterable of strings, each holding one JSON document (JSONL).

    Returns:
        A ``(distribution, total_items, max_samples)`` tuple where
        ``distribution`` maps a correct-count to the number of records with
        that count, ``total_items`` is the number of records tallied, and
        ``max_samples`` is the longest ``accuracies`` list seen (0 if none).

    Blank lines are skipped. Lines that fail to parse are reported on stdout
    and skipped. Parsed values that are not JSON objects, or whose
    ``accuracies`` entry is missing or not a JSON array, are skipped instead
    of aborting the run with a ``TypeError``.
    """
    distribution = Counter()
    total_items = 0
    max_samples = 0

    for line in lines:
        if not line.strip():  # skip blank lines
            continue
        try:
            item = json.loads(line)
        except json.JSONDecodeError as e:
            print(f"解析JSON错误: {e}")
            continue

        # Only JSON objects can carry an 'accuracies' field.
        if not isinstance(item, dict):
            continue
        accuracies = item.get('accuracies')
        if not isinstance(accuracies, list):
            continue

        # Number of truthy (i.e. correct) entries in this record.
        correct_count = sum(1 for acc in accuracies if acc)
        distribution[correct_count] += 1
        total_items += 1
        max_samples = max(max_samples, len(accuracies))

    return distribution, total_items, max_samples


def format_report(distribution, total_items,
                  samples_per_item=DEFAULT_SAMPLES_PER_ITEM):
    """Build the textual distribution report.

    Args:
        distribution: Mapping from correct-count to number of records.
        total_items: Number of records tallied; used as the percentage base.
        samples_per_item: Highest bucket to print; buckets
            ``0..samples_per_item`` are listed, including empty ones.

    Returns:
        The report as a single string without a trailing newline.
    """
    separator = "=" * 50
    # The summary line keeps its embedded newline so that a blank line
    # separates it from the table.
    rows = [
        f"总共处理了 {total_items} 条数据\n",
        separator,
        "正确率分布统计:",
        separator,
    ]
    for i in range(samples_per_item + 1):
        count = distribution.get(i, 0)
        # Guard against division by zero when nothing was tallied.
        percentage = (count / total_items * 100) if total_items > 0 else 0
        rows.append(
            f"{i}/{samples_per_item}: {count:6d} 条 ({percentage:5.2f}%)"
        )
    rows.append(separator)
    return "\n".join(rows)


def main(argv=None):
    """Read the JSONL file named by ``argv[1]`` and print the distribution.

    Args:
        argv: Argument vector; defaults to ``sys.argv``.

    Returns:
        Process exit status: 0 on success, 2 when the file path is missing.
    """
    argv = sys.argv if argv is None else argv
    if len(argv) < 2:
        prog = argv[0] if argv else "script"
        print(f"用法: {prog} <JSONL文件路径>", file=sys.stderr)
        return 2

    with open(argv[1], 'r', encoding='utf-8') as f:
        distribution, total_items, max_samples = tally_accuracies(f)

    # Widen the table when a record has more samples than the default, so
    # every tallied record appears in some printed bucket.
    samples_per_item = max(DEFAULT_SAMPLES_PER_ITEM, max_samples)
    print(format_report(distribution, total_items, samples_per_item))
    return 0


if __name__ == "__main__":
    sys.exit(main())


