import json
import os

def calculate_accuracy(file_path):
    """
    计算JSONL文件中'judge'字段为'yes'的记录比例。

    Args:
        file_path (str): JSONL文件的路径。

    Returns:
        float: 正确记录的比例（0到1之间）。
        None: 如果文件不存在或发生其他错误。
    """
    total_records = 0
    correct_records = 0

    # try:
    with open(file_path, 'r', encoding='utf-8') as f:
        # 使用 json.load() 读取文件内容并解析为 Python 对象
        data = json.load(f)
    for record in data:
        total_records += 1
        if record.get("judge") == "Yes":
            correct_records += 1
    if total_records == 0:
        print("文件中没有记录。")
        return 0.0
    else:
        accuracy = correct_records / total_records
        return accuracy

# 示例使用
if __name__ == "__main__":
    step = 120
    model_name = f"train_step_140"
    full_name = f"{model_name}_seed42_answer.json"
    benchmarks = ["p-bench", "p-bench-crop","mmstar", "hrbench-4k", "hrbench-8k", "vstar", "cvbench-2d", "cvbench-3d", "countqa", "colorbench", "mathvision","babyvision",'loki','mme-realworld', 'mme-realworld-cn']
    for benchmark in benchmarks:
        jsonl_file = os.path.join("./judge", benchmark, full_name)
        try:
            accuracy = calculate_accuracy(jsonl_file)

            if accuracy is not None:
                print(f"{model_name}:{benchmark}:acc:{accuracy*100:.2f}")
        except:
            continue