import json
import os

def calculate_yes_percentage():
    # 加载人工评估数据
    human_eval_path = "/Users/wad3/Downloads/Research/AutoBench-V-private/annotations/easy_human_evaluation.json"
    aligned_images_path = "/Users/wad3/Downloads/Research/AutoBench-V-private/document/basic_understanding/aligned_image_json_stable_diffusion/easy_aligned_images.json"
    
    # 检查文件是否存在
    if not os.path.exists(human_eval_path):
        print(f"人工评估文件不存在: {human_eval_path}")
        return
    
    if not os.path.exists(aligned_images_path):
        print(f"对齐图像文件不存在: {aligned_images_path}")
        return
    
    # 加载数据
    with open(human_eval_path, 'r', encoding='utf-8') as f:
        human_evaluations = json.load(f)
    
    with open(aligned_images_path, 'r', encoding='utf-8') as f:
        aligned_images = json.load(f)
    
    # 创建图像路径到评估结果的映射
    image_to_eval = {}
    for item in human_evaluations:
        image_path = item.get('image_path', '')
        evaluation = item.get('evaluation', '')
        if image_path and evaluation:
            image_to_eval[image_path] = evaluation
    
    # 统计结果
    total_found = 0
    total_yes = 0
    not_found = []
    
    for aligned_item in aligned_images:
        image_path = aligned_item.get('image_path', '')
        if image_path in image_to_eval:
            total_found += 1
            if image_to_eval[image_path] == 'Yes':
                total_yes += 1
        else:
            not_found.append(image_path)
    
    # 计算百分比
    yes_percentage = (total_yes / total_found * 100) if total_found > 0 else 0
    
    # 打印结果
    print(f"总共找到的图像: {total_found}")
    print(f"评估为'Yes'的图像: {total_yes}")
    print(f"'Yes'占比: {yes_percentage:.2f}%")
    print(f"未找到人工评估的图像数量: {len(not_found)}")
    
    # 如果想查看哪些图像没有找到对应的评估
    if not_found:
        print("\n未找到人工评估的图像:")
        for i, path in enumerate(not_found[:5], 1):  # 只显示前5个
            print(f"{i}. {os.path.basename(path)}")
        if len(not_found) > 5:
            print(f"... 以及其他 {len(not_found) - 5} 个文件")
    
    # 分析按方面(aspect)的评估结果
    aspect_stats = {}
    for aligned_item in aligned_images:
        image_path = aligned_item.get('image_path', '')
        aspect = aligned_item.get('aspect', 'Unknown')
        
        if image_path in image_to_eval:
            if aspect not in aspect_stats:
                aspect_stats[aspect] = {'total': 0, 'yes': 0}
            
            aspect_stats[aspect]['total'] += 1
            if image_to_eval[image_path] == 'Yes':
                aspect_stats[aspect]['yes'] += 1
    
    # 打印按方面的统计结果
    print("\n按方面(aspect)的评估结果:")
    for aspect, stats in sorted(aspect_stats.items(), key=lambda x: x[1]['total'], reverse=True):
        yes_percent = (stats['yes'] / stats['total'] * 100) if stats['total'] > 0 else 0
        print(f"{aspect}: {stats['yes']}/{stats['total']} ({yes_percent:.2f}%)")

if __name__ == "__main__":
    calculate_yes_percentage()