import json
import os
import pandas as pd
import numpy as np

# 定义文件路径
json_directory = "document/basic_understanding/aligned_image_json_dall_e_3"
output_directory = "/Users/wad3/Downloads/Research/AutoBench-V-private/document/results"
os.makedirs(output_directory, exist_ok=True)

# 确保输出目录存在
if not os.path.exists(output_directory):
    os.makedirs(output_directory)

def extract_scores(difficulty):
    """从指定难度的JSON文件中提取分数"""
    file_path = os.path.join(json_directory, f"{difficulty}_aligned_images.json")
    
    if not os.path.exists(file_path):
        print(f"文件不存在: {file_path}")
        return []
    
    try:
        with open(file_path, 'r', encoding='utf-8') as f:
            data = json.load(f)
        
        # 提取分数和相关信息
        scores = []
        for item in data:
            # 检查项目是否有score字段
            if 'score' in item:
                scores.append({
                    'difficulty': difficulty,
                    'score': item['score'],
                    'model': item.get('model', 'unknown')
                })
        
        return scores
    except Exception as e:
        print(f"处理 {difficulty} 难度文件时出错: {str(e)}")
        return []

# 提取所有难度的分数
all_scores = []
for difficulty in ['easy', 'medium', 'hard']:
    difficulty_scores = extract_scores(difficulty)
    all_scores.extend(difficulty_scores)
    print(f"从 {difficulty} 难度提取了 {len(difficulty_scores)} 个评分")

# 转换为DataFrame
df = pd.DataFrame(all_scores)

# 计算每个难度的平均分
difficulty_avg = df.groupby('difficulty')['score'].agg(['mean', 'std', 'count', 'min', 'max']).reset_index()
difficulty_avg['mean'] = difficulty_avg['mean'].round(4)
difficulty_avg['std'] = difficulty_avg['std'].round(4)

# 创建分数范围分布统计
# 定义分数范围
score_bins = [0, 0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1.0]
bin_labels = [f'{score:.1f}-{score+0.1:.1f}' for score in score_bins[:-1]]

# 添加分数范围分类
df['score_range'] = pd.cut(df['score'], bins=score_bins, labels=bin_labels, include_lowest=True)

# 计算每个难度和分数范围的数量
score_distribution = df.groupby(['difficulty', 'score_range']).size().reset_index(name='count')

# 将分布转换为透视表格式，方便查看
score_pivot = score_distribution.pivot(index='difficulty', columns='score_range', values='count').fillna(0).astype(int)

# 计算每个难度下各分数段的百分比
percentages = {}
for difficulty in df['difficulty'].unique():
    difficulty_total = df[df['difficulty'] == difficulty].shape[0]
    difficulty_dist = score_distribution[score_distribution['difficulty'] == difficulty].copy()
    difficulty_dist['percentage'] = (difficulty_dist['count'] / difficulty_total * 100).round(2)
    percentages[difficulty] = difficulty_dist

# 合并所有难度的百分比数据
percentage_df = pd.concat(percentages.values())

# 保存结果
csv_path = os.path.join(output_directory, 'dall_e_3_image_scores.csv')
df.to_csv(csv_path, index=False)

summary_path = os.path.join(output_directory, 'dall_e_3_score_summary.csv')
difficulty_avg.to_csv(summary_path, index=False)

# 保存分数分布统计
distribution_path = os.path.join(output_directory, 'dall_e_3_score_distribution_counts.csv')
score_distribution.to_csv(distribution_path, index=False)

# 保存透视表格式的分数分布
# pivot_path = os.path.join(output_directory, 'dall_e_3_score_distribution_pivot.csv')
# score_pivot.to_csv(pivot_path)

# 保存百分比分布
percentage_path = os.path.join(output_directory, 'dall_e_3_score_distribution_percentage.csv')
percentage_df.to_csv(percentage_path, index=False)

print(f"\n总共处理了 {len(df)} 个图像评分")
print(f"保存评分数据到: {csv_path}")
print(f"保存难度摘要到: {summary_path}")
print(f"保存分数分布计数到: {distribution_path}")
# print(f"保存分数分布透视表到: {pivot_path}")
print(f"保存分数分布百分比到: {percentage_path}")

# 打印摘要统计
print("\n每个难度的平均分:")
for _, row in difficulty_avg.iterrows():
    print(f"{row['difficulty']}: {row['mean']:.4f} ± {row['std']:.4f} (样本数: {row['count']}, 范围: {row['min']:.2f}-{row['max']:.2f})")

# 打印分数分布
print("\n分数分布统计:")
for difficulty in sorted(df['difficulty'].unique()):
    print(f"\n{difficulty} 难度:")
    dist = score_pivot.loc[difficulty].to_dict()
    # 排序后打印
    for score_range, count in sorted(dist.items()):
        if count > 0:
            percentage = (count / difficulty_avg[difficulty_avg['difficulty'] == difficulty]['count'].values[0]) * 100
            print(f"  {score_range}: {count} ({percentage:.1f}%)")