# -*- coding: utf-8 -*-
"""
分析COCO Localized Narratives数据集中文本指代目标的准确边界框面积
通过文本匹配找到LN指代的COCO目标，使用COCO的ground truth边界框计算面积比例
"""

import json
import numpy as np
import matplotlib.pyplot as plt
import os
from collections import defaultdict, Counter
import seaborn as sns
from tqdm import tqdm
import re
import nltk
from nltk.corpus import stopwords
from nltk.stem import WordNetLemmatizer
from difflib import SequenceMatcher
from PIL import Image, ImageDraw, ImageFont
import matplotlib.patches as patches
import shutil

nltk.data.path.append('/storage-root/datasets/yangfan/ICLR_AAAI/Trajectory-VLM/tools/nltk_data')

# 下载必要的NLTK数据（如果没有的话）
try:
    nltk.data.find('tokenizers/punkt')
    nltk.data.find('corpora/stopwords')
    nltk.data.find('corpora/wordnet')
except LookupError:
    print("Downloading required NLTK data...")
    nltk.download('punkt', quiet=True)
    nltk.download('stopwords', quiet=True)
    nltk.download('wordnet', quiet=True)

def load_coco_annotations(annotation_path):
    """加载COCO标注文件"""
    print(f"Loading COCO annotations from: {annotation_path}")
    with open(annotation_path, 'r') as f:
        coco_data = json.load(f)
    
    # 构建image_id到图像信息的映射
    images_dict = {img['id']: img for img in coco_data['images']}
    
    # 构建image_id到标注的映射
    annotations_by_image = defaultdict(list)
    for ann in coco_data['annotations']:
        annotations_by_image[ann['image_id']].append(ann)
    
    # 构建category_id到category名称的映射
    categories_dict = {cat['id']: cat['name'] for cat in coco_data['categories']}
    
    # 构建category名称到id的反向映射
    category_name_to_id = {cat['name']: cat['id'] for cat in coco_data['categories']}
    
    return images_dict, annotations_by_image, categories_dict, category_name_to_id

def load_ln_jsonl_files(ln_base_path):
    """加载所有LN的jsonl文件"""
    ln_files = [
        'coco_train_localized_narratives-00000-of-00004.jsonl',
        'coco_train_localized_narratives-00001-of-00004.jsonl', 
        'coco_train_localized_narratives-00002-of-00004.jsonl',
        'coco_train_localized_narratives-00003-of-00004.jsonl'
    ]
    
    ln_data = []
    for file_name in ln_files:
        file_path = os.path.join(ln_base_path, file_name)
        if os.path.exists(file_path):
            print(f"Loading LN file: {file_path}")
            with open(file_path, 'r', encoding='utf-8') as f:
                for line_num, line in enumerate(f, 1):
                    try:
                        data = json.loads(line.strip())
                        ln_data.append(data)
                    except json.JSONDecodeError as e:
                        print(f"Error parsing line {line_num} in {file_name}: {e}")
        else:
            print(f"Warning: File not found: {file_path}")
    
    print(f"Loaded {len(ln_data)} LN annotations")
    return ln_data

class TextMatcher:
    """文本匹配器，用于将LN的token与COCO类别匹配"""
    
    def __init__(self, categories_dict, category_name_to_id):
        self.categories_dict = categories_dict
        self.category_name_to_id = category_name_to_id
        self.lemmatizer = WordNetLemmatizer()
        self.stop_words = set(stopwords.words('english'))
        
        # 构建类别名称的变体映射
        self.category_variants = self._build_category_variants()
        
    def _build_category_variants(self):
        """构建类别名称的各种变体"""
        variants = {}
        
        for cat_id, cat_name in self.categories_dict.items():
            variant_list = set()
            
            # 原始名称
            variant_list.add(cat_name.lower())
            
            # 单数/复数形式
            variant_list.add(self.lemmatizer.lemmatize(cat_name.lower()))
            
            # 处理特殊情况
            special_mappings = {
                'person': ['people', 'man', 'woman', 'boy', 'girl', 'child', 'adult'],
                'car': ['vehicle', 'automobile'],
                'motorcycle': ['bike', 'motorbike'],
                'airplane': ['plane', 'aircraft'],
                'bus': ['coach'],
                'train': ['locomotive'],
                'truck': ['lorry'],
                'boat': ['ship', 'vessel'],
                'traffic light': ['signal', 'light'],
                'fire hydrant': ['hydrant'],
                'stop sign': ['sign'],
                'parking meter': ['meter'],
                'bench': ['seat'],
                'bird': ['birds'],
                'cat': ['cats', 'kitten'],
                'dog': ['dogs', 'puppy'],
                'horse': ['horses'],
                'sheep': ['lamb'],
                'cow': ['cattle', 'bull'],
                'elephant': ['elephants'],
                'bear': ['bears'],
                'zebra': ['zebras'],
                'giraffe': ['giraffes'],
                'backpack': ['bag', 'rucksack'],
                'umbrella': ['parasol'],
                'handbag': ['purse', 'bag'],
                'tie': ['necktie'],
                'suitcase': ['luggage', 'bag'],
                'frisbee': ['disc'],
                'skis': ['ski'],
                'snowboard': ['board'],
                'sports ball': ['ball'],
                'kite': ['kites'],
                'baseball bat': ['bat'],
                'baseball glove': ['glove', 'mitt'],
                'skateboard': ['board'],
                'surfboard': ['board'],
                'tennis racket': ['racket', 'racquet'],
                'bottle': ['bottles'],
                'wine glass': ['glass', 'wineglass'],
                'cup': ['cups', 'mug'],
                'fork': ['forks'],
                'knife': ['knives'],
                'spoon': ['spoons'],
                'bowl': ['bowls'],
                'banana': ['bananas'],
                'apple': ['apples'],
                'sandwich': ['sandwiches'],
                'orange': ['oranges'],
                'broccoli': ['vegetables'],
                'carrot': ['carrots'],
                'hot dog': ['hotdog'],
                'pizza': ['pizzas'],
                'donut': ['donuts', 'doughnut'],
                'cake': ['cakes'],
                'chair': ['chairs', 'seat'],
                'couch': ['sofa', 'settee'],
                'potted plant': ['plant', 'pot'],
                'bed': ['beds'],
                'dining table': ['table'],
                'toilet': ['loo', 'bathroom'],
                'tv': ['television', 'screen'],
                'laptop': ['computer', 'notebook'],
                'mouse': ['mice'],
                'remote': ['controller'],
                'keyboard': ['keys'],
                'cell phone': ['phone', 'mobile'],
                'microwave': ['oven'],
                'oven': ['stove'],
                'toaster': ['toasters'],
                'sink': ['basin'],
                'refrigerator': ['fridge'],
                'book': ['books'],
                'clock': ['clocks', 'time'],
                'vase': ['vases'],
                'scissors': ['shears'],
                'teddy bear': ['bear', 'toy'],
                'hair drier': ['dryer'],
                'toothbrush': ['brush']
            }
            
            if cat_name in special_mappings:
                variant_list.update(special_mappings[cat_name])
            
            variants[cat_id] = list(variant_list)
        
        return variants
    
    def preprocess_token(self, token):
        """预处理token"""
        # 移除标点符号和转为小写
        token = re.sub(r'[^\w\s]', '', token.lower())
        # 词干化
        token = self.lemmatizer.lemmatize(token)
        return token
    
    def match_token_to_categories(self, token):
        """将token匹配到COCO类别"""
        processed_token = self.preprocess_token(token)
        
        if not processed_token or processed_token in self.stop_words:
            return []
        
        matched_categories = []
        
        # 精确匹配
        for cat_id, variants in self.category_variants.items():
            if processed_token in variants:
                matched_categories.append(cat_id)
        
        # 如果没有精确匹配，尝试部分匹配
        if not matched_categories:
            for cat_id, variants in self.category_variants.items():
                for variant in variants:
                    if (processed_token in variant or variant in processed_token) and len(processed_token) > 2:
                        similarity = SequenceMatcher(None, processed_token, variant).ratio()
                        if similarity > 0.8:  # 相似度阈值
                            matched_categories.append(cat_id)
        
        return matched_categories

def calculate_bbox_area_ratio(bbox, image_width, image_height):
    """计算边界框面积相对于图像面积的比例"""
    x, y, w, h = bbox
    bbox_area = w * h
    image_area = image_width * image_height
    return bbox_area / image_area if image_area > 0 else 0

def analyze_ln_with_coco_bboxes(ln_base_path, coco_annotation_path, coco_images_path, area_threshold=0.1, save_images=True, output_dir="coco_bbox_analysis"):
    """使用COCO ground truth边界框分析LN数据"""
    
    # 加载COCO标注
    images_dict, annotations_by_image, categories_dict, category_name_to_id = load_coco_annotations(coco_annotation_path)
    
    # 加载LN数据
    ln_data = load_ln_jsonl_files(ln_base_path)
    
    # 初始化文本匹配器
    text_matcher = TextMatcher(categories_dict, category_name_to_id)
    
    # 统计数据
    results = {
        'total_tokens': 0,
        'matched_tokens': 0,
        'total_matched_bboxes': 0,
        'small_bboxes': 0,
        'area_ratios': [],
        'category_stats': defaultdict(list),
        'token_match_stats': defaultdict(int),
        'unmatched_tokens': defaultdict(int),
        'bbox_size_distribution': [],
        'image_stats': defaultdict(int),
        'small_target_data': [],  # 保存小目标的详细信息
        'image_paths': {}  # 保存图片路径信息
    }
    
    # 创建保存目录
    os.makedirs(output_dir, exist_ok=True)
    if save_images:
        original_images_dir = os.path.join(output_dir, "original_images")
        annotated_images_dir = os.path.join(output_dir, "annotated_images")
        os.makedirs(original_images_dir, exist_ok=True)
        os.makedirs(annotated_images_dir, exist_ok=True)
        print(f"图像将保存到:")
        print(f"  - 原图: {original_images_dir}")
        print(f"  - LN小目标标注图: {annotated_images_dir}/*_ln_annotated.jpg")
        print(f"  - COCO原有标注图: {annotated_images_dir}/*_coco_annotated.jpg")
    
    print(f"Analyzing {len(ln_data)} LN annotations with COCO ground truth bboxes...")
    
    # 记录处理过的图像，避免重复处理
    processed_images = set()
    
    for ln_annotation in tqdm(ln_data):
        image_id = int(ln_annotation['image_id'])
        
        # 检查图像是否存在于COCO中
        if image_id not in images_dict:
            continue
            
        image_info = images_dict[image_id]
        image_width = image_info['width']
        image_height = image_info['height']
        
        # 构建图像路径
        image_filename = f"{image_id:012d}.jpg"
        image_path = os.path.join(coco_images_path, "train2017", image_filename)
        
        # 保存图像路径信息
        results['image_paths'][image_id] = {
            'filename': image_filename,
            'full_path': image_path,
            'width': image_width,
            'height': image_height
        }
        
        # 获取该图像的所有COCO标注
        coco_annotations = annotations_by_image.get(image_id, [])
        if not coco_annotations:
            continue
        
        # 用于存储当前图像的小目标信息
        current_image_small_targets = []
        
        # 获取LN的时间标注文本
        timed_caption = ln_annotation['timed_caption']
        
        for tcap in timed_caption:
            token = tcap['utterance'].strip()
            results['total_tokens'] += 1
            
            if not token or len(token) < 2:
                continue
            
            # 匹配token到COCO类别
            matched_category_ids = text_matcher.match_token_to_categories(token)
            
            if matched_category_ids:
                results['matched_tokens'] += 1
                results['token_match_stats'][token] += 1
                
                # 在该图像的COCO标注中查找匹配的类别
                for ann in coco_annotations:
                    if ann['category_id'] in matched_category_ids:
                        bbox = ann['bbox']  # [x, y, width, height]
                        area_ratio = calculate_bbox_area_ratio(bbox, image_width, image_height)
                        
                        results['total_matched_bboxes'] += 1
                        results['area_ratios'].append(area_ratio)
                        results['category_stats'][categories_dict[ann['category_id']]].append(area_ratio)
                        
                        bbox_info = {
                            'area_ratio': area_ratio,
                            'category': categories_dict[ann['category_id']],
                            'token': token,
                            'bbox_width': bbox[2],
                            'bbox_height': bbox[3],
                            'image_width': image_width,
                            'image_height': image_height,
                            'bbox_coords': bbox,  # [x, y, w, h]
                            'image_id': image_id,
                            'annotation_id': ann['id']
                        }
                        results['bbox_size_distribution'].append(bbox_info)
                        
                        if area_ratio < area_threshold:
                            results['small_bboxes'] += 1
                            
                            # 保存小目标详细信息
                            small_target_info = {
                                'image_id': image_id,
                                'image_filename': image_filename,
                                'image_path': image_path,
                                'category': categories_dict[ann['category_id']],
                                'token': token,
                                'bbox': bbox,  # [x, y, w, h]
                                'area_ratio': area_ratio,
                                'annotation_id': ann['id']
                            }
                            results['small_target_data'].append(small_target_info)
                            current_image_small_targets.append(small_target_info)
                        
                        results['image_stats'][image_id] += 1
            else:
                results['unmatched_tokens'][token] += 1
        
        # 如果当前图像有小目标且需要保存图像，则生成可视化
        if save_images and current_image_small_targets and image_id not in processed_images:
            try:
                # 准备COCO标注数据，添加类别名称
                coco_anns_with_names = []
                for ann in coco_annotations:
                    ann_with_name = ann.copy()
                    ann_with_name['category_name'] = categories_dict.get(ann['category_id'], f"unknown_{ann['category_id']}")
                    coco_anns_with_names.append(ann_with_name)
                
                visualize_single_image_small_targets(
                    image_path, 
                    current_image_small_targets, 
                    original_images_dir,
                    annotated_images_dir,
                    image_id,
                    coco_annotations=coco_anns_with_names
                )
                processed_images.add(image_id)
            except Exception as e:
                print(f"Error processing image {image_id}: {e}")
    
    # 计算统计指标
    if results['area_ratios']:
        results['small_ratio'] = results['small_bboxes'] / results['total_matched_bboxes']
        results['mean_area_ratio'] = np.mean(results['area_ratios'])
        results['median_area_ratio'] = np.median(results['area_ratios'])
        results['std_area_ratio'] = np.std(results['area_ratios'])
        results['min_area_ratio'] = np.min(results['area_ratios'])
        results['max_area_ratio'] = np.max(results['area_ratios'])
    
    results['match_ratio'] = results['matched_tokens'] / results['total_tokens'] if results['total_tokens'] > 0 else 0
    results['area_threshold'] = area_threshold
    
    # 打印统计结果
    print(f"\n=== LN文本与COCO边界框匹配分析结果 ===")
    print(f"总token数量: {results['total_tokens']}")
    print(f"成功匹配的token数量: {results['matched_tokens']}")
    print(f"匹配率: {results['match_ratio']:.2%}")
    print(f"匹配到的边界框总数: {results['total_matched_bboxes']}")
    print(f"面积比例 < {area_threshold} 的边界框数量: {results['small_bboxes']}")
    
    if results['area_ratios']:
        print(f"小面积目标框比例: {results['small_ratio']:.2%}")
        print(f"平均面积比例: {results['mean_area_ratio']:.4f}")
        print(f"中位数面积比例: {results['median_area_ratio']:.4f}")
        print(f"最小面积比例: {results['min_area_ratio']:.6f}")
        print(f"最大面积比例: {results['max_area_ratio']:.4f}")
    
    return results

def visualize_single_image_small_targets(image_path, small_targets, original_dir, annotated_dir, image_id, coco_annotations=None):
    """为单个图像生成三张图：原图、LN小目标标注图像、COCO原有标注图像"""
    try:
        # 检查原图是否存在
        if not os.path.exists(image_path):
            print(f"Warning: Image not found at {image_path}")
            return
        
        # 打开图像
        image = Image.open(image_path).convert('RGB')
        
        # 复制原图到original_images文件夹
        original_save_path = os.path.join(original_dir, f"{image_id:012d}.jpg")
        image.save(original_save_path, quality=95)
        
        # 尝试加载字体
        try:
            font = ImageFont.truetype("/usr/share/fonts/truetype/dejavu/DejaVuSans-Bold.ttf", 20)
            small_font = ImageFont.truetype("/usr/share/fonts/truetype/dejavu/DejaVuSans.ttf", 16)
        except:
            try:
                font = ImageFont.truetype("arial.ttf", 20)
                small_font = ImageFont.truetype("arial.ttf", 16)
            except:
                font = ImageFont.load_default()
                small_font = ImageFont.load_default()
        
        # 定义颜色列表
        colors = ['red', 'blue', 'green', 'orange', 'purple', 'yellow', 'pink', 'cyan', 'magenta', 'lime']
        
        # 创建LN小目标标注图像
        ln_annotated_image = image.copy()
        ln_draw = ImageDraw.Draw(ln_annotated_image)
        
        # 绘制LN小目标边界框
        for i, target in enumerate(small_targets):
            bbox = target['bbox']  # [x, y, w, h]
            x, y, w, h = bbox
            
            # 选择颜色
            color = colors[i % len(colors)]
            
            # 绘制边界框
            ln_draw.rectangle([x, y, x + w, y + h], outline=color, width=3)
            
            # 准备标签文本
            label = f"LN-{target['category']} ({target['area_ratio']:.4f})"
            
            # 计算文本位置
            bbox_text = ln_draw.textbbox((0, 0), label, font=font)
            text_width = bbox_text[2] - bbox_text[0]
            text_height = bbox_text[3] - bbox_text[1]
            
            # 确保文本在图像内
            text_x = max(0, min(x, image.width - text_width))
            text_y = max(0, y - text_height - 5) if y > text_height + 5 else y + h + 5
            
            # 绘制文本背景
            ln_draw.rectangle([text_x, text_y, text_x + text_width, text_y + text_height], 
                         fill='white', outline=color, width=2)
            
            # 绘制文本
            ln_draw.text((text_x, text_y), label, fill=color, font=font)
        
        # 保存LN标注图像
        ln_annotated_save_path = os.path.join(annotated_dir, f"{image_id:012d}_ln_annotated.jpg")
        ln_annotated_image.save(ln_annotated_save_path, quality=95)
        
        # 创建COCO原有标注图像
        if coco_annotations:
            coco_annotated_image = image.copy()
            coco_draw = ImageDraw.Draw(coco_annotated_image)
            
            # 绘制所有COCO标注
            for i, ann in enumerate(coco_annotations):
                bbox = ann['bbox']  # [x, y, w, h]
                x, y, w, h = bbox
                category_name = ann.get('category_name', f"cat_{ann['category_id']}")
                
                # 选择颜色 (使用不同的颜色策略以区分)
                color = colors[(i + len(small_targets)) % len(colors)]
                
                # 绘制边界框
                coco_draw.rectangle([x, y, x + w, y + h], outline=color, width=2)
                
                # 计算面积比例
                bbox_area = w * h
                image_area = image.width * image.height
                area_ratio = bbox_area / image_area if image_area > 0 else 0
                
                # 准备标签文本
                label = f"COCO-{category_name} ({area_ratio:.4f})"
                
                # 计算文本位置
                bbox_text = coco_draw.textbbox((0, 0), label, font=small_font)
                text_width = bbox_text[2] - bbox_text[0]
                text_height = bbox_text[3] - bbox_text[1]
                
                # 确保文本在图像内
                text_x = max(0, min(x, image.width - text_width))
                text_y = max(0, y - text_height - 3) if y > text_height + 3 else y + h + 3
                
                # 绘制文本背景（半透明）
                coco_draw.rectangle([text_x, text_y, text_x + text_width, text_y + text_height], 
                             fill=(255, 255, 255, 200), outline=color, width=1)
                
                # 绘制文本
                coco_draw.text((text_x, text_y), label, fill=color, font=small_font)
            
            # 保存COCO标注图像
            coco_annotated_save_path = os.path.join(annotated_dir, f"{image_id:012d}_coco_annotated.jpg")
            coco_annotated_image.save(coco_annotated_save_path, quality=95)
        
    except Exception as e:
        print(f"Error visualizing image {image_id}: {e}")

def save_small_targets_json(results, output_dir):
    """保存小目标的详细信息到JSON文件"""
    # 整理小目标数据
    small_targets_summary = {
        'metadata': {
            'total_small_targets': len(results['small_target_data']),
            'area_threshold': results['area_threshold'],
            'unique_images_with_small_targets': len(set([t['image_id'] for t in results['small_target_data']])),
            'categories_with_small_targets': len(set([t['category'] for t in results['small_target_data']]))
        },
        'small_targets': results['small_target_data']
    }
    
    # 保存到JSON文件
    json_path = os.path.join(output_dir, 'small_targets_details.json')
    with open(json_path, 'w', encoding='utf-8') as f:
        json.dump(small_targets_summary, f, indent=2, ensure_ascii=False)
    
    # 保存图像路径信息
    image_paths_json = os.path.join(output_dir, 'image_paths.json')
    with open(image_paths_json, 'w', encoding='utf-8') as f:
        json.dump(results['image_paths'], f, indent=2, ensure_ascii=False)
    
    # 按图像分组的小目标信息
    small_targets_by_image = defaultdict(list)
    for target in results['small_target_data']:
        small_targets_by_image[target['image_id']].append(target)
    
    grouped_json_path = os.path.join(output_dir, 'small_targets_by_image.json')
    with open(grouped_json_path, 'w', encoding='utf-8') as f:
        json.dump(dict(small_targets_by_image), f, indent=2, ensure_ascii=False)
    
    print(f"Small targets JSON saved to: {json_path}")
    print(f"Image paths JSON saved to: {image_paths_json}")
    print(f"Small targets by image JSON saved to: {grouped_json_path}")
    
    return json_path, image_paths_json, grouped_json_path

def visualize_coco_bbox_results(results, output_dir="coco_bbox_analysis"):
    """可视化COCO边界框分析结果"""
    os.makedirs(output_dir, exist_ok=True)
    
    if not results['area_ratios']:
        print("No area ratios to visualize")
        return
    
    area_ratios = results['area_ratios']
    area_threshold = results['area_threshold']
    
    # 创建子图
    fig, axes = plt.subplots(2, 3, figsize=(18, 12))
    
    # 1. 面积比例分布直方图
    axes[0, 0].hist(area_ratios, bins=50, alpha=0.7, edgecolor='black', color='skyblue')
    axes[0, 0].axvline(area_threshold, color='red', linestyle='--', 
                      label=f'Threshold = {area_threshold}')
    axes[0, 0].set_xlabel('Area Ratio')
    axes[0, 0].set_ylabel('Frequency')
    axes[0, 0].set_title('Distribution of Area Ratios (COCO GT Bboxes)')
    axes[0, 0].legend()
    axes[0, 0].set_yscale('log')
    
    # 2. 累积分布
    sorted_ratios = np.sort(area_ratios)
    cumulative = np.arange(1, len(sorted_ratios) + 1) / len(sorted_ratios)
    axes[0, 1].plot(sorted_ratios, cumulative, color='green', linewidth=2)
    axes[0, 1].axvline(area_threshold, color='red', linestyle='--',
                      label=f'Threshold = {area_threshold}')
    axes[0, 1].set_xlabel('Area Ratio')
    axes[0, 1].set_ylabel('Cumulative Probability')
    axes[0, 1].set_title('Cumulative Distribution of Area Ratios')
    axes[0, 1].legend()
    axes[0, 1].grid(True, alpha=0.3)
    
    # 3. 对数尺度的面积比例分布
    log_ratios = np.log10(np.array(area_ratios) + 1e-10)
    axes[0, 2].hist(log_ratios, bins=50, alpha=0.7, edgecolor='black', color='lightcoral')
    axes[0, 2].axvline(np.log10(area_threshold), color='red', linestyle='--',
                      label=f'log10({area_threshold}) = {np.log10(area_threshold):.2f}')
    axes[0, 2].set_xlabel('log10(Area Ratio)')
    axes[0, 2].set_ylabel('Frequency')
    axes[0, 2].set_title('Distribution of log10(Area Ratios)')
    axes[0, 2].legend()
    
    # 4. 按类别的面积比例分布
    category_stats = results['category_stats']
    if category_stats:
        # 选择前10个最常见的类别
        top_categories = sorted(category_stats.items(), 
                               key=lambda x: len(x[1]), reverse=True)[:10]
        category_names = [cat[0] for cat in top_categories]
        category_ratios = [cat[1] for cat in top_categories]
        
        axes[1, 0].boxplot(category_ratios, labels=category_names)
        axes[1, 0].axhline(area_threshold, color='red', linestyle='--', alpha=0.7)
        axes[1, 0].set_ylabel('Area Ratio')
        axes[1, 0].set_title('Area Ratio Distribution by Category (Top 10)')
        axes[1, 0].tick_params(axis='x', rotation=45)
    
    # 5. 匹配统计
    match_data = [
        results['matched_tokens'],
        results['total_tokens'] - results['matched_tokens']
    ]
    labels = ['Matched', 'Unmatched']
    axes[1, 1].pie(match_data, labels=labels, autopct='%1.1f%%', 
                   colors=['lightgreen', 'lightcoral'])
    axes[1, 1].set_title('Token Matching Statistics')
    
    # 6. 小面积目标框统计
    small_large_data = [
        results['small_bboxes'],
        results['total_matched_bboxes'] - results['small_bboxes']
    ]
    labels = [f'Small (< {area_threshold})', f'Large (>= {area_threshold})']
    axes[1, 2].pie(small_large_data, labels=labels, autopct='%1.1f%%',
                   colors=['orange', 'lightblue'])
    axes[1, 2].set_title('Bbox Size Distribution')
    
    plt.tight_layout()
    plt.savefig(os.path.join(output_dir, 'coco_bbox_area_analysis.png'), 
               dpi=300, bbox_inches='tight')
    plt.close()
    
    # 7. 最常见的匹配token
    token_stats = results['token_match_stats']
    if token_stats:
        top_tokens = sorted(token_stats.items(), key=lambda x: x[1], reverse=True)[:20]
        tokens, counts = zip(*top_tokens)
        
        plt.figure(figsize=(12, 8))
        plt.barh(range(len(tokens)), counts, color='steelblue')
        plt.yticks(range(len(tokens)), tokens)
        plt.xlabel('Frequency')
        plt.title('Most Frequently Matched Tokens')
        plt.gca().invert_yaxis()
        plt.tight_layout()
        plt.savefig(os.path.join(output_dir, 'matched_tokens_frequency.png'), 
                   dpi=300, bbox_inches='tight')
        plt.close()
    
    # 8. 最常见的未匹配token
    unmatched_stats = results['unmatched_tokens']
    if unmatched_stats:
        top_unmatched = sorted(unmatched_stats.items(), key=lambda x: x[1], reverse=True)[:20]
        if top_unmatched:
            tokens, counts = zip(*top_unmatched)
            
            plt.figure(figsize=(12, 8))
            plt.barh(range(len(tokens)), counts, color='lightcoral')
            plt.yticks(range(len(tokens)), tokens)
            plt.xlabel('Frequency')
            plt.title('Most Frequently Unmatched Tokens')
            plt.gca().invert_yaxis()
            plt.tight_layout()
            plt.savefig(os.path.join(output_dir, 'unmatched_tokens_frequency.png'), 
                       dpi=300, bbox_inches='tight')
            plt.close()
    
    print(f"Visualizations saved to: {output_dir}")

def save_detailed_statistics(results, output_dir="coco_bbox_analysis"):
    """保存详细统计信息到文件"""
    os.makedirs(output_dir, exist_ok=True)
    
    # 保存统计摘要
    stats_file = os.path.join(output_dir, 'coco_bbox_statistics.txt')
    with open(stats_file, 'w', encoding='utf-8') as f:
        f.write("=== COCO Localized Narratives 与 COCO Ground Truth 边界框分析结果 ===\n\n")
        f.write(f"总token数量: {results['total_tokens']}\n")
        f.write(f"成功匹配的token数量: {results['matched_tokens']}\n")
        f.write(f"匹配率: {results['match_ratio']:.2%}\n")
        f.write(f"匹配到的边界框总数: {results['total_matched_bboxes']}\n")
        f.write(f"面积比例 < {results['area_threshold']} 的边界框数量: {results['small_bboxes']}\n")
        f.write(f"包含小目标的图像数量: {len(set([t['image_id'] for t in results['small_target_data']]))}\n")
        
        if results['area_ratios']:
            f.write(f"小面积目标框比例: {results['small_ratio']:.2%}\n")
            f.write(f"平均面积比例: {results['mean_area_ratio']:.4f}\n")
            f.write(f"中位数面积比例: {results['median_area_ratio']:.4f}\n")
            f.write(f"标准差: {results['std_area_ratio']:.4f}\n")
            f.write(f"最小面积比例: {results['min_area_ratio']:.6f}\n")
            f.write(f"最大面积比例: {results['max_area_ratio']:.4f}\n")
            
            # 百分位数统计
            percentiles = [1, 5, 10, 25, 50, 75, 90, 95, 99]
            f.write(f"\n面积比例百分位数:\n")
            for p in percentiles:
                value = np.percentile(results['area_ratios'], p)
                f.write(f"  {p}%: {value:.6f}\n")
        
        # 按类别统计
        f.write(f"\n按类别统计 (前20个):\n")
        category_stats = results['category_stats']
        sorted_categories = sorted(category_stats.items(), 
                                 key=lambda x: len(x[1]), reverse=True)[:20]
        for cat_name, ratios in sorted_categories:
            mean_ratio = np.mean(ratios)
            small_count = sum(1 for r in ratios if r < results['area_threshold'])
            small_percent = small_count / len(ratios) * 100
            f.write(f"  {cat_name}: {len(ratios)} 个目标, "
                   f"平均面积比例 {mean_ratio:.4f}, "
                   f"小目标比例 {small_percent:.1f}%\n")
    
    # 保存详细的bbox信息到JSON
    bbox_details_file = os.path.join(output_dir, 'bbox_details.json')
    with open(bbox_details_file, 'w', encoding='utf-8') as f:
        json.dump(results['bbox_size_distribution'], f, indent=2, ensure_ascii=False)
    
    # 保存小目标的JSON文件
    save_small_targets_json(results, output_dir)
    
    print(f"Detailed statistics saved to: {stats_file}")
    print(f"Bbox details saved to: {bbox_details_file}")

if __name__ == '__main__':
    # 配置路径
    LN_BASE_PATH = '/storage-root/datasets/yangfan/Seg_LLaVA_v2/datasets/Localized_Narratives'
    # COCO_ANNOTATION_PATH = '/storage-root/datasets/yangfan/coco2017/annotations/instances_train2017.json'
    COCO_ANNOTATION_PATH = '/storage-root/datasets/yangfan/ICLR_AAAI/Trajectory-VLM/processed_coco_phrases/processed_phrases_train_chunk0_20250901_132607.json'
    COCO_IMAGES_PATH = '/storage-root/datasets/yangfan/coco2017'  # COCO图像的根目录
    
    # 设置面积阈值
    AREA_THRESHOLD = 0.001

    # 创建输出目录
    import datetime
    timestamp = datetime.datetime.now().strftime("%Y%m%d_%H%M%S")
    output_dir = f"coco_bbox_analysis_qwen_{timestamp}"
    
    try:
        print("="*60)
        print("COCO Localized Narratives 小目标分析")
        print("="*60)
        
        # 执行分析
        results = analyze_ln_with_coco_bboxes(
            ln_base_path=LN_BASE_PATH,
            coco_annotation_path=COCO_ANNOTATION_PATH,
            coco_images_path=COCO_IMAGES_PATH,
            area_threshold=AREA_THRESHOLD,
            save_images=True,  # 保存图像
            output_dir=output_dir
        )
        
        print(f"\n{'='*60}")
        print("生成可视化结果和统计报告...")
        print(f"{'='*60}")
        
        # 生成可视化结果
        visualize_coco_bbox_results(results, output_dir)
        
        # 保存详细统计
        save_detailed_statistics(results, output_dir)
        
        print(f"\n{'='*60}")
        print("分析完成！")
        print(f"{'='*60}")
        print(f"结果保存在: {os.path.abspath(output_dir)}")
        print(f"- 原图保存在: {os.path.join(output_dir, 'original_images')}")
        print(f"- 标注图保存在: {os.path.join(output_dir, 'annotated_images')}")
        print(f"  * _ln_annotated.jpg: LN小目标标注图像")
        print(f"  * _coco_annotated.jpg: COCO原有标注图像")
        print(f"- 小目标详情JSON: {os.path.join(output_dir, 'small_targets_details.json')}")
        print(f"- 图像路径JSON: {os.path.join(output_dir, 'image_paths.json')}")
        print(f"- 按图像分组JSON: {os.path.join(output_dir, 'small_targets_by_image.json')}")
        
        # 打印一些关键统计信息
        if results['small_target_data']:
            print(f"\n关键统计信息:")
            print(f"- 发现 {len(results['small_target_data'])} 个小目标")
            print(f"- 涉及 {len(set([t['image_id'] for t in results['small_target_data']]))} 张图像")
            print(f"- 涉及 {len(set([t['category'] for t in results['small_target_data']]))} 个类别")
            
            # 显示最常见的小目标类别
            small_target_categories = [t['category'] for t in results['small_target_data']]
            category_counts = Counter(small_target_categories)
            print(f"\n最常见的小目标类别:")
            for category, count in category_counts.most_common(10):
                print(f"  {category}: {count} 个")
        
    except Exception as e:
        print(f"分析过程中出现错误: {e}")
        import traceback
        traceback.print_exc()