#!/usr/bin/env python3
"""
Optimized Grounding DINO Medical Image Testing Script
Main optimizations:
1. Integrate complete vocabulary database from get_enhanced_medical_vocabulary_data function
2. Intelligent prompt generation based on real statistical data
3. Improved normal/abnormal report judgment logic
4. Unified maximum anatomical structure region detection strategy
5. Retain excellent quality control and selection algorithms
"""

import os
import json
import cv2
import numpy as np
import random
import torch
import re
from pathlib import Path
from groundingdino.util.inference import load_model, load_image, predict, annotate
import argparse


def load_jsonl(file_path):
    """Load JSONL file"""
    data = []
    with open(file_path, 'r', encoding='utf-8') as f:
        for line in f:
            data.append(json.loads(line.strip()))
    return data


def get_enhanced_medical_vocabulary_data():
    """
    Return complete enhanced medical vocabulary table data

    Returns:
        dict: Vocabulary data containing all medical imaging categories
    """

    vocabulary_data = {
        'Abdominal': {
            'high_priority': ['ct', 'axial', 'significant', 'liver', 'mass', 'lesion', 'hypodense', 'enhancement',
                              'calcification', 'dilation'],
            'anatomy_specific': ['abdomen', 'abdominal', 'liver', 'pancreas', 'kidney', 'spleen', 'gallbladder',
                                 'stomach'],
            'medical_phrases': ['hypodense lesion', 'significant inflammation', 'hypodense mass', 'acute inflammation',
                                'significant organ'],
            'suggested_prompts': [  # 15 items
                'liver lesion', 'liver mass', 'kidney lesion', 'kidney mass', 'pancreas lesion', 'pancreas mass',
                'spleen lesion', 'spleen mass',
                'gallbladder lesion', 'gallbladder mass', 'significant liver', 'significant stones',
                'significant abdominal', 'significant mass', 'significant aorta'
            ],
            'high_priority_combinations': [  # 20 items
                'significant liver', 'significant stones', 'significant abdominal', 'significant mass',
                'significant aorta', 'significant inflammation', 'significant spleen', 'significant abdomen',
                'significant obstruction', 'significant hemorrhage', 'significant lesion', 'significant gallbladder',
                'significant pancreas', 'significant bowel', 'significant fluid', 'liver lesion',
                'liver mass', 'liver cyst', 'kidney lesion', 'kidney mass'
            ],
            'no_expressions': [  # 30 items
                'no obvious', 'no evidence', 'no significant', 'no apparent', 'no obvious mass', 'no obvious masses',
                'no apparent artifacts', 'no apparent mass',
                'no apparent masses', 'no significant structural abnormalities', 'no evidence of mass', 'no focal',
                'no acute', 'no significant artifacts', 'no evidence of masses', 'no obvious abnormalities',
                'no focal lesions', 'no evidence of free fluid or', 'no significant abnormalities',
                'no significant structural abnormalities are observed', 'no significant mass', 'no significant masses',
                'no obvious abnormalities of the liver', 'no visible masses',
                'no evidence of hemorrhage', 'no evident masses',
                'no significant structural abnormalities are identified', 'no clear', 'no focal masses',
                'no evidence of hydronephrosis'
            ],
        },

        'Bone and Joint': {
            'high_priority': ['joint', 'bone', 'fracture', 'space', 'dislocation', 'infection', 'subluxation',
                              'arthritis', 'displacement'],
            'anatomy_specific': ['bone', 'joint', 'spine', 'ligament', 'tendon', 'muscle', 'fracture', 'arthritis'],
            'medical_phrases': ['significant bone', 'acute infection', 'abnormal bone', 'acute inflammation',
                                'mild bone'],
            'suggested_prompts': [  # 15 items
                'bone fracture', 'bone dislocation', 'joint fracture', 'joint dislocation', 'fracture fracture',
                'fracture dislocation', 'significant joint', 'significant bone',
                'significant fracture', 'significant osteoporosis', 'significant space', 'obvious joint',
                'obvious bone', 'obvious fracture', 'obvious osteoporosis'
            ],
            'high_priority_combinations': [  # 20 items
                'significant joint', 'significant bone', 'significant fracture', 'significant osteoporosis',
                'significant space', 'significant dislocation', 'significant fractures', 'significant infection',
                'significant radius', 'significant soft', 'significant subluxation', 'significant tissue',
                'significant humerus', 'significant swelling', 'significant alignment', 'bone fracture',
                'bone dislocation', 'bone lesion', 'joint fracture', 'joint dislocation'
            ],
            'no_expressions': [  # 30 items
                'no evidence', 'no obvious', 'no obvious fracture', 'no obvious fractures', 'no significant',
                'no apparent', 'no evidence of dislocation', 'no significant artifacts',
                'no apparent artifacts', 'no evidence of fracture', 'no evidence of joint dislocation or',
                'no evidence of dislocation or joint', 'no obvious fractures or joint abnormalities',
                'no signs of infection', 'no evidence of fractures', 'no apparent fractures',
                'no obvious fractures or dislocations', 'no overt fractures', 'no evidence of osteoporosis',
                'no evidence of joint space narrowing', 'no evidence of osteoporosis or osteophyte',
                'no evidence of dislocation or subluxation', 'no apparent foreign bodies or signs',
                'no evidence of joint dislocation',
                'no fracture', 'no fractures', 'no evidence of osteoporosis or bone', 'no evidence of displacement',
                'no evidence of osteoporosis or other', 'no obvious joint abnormalities'
            ]
        },

        'Breast': {
            'high_priority': ['mammogram', 'mass', 'calcification', 'abnormal', 'benign', 'scattered', 'density',
                              'tissue', 'focal', 'irregular'],
            'anatomy_specific': ['breast', 'mammary', 'nipple', 'ductal', 'fibroglandular', 'fibroadenoma',
                                 'calcification', 'microcalcification'],
            'medical_phrases': ['increased density', 'benign lesion', 'focal mass', 'irregular mass', 'dense tissue'],
            'suggested_prompts': [  # 15 items
                'breast mass', 'breast lesion', 'spiculated breast', 'spiculated density', 'spiculated mass',
                'spiculated distortion', 'spiculated calcifications', 'focal breast',
                'focal density', 'focal mass', 'focal distortion', 'focal calcifications', 'suspicious breast',
                'suspicious density', 'suspicious mass'
            ],
            'high_priority_combinations': [  # 20 items
                'spiculated breast', 'spiculated density', 'spiculated mass', 'spiculated distortion',
                'spiculated calcifications', 'spiculated asymmetry', 'spiculated calcification', 'spiculated implant',
                'spiculated malignancy', 'spiculated masses', 'spiculated tissue', 'spiculated densities',
                'spiculated biopsy', 'spiculated lesion', 'spiculated tumor', 'breast mass',
                'breast calcification', 'breast lesion', 'breast distortion', 'mass calcification'
            ],
            'no_expressions': [  # 30 items
                'no abnormal', 'no palpable', 'no palpable mass', 'no obvious', 'no evidence', 'no calcification',
                'no calcifications', 'no obvious mass',
                'no signs of malignancy', 'no abnormal findings', 'no mass', 'no obvious masses',
                'no abnormal findings are identified', 'no suspicious', 'no evidence of post',
                'no architectural distortion',
                'no abnormal findings are observed', 'no abnormal findings are noted',
                'no evidence of architectural distortion or', 'no apparent', 'no abnormal findings identified',
                'no suspicious findings', 'no significant', 'no suspicious calcifications',
                'no abnormal findings detected', 'no focal', 'no palpable masses', 'no focal mass', 'no masses',
                'no evidence of malignancy'
            ]
        },

        'Cardiac': {
            'high_priority': ['effusion', 'infarction', 'ischemia', 'stenosis', 'ventricle', 'artery', 'valve',
                              'dilation', 'thickened', 'enlarged'],
            'anatomy_specific': ['heart', 'cardiac', 'coronary', 'aorta', 'ventricle', 'atrium', 'valve', 'mitral'],
            'medical_phrases': ['focal thickening', 'abnormal enhancement', 'significant stenosis',
                                'significant calcification', 'mild dilation'],
            'suggested_prompts': [  # 15 items
                'heart dysfunction', 'cardiac dysfunction', 'coronary dysfunction', 'significant effusion',
                'significant cardiac', 'significant myocardium', 'significant infarction', 'significant ischemia',
                'focal effusion', 'focal cardiac', 'focal myocardium', 'focal infarction', 'focal ischemia',
                'abnormal effusion', 'abnormal cardiac'
            ],
            'high_priority_combinations': [  # 20 items
                'significant effusion', 'significant cardiac', 'significant myocardium', 'significant infarction',
                'significant ischemia', 'significant coronary', 'significant hypertrophy', 'significant stenosis',
                'significant ventricle', 'significant chambers', 'significant artery', 'significant thickening',
                'significant ventricles', 'significant calcifications', 'significant signal', 'heart dysfunction',
                'heart stenosis', 'heart regurgitation', 'cardiac dysfunction', 'cardiac stenosis'
            ],
            'no_expressions': [  # 30 items
                'no evidence', 'no significant', 'no apparent', 'no evidence of myocardial infarction',
                'no pericardial effusion', 'no evidence of pericardial effusion or',
                'no evidence of pericardial effusion', 'no evidence of myocardial hypertrophy or',
                'no significant artifacts', 'no evidence of myocardial infarction or', 'no obvious',
                'no evidence of myocardial hypertrophy', 'no significant vascular abnormalities are observed',
                'no significant vascular abnormalities', 'no evidence of myocardial ischemia or',
                'no evidence of coronary artery stenosis',
                'no focal', 'no pericardial effusion noted', 'no evidence of myocardial ischemia',
                'no significant coronary artery stenosis', 'no significant coronary artery stenosis or',
                'no pericardial effusion is observed', 'no significant vascular abnormalities or pericardial',
                'no evidence of wall thickening or',
                'no significant vascular abnormalities or functional',
                'no significant vascular abnormalities are identified', 'no evidence of wall motion abnormalities',
                'no significant vascular abnormalities such as', 'no acute', 'no pericardial effusion is noted'
            ]
        },

        'Chest': {
            'high_priority': ['chest', 'effusion', 'lung', 'pneumothorax', 'consolidation', 'atelectasis', 'pneumonia',
                              'opacity', 'pleural'],
            'anatomy_specific': ['chest', 'lung', 'pulmonary', 'mediastinum', 'bronchus', 'alveolar', 'pneumonia',
                                 'atelectasis'],
            'medical_phrases': ['increased lung', 'mild atelectasis', 'significant lung', 'increased opacity',
                                'mild lung'],
            'suggested_prompts': [  # 15 items
                'lung opacity', 'lung effusion', 'chest opacity', 'chest effusion', 'pulmonary opacity',
                'pulmonary effusion', 'thoracic opacity', 'thoracic effusion',
                'pleural chest', 'pleural effusion', 'pleural lung', 'pleural consolidation', 'pleural pneumothorax',
                'significant chest', 'significant effusion'
            ],
            'high_priority_combinations': [  # 20 items
                'pleural chest', 'pleural effusion', 'pleural lung', 'pleural consolidation', 'pleural pneumothorax',
                'pleural pulmonary', 'pleural opacity', 'pleural edema',
                'pleural fracture', 'pleural pneumonia', 'pleural opacities', 'pleural effusions', 'pleural fractures',
                'pleural cardiac', 'pleural heart', 'lung opacity',
                'lung effusion', 'lung pneumonia', 'lung consolidation', 'chest opacity'
            ],
            'no_expressions': [  # 30 items
                'no significant', 'no evidence', 'no significant abnormalities', 'no evidence of cardiomegaly',
                'no significant findings', 'no cardiomegaly', 'no pleural effusion', 'no pneumothorax',
                'no consolidation', 'no fracture', 'no evidence of consolidation', 'no atelectasis',
                'no evidence of pleural effusion', 'no evidence of pulmonary edema', 'no evidence of pneumothorax',
                'no evidence of lung opacity',
                'no significant cardiomegaly', 'no significant abnormalities including cardiomegaly', 'no lung opacity',
                'no significant lung opacities', 'no fractures', 'no pleural other', 'no pleural effusions', 'no clear',
                'no evidence of pleural effusion or', 'no obvious', 'no pneumonia', 'no lung lesion',
                'no significant lung opacity', 'no lung opacity or lesion'
            ]
        },

        'Cranial': {
            'high_priority': ['lesion', 'mass', 'edema', 'hyperintense', 'hypointense', 'lobe', 'brain', 'enhancement',
                              'hyperdense', 'tumor'],
            'anatomy_specific': ['brain', 'cerebral', 'cerebellar', 'brainstem', 'skull', 'cranial', 'intracranial',
                                 'ventricular'],
            'medical_phrases': ['significant mass', 'mild mass', 'significant enhancement', 'hypodense lesion',
                                'significant brain'],
            'suggested_prompts': [  # 15 items
                'brain lesion', 'brain mass', 'white lesion', 'white mass', 'matter lesion', 'matter mass',
                'acute stroke', 'acute lesion',
                'acute lobe', 'acute mass', 'acute edema', 'ischemic stroke', 'ischemic lesion', 'ischemic lobe',
                'ischemic mass'
            ],
            'high_priority_combinations': [  # 20 items
                'acute stroke', 'acute lesion', 'acute lobe', 'acute mass', 'acute edema', 'acute brain',
                'acute hemorrhage', 'acute tumor',
                'acute area', 'acute enhancement', 'acute hemisphere', 'acute signal', 'acute flair', 'acute atrophy',
                'acute intensity', 'brain lesion',
                'brain mass', 'brain infarct', 'brain hemorrhage', 'brain edema'
            ],
            'no_expressions': [  # 30 items
                'no significant', 'no evidence', 'no midline shift', 'no significant midline shift or ventricular',
                'no significant mass effect', 'no evidence of midline shift or', 'no obvious',
                'no midline shift or significant ventricular',
                'no significant mass effect or midline', 'no apparent', 'no obvious acute ischemic stroke', 'no acute',
                'no acute ischemic stroke', 'no evidence of acute ischemic stroke', 'no evidence of mass effect or',
                'no significant enhancement',
                'no significant midline shift noted', 'no evidence of significant midline shift',
                'no significant midline shift', 'no enhancement', 'no significant mass effect noted',
                'no midline shift noted', 'no significant midline shift or mass',
                'no evidence of significant mass effect',
                'no clear', 'no midline shift or significant atrophy', 'no evidence of mass effect',
                'no midline shift is observed', 'no significant midline shift is observed',
                'no evidence of hydrocephalus'
            ]
        },

        'Dental': {
            'high_priority': ['bone', 'root', 'radiolucent', 'radiopaque', 'cavity', 'canal', 'occlusion', 'partial',
                              'severe', 'sclerotic'],
            'anatomy_specific': ['tooth', 'teeth', 'dental', 'oral', 'mandible', 'maxilla', 'periodontal', 'root'],
            'medical_phrases': ['significant bone', 'minimal bone', 'mild bone', 'increased density',
                                'chronic inflammation'],
            'suggested_prompts': [  # 15 items
                'tooth caries', 'tooth decay', 'root caries', 'root decay', 'crown caries', 'crown decay',
                'gingival caries', 'gingival decay',
                'periapical caries', 'periapical teeth', 'periapical resorption', 'periapical tooth',
                'periapical molars', 'significant caries', 'significant teeth'
            ],
            'high_priority_combinations': [  # 20 items
                'periapical caries', 'periapical teeth', 'periapical resorption', 'periapical tooth',
                'periapical molars', 'periapical root', 'periapical restoration', 'periapical amalgam',
                'periapical mandible', 'periapical premolars', 'periapical implant', 'periapical area',
                'periapical crown', 'periapical composite', 'periapical apex', 'tooth caries',
                'tooth decay', 'tooth resorption', 'root caries', 'root decay'
            ],
            'no_expressions': [  # 30 items
                'no obvious', 'no obvious caries', 'no visible', 'no apparent', 'no significant',
                'no significant artifacts', 'no cyst', 'no evidence',
                'no restoration', 'no obvious carious lesions', 'no evidence of caries', 'no signs',
                'no visible caries', 'no evidence of cysts', 'no missing teeth', 'no significant artifacts noted',
                'no obvious signs of caries', 'no evidence of bone destruction or', 'no evidence of periapical lesions',
                'no significant abnormalities noted', 'no significant bone destruction or alveolar',
                'no significant resorption', 'no obvious periapical lesions', 'no obvious cysts',
                'no obvious restorations', 'no clear', 'no caries', 'no evidence of cysts or tumors',
                'no significant bone destruction', 'no obvious fractures'
            ]
        },

        'Dermatological': {
            'high_priority': ['lesion', 'irregular', 'multiple', 'skin', 'elevated', 'area', 'melanoma', 'carcinoma',
                              'nodule', 'localized'],
            'anatomy_specific': ['skin', 'dermal', 'epidermal', 'subcutaneous', 'cutaneous', 'lesion', 'rash', 'ulcer'],
            'medical_phrases': ['benign lesion', 'significant inflammation', 'significant thickening',
                                'malignant lesion', 'mild edema'],
            'suggested_prompts': [  # 15 items
                'skin melanoma', 'skin carcinoma', 'lesion melanoma', 'lesion carcinoma', 'nevus melanoma',
                'nevus carcinoma', 'pigmented melanoma', 'pigmented carcinoma',
                'melanocytic melanoma', 'melanocytic carcinoma', 'irregular lesion', 'irregular ulceration',
                'irregular distribution', 'irregular skin', 'irregular texture'
            ],
            'high_priority_combinations': [  # 20 items
                'irregular lesion', 'irregular ulceration', 'irregular distribution', 'irregular skin',
                'irregular texture', 'irregular area', 'irregular lesions', 'irregular seborrheic',
                'irregular keratosis', 'irregular macule', 'irregular erythema', 'irregular acne',
                'irregular psoriasis', 'irregular border', 'irregular eczema', 'skin melanoma',
                'skin carcinoma', 'skin lesion', 'lesion melanoma', 'lesion carcinoma'
            ],
            'no_expressions': [  # 30 items
                'no evidence', 'no evidence of ulceration or crusting', 'no visible', 'no ulceration', 'no signs',
                'no significant', 'no signs of ulceration or crusting', 'no visible ulceration or crusting',
                'no apparent', 'no evidence of ulceration or significant', 'no evidence of ulceration',
                'no significant color changes', 'no obvious', 'no evidence of irregular borders',
                'no significant color changes or irregular', 'no signs of ulceration',
                'no visible irregular borders', 'no clear', 'no crusting', 'no visible signs of ulceration or',
                'no visible lesions', 'no significant ulceration or crusting', 'no signs of ulceration or significant',
                'no evidence of irregular borders or',
                'no significant ulceration or crusting noted', 'no evidence of crusting or ulceration',
                'no visible ulceration', 'no visible crusting or ulceration',
                'no significant irregular borders or crusting', 'no visible artifacts'
            ]
        },

        'Endoscopy': {
            'high_priority': ['stomach', 'lesion', 'bleeding', 'inflammation', 'polyp', 'tract', 'segment', 'mucosa',
                              'nerve', 'blood'],
            'anatomy_specific': ['endoscopic', 'gastroscopy', 'mucosa', 'polyp', 'stricture', 'inflammation'],
            'medical_phrases': ['significant inflammation', 'mild inflammation', 'chronic inflammation', 'mild edema',
                                'benign lesion'],
            'suggested_prompts': [  # 15 items
                'bleeding mucosa', 'bleeding stomach', 'bleeding lesion', 'bleeding ulcers', 'bleeding lesions',
                'irregular mucosa', 'irregular stomach', 'irregular lesion',
                'irregular ulcers', 'irregular lesions', 'elevated mucosa', 'elevated stomach', 'elevated lesion',
                'elevated ulcers', 'elevated lesions'
            ],
            'high_priority_combinations': [  # 20 items
                'bleeding mucosa', 'bleeding stomach', 'bleeding lesion', 'bleeding ulcers', 'bleeding lesions',
                'bleeding polyps', 'bleeding inflammation', 'bleeding erosion',
                'bleeding area', 'bleeding polyp', 'bleeding ulcer', 'bleeding gastritis', 'bleeding erosions',
                'bleeding esophagus', 'bleeding folds', 'polyp inflammation',
                'lesion inflammation', 'ulcer inflammation', 'mass inflammation', 'tumor inflammation'
            ],
            'no_expressions': [  # 30 items
                'no visible', 'no visible lesions', 'no ulcer', 'no evidence', 'no apparent', 'no significant',
                'no obvious', 'no polyp',
                'no polyps', 'no signs', 'no visible abnormalities', 'no visible lesions or abnormalities',
                'no visible ulcers', 'no visible polyps', 'no visible ulceration or bleeding',
                'no significant artifacts',
                'no evidence of ulceration or bleeding', 'no ulcers', 'no visible abnormalities such as polyps',
                'no obvious lesions', 'no abnormal', 'no evidence of ulcers', 'no visible ulcers or polyps',
                'no lesions',
                'no lesion', 'no visible lesions or abnormalities in', 'no obvious ulcers', 'no obvious polyps',
                'no visible ulceration', 'no significant lesions'
            ]
        },

        'Fundus': {
            'high_priority': ['edema', 'scattered', 'hemorrhage', 'vessel', 'disc', 'macula', 'retinal', 'optic',
                              'dilation'],
            'anatomy_specific': ['fundus', 'retina', 'retinal', 'optic', 'disc', 'macula', 'macular', 'vessel'],
            'medical_phrases': ['small hemorrhage', 'dark lesion', 'significant dilation', 'significant edema',
                                'minimal hemorrhage'],
            'suggested_prompts': [  # 15 items
                'macula atrophy', 'retina atrophy', 'vessels atrophy', 'hemorrhage atrophy', 'hard fundus',
                'hard neovascularization', 'hard atrophy', 'hard macula',
                'hard vessels', 'soft fundus', 'soft neovascularization', 'soft atrophy', 'soft macula', 'soft vessels',
                'scattered fundus'
            ],
            'high_priority_combinations': [  # 20 items
                'hard fundus', 'hard neovascularization', 'hard atrophy', 'hard macula', 'hard vessels', 'hard dr',
                'hard retina', 'hard fovea',
                'hard hemorrhage', 'hard exudate', 'hard microaneurysm', 'hard veins', 'hard pdr', 'hard cup',
                'hard telangiectasia', 'macula atrophy',
                'macula degeneration', 'macula neovascularization', 'macula exudate', 'retina atrophy'
            ],
            'no_expressions': [  # 30 items
                'no apparent', 'no signs', 'no evidence', 'no signs of cupping or atrophy', 'no microaneurysm',
                'no signs of diabetic retinopathy', 'no evidence of macular edema or', 'no evidence of macular edema',
                'no signs of diabetic retinopathy or', 'no evidence of diabetic retinopathy',
                'no signs of optic disc cupping', 'no significant', 'no macular edema', 'no diabetic retinopathy',
                'no evidence of hemorrhages', 'no evidence of microaneurysms',
                'no evidence of diabetic retinopathy or', 'no signs of cupping', 'no signs of macular edema',
                'no evidence of optic disc cupping', 'no visible', 'no signs of macular edema or',
                'no signs of hemorrhages', 'no evidence of cupping or atrophy',
                'no visible microaneurysms', 'no evidence of neovascularization', 'no signs of edema',
                'no signs of microaneurysms', 'no hemorrhage', 'no dr'
            ]
        },

        'Gynecological': {
            'high_priority': ['lesion', 'uterus', 'ovary', 'cervix', 'abnormal', 'inflammation', 'artifact',
                              'hypoechoic', 'solid', 'complex'],
            'anatomy_specific': ['uterus', 'uterine', 'cervix', 'cervical', 'ovary', 'ovarian', 'endometrium',
                                 'myometrium'],
            'medical_phrases': ['mild inflammation', 'chronic inflammation', 'moderate inflammation',
                                'significant inflammation', 'minimal inflammation'],
            'suggested_prompts': [  # 15 items
                'uterus cyst', 'uterus mass', 'ovary cyst', 'ovary mass', 'cervix cyst', 'cervix mass', 'adnexa cyst',
                'adnexa mass',
                'pelvis cyst', 'pelvis mass', 'atypical lesion', 'atypical lesions', 'atypical fibroids',
                'atypical ultrasound', 'atypical cervix'
            ],
            'high_priority_combinations': [  # 20 items
                'atypical lesion', 'atypical lesions', 'atypical fibroids', 'atypical ultrasound', 'atypical cervix',
                'atypical area', 'atypical mass', 'atypical uterus',
                'atypical ovaries', 'atypical cyst', 'atypical ovary', 'atypical pelvis', 'atypical cysts',
                'atypical transvaginal', 'atypical tumors', 'uterus cyst',
                'uterus mass', 'uterus fibroid', 'uterus carcinoma', 'ovary cyst'
            ],
            'no_expressions': [  # 30 items
                'no evidence', 'no evidence of high', 'no clear', 'no significant', 'no apparent', 'no visible',
                'no significant artifacts', 'no evidence of low',
                'no abnormal', 'no obvious', 'no evidence of dysplasia or malignancy',
                'no evidence of other abnormalities', 'no visible cellular abnormalities', 'no signs', 'no definite',
                'no visible artifacts',
                'no significant artifacts present', 'no significant abnormalities',
                'no evidence of abnormal cellular changes', 'no visible abnormalities', 'no evidence of abnormal cells',
                'no evidence of cellular atypia or', 'no evidence of hsil or cancer',
                'no evidence of cervical cytology abnormalities',
                'no visible ovarian lesions', 'no significant cellular abnormalities', 'no significant artifacts noted',
                'no evidence of ovarian lesions', 'no evidence of abnormal cell morphology', 'no evidence of hsil'
            ]
        },

        'Pathology Slide': {
            'high_priority': ['tissue', 'malignancy', 'cancer', 'lesion', 'infiltrative', 'necrosis', 'tumor', 'cell',
                              'nucleus', 'stain'],
            'anatomy_specific': ['microscopic', 'histologic', 'cytologic', 'tissue', 'cell', 'nucleus', 'cytoplasm',
                                 'stain'],
            'medical_phrases': ['malignant lesion', 'malignant tumor', 'benign lesion', 'benign tissue',
                                'chronic inflammation'],
            'suggested_prompts': [  # 20 items
                'malignant cells', 'malignant tissue', 'malignant tumor', 'malignant neoplasm', 'malignant lesion',
                'carcinoma cells',
                'carcinoma tissue', 'carcinoma tumor', 'carcinoma neoplasm', 'carcinoma lesion', 'sarcoma cells',
                'sarcoma tissue',
                'sarcoma tumor', 'sarcoma neoplasm', 'sarcoma lesion', 'lymphoma cells', 'lymphoma tissue',
                'lymphoma tumor',
                'lymphoma neoplasm', 'lymphoma lesion'
            ],
            'high_priority_combinations': [  # 25 items
                'mitotic adenocarcinoma', 'mitotic atypia', 'mitotic tissue', 'mitotic slide', 'mitotic nuclei',
                'mitotic lesion',
                'mitotic pleomorphism', 'mitotic neoplasm', 'mitotic cells', 'mitotic growth', 'mitotic carcinoma',
                'mitotic stroma',
                'mitotic section', 'mitotic tumor', 'mitotic primary', 'malignant cells', 'malignant tissue',
                'malignant lesion',
                'malignant tumor', 'malignant carcinoma', 'atypical cells', 'atypical tissue', 'atypical lesion',
                'atypical tumor',
                'atypical carcinoma'
            ],
            'no_expressions': [  # 40 items
                'no significant', 'no evidence', 'no apparent', 'no mitotic figures', 'no clear',
                'no significant artifacts',
                'no significant mitotic activity', 'no evidence of benign features', 'no obvious', 'no visible',
                'no visible artifacts', 'no obvious artifacts',
                'no significant mitotic figures', 'no evidence of benign structures',
                'no significant artifacts present', 'no evidence of benign components',
                'no evidence of necrosis or significant', 'no clear glandular formation',
                'no significant nuclear atypia or mitotic', 'no clear evidence of benign features',
                'no evidence of significant stromal invasion', 'no significant artifacts noted',
                'no evidence of benign elements', 'no clear glandular structures',
                'no evidence of benign characteristics', 'no evidence of benign tissue', 'no abnormal',
                'no obvious mitotic figures', 'no signs', 'no evidence of significant mitotic activity',
                'no clear evidence of benign components', 'no significant artifacts are present',
                'no significant artifacts observed', 'no evidence of glandular formation',
                'no evidence of significant necrosis', 'no significant architectural preservation',
                'no clear benign structures present', 'no evidence of significant necrosis or',
                'no significant mitotic activity is observed', 'no obvious glandular structures'
            ]
        }
    }

    # Directional terminology
    direction_terms = {
        'left': ['left', 'l.', 'sinister'],
        'right': ['right', 'r.', 'dexter'],
        'upper': ['upper', 'superior', 'cranial', 'cephalic', 'top'],
        'lower': ['lower', 'inferior', 'caudal', 'bottom'],
        'anterior': ['anterior', 'front', 'ventral'],
        'posterior': ['posterior', 'back', 'dorsal'],
        'medial': ['medial', 'inner', 'central'],
        'lateral': ['lateral', 'outer', 'side'],
        'proximal': ['proximal', 'near'],
        'distal': ['distal', 'far'],
        # Additional combination directions
        'right_upper': ['right upper', 'upper right', 'right superior', 'superior right', 'right cranial',
                        'cranial right'],
        'right_lower': ['right lower', 'lower right', 'right inferior', 'inferior right', 'right caudal',
                        'caudal right'],
        'left_upper': ['left upper', 'upper left', 'left superior', 'superior left', 'left cranial', 'cranial left'],
        'left_lower': ['left lower', 'lower left', 'left inferior', 'inferior left', 'left caudal', 'caudal left']
    }

    # Strong normal report indicators
    strong_normal_indicators = [
        'normal', 'unremarkable', 'clear', 'negative', 'within normal limits',
        'no abnormalities', 'no pathology', 'healthy', 'intact', 'stable'
    ]

    # "no" related normal indicator patterns
    no_patterns = [
        'no obvious', 'no significant', 'no evidence', 'no abnormal',
        'no masses', 'no lesions', 'no acute', 'no pathology',
        'no abnormalities', 'no findings', 'no changes'
    ]

    return {
        'vocabulary_data': vocabulary_data,
        'direction_terms': direction_terms,
        'strong_normal_indicators': strong_normal_indicators,
        'no_patterns': no_patterns
    }


def get_category_fallback_prompts():
    """
    Return fallback detection prompts for each category

    Returns:
        dict: Mapping from categories to fallback prompts
    """
    fallback_mapping = {
        'Abdominal': ['abdomen', 'abdominal cavity', 'abdominal organs'],
        'Chest': ['chest', 'thorax', 'lung fields'],
        'Cardiac': ['heart', 'cardiac shadow', 'mediastinum'],
        'Breast': ['breast', 'mammary tissue', 'chest wall'],
        'Cranial': ['brain', 'skull', 'head'],
        'Bone and Joint': ['bone', 'joint', 'skeletal structure'],
        'Dental': ['teeth', 'jaw', 'oral cavity'],
        'Dermatological': ['skin', 'surface', 'tissue'],
        'Endoscopy': ['mucosa', 'lumen', 'wall'],
        'Fundus': ['retina', 'optic disc', 'macula'],
        'Gynecological': ['pelvis', 'uterus', 'ovary'],
        'Pathology Slide': ['tissue', 'cells', 'sample']
    }

    return fallback_mapping


class OptimizedMedicalVocabularyManager:
    """Optimized medical vocabulary manager - intelligent detection based on real statistical data"""

    def __init__(self):
        # Load complete vocabulary data
        vocab_data = get_enhanced_medical_vocabulary_data()
        self.category_vocabularies = vocab_data['vocabulary_data']
        self.direction_terms = vocab_data['direction_terms']
        self.strong_normal_indicators = vocab_data['strong_normal_indicators']
        self.no_patterns = vocab_data['no_patterns']

        # Load fallback prompts
        self.fallback_prompts = get_category_fallback_prompts()

        print("✅ Optimized vocabulary manager initialization complete")
        print(f"   📊 Supporting {len(self.category_vocabularies)} medical imaging categories")
        print(f"   🎯 Vocabulary database optimized based on real statistical data")

    def get_category_from_folder(self, folder_name):
        """Infer medical imaging category from folder name"""
        folder_lower = folder_name.lower()

        category_mapping = {
            'abdominal': 'Abdominal',
            'bone': 'Bone and Joint',
            'joint': 'Bone and Joint',
            'breast': 'Breast',
            'cardiac': 'Cardiac',
            'chest': 'Chest',
            'cranial': 'Cranial',
            'dental': 'Dental',
            'dermatological': 'Dermatological',
            'endoscopy': 'Endoscopy',
            'fundus': 'Fundus',
            'gynecological': 'Gynecological',
            'pathology': 'Pathology Slide'
        }

        for key, category in category_mapping.items():
            if key in folder_lower:
                return category

        return 'Abdominal'  # Default category

    def extract_direction_info(self, caption):
        """Extract direction information from description"""
        caption_lower = caption.lower()
        directions = {}

        for direction, terms in self.direction_terms.items():
            for term in terms:
                if term in caption_lower:
                    # Extract context, see what anatomical structures the directional term modifies
                    pattern = rf'\b{re.escape(term)}\s+(\w+)'
                    matches = re.finditer(pattern, caption_lower)
                    for match in matches:
                        anatomy = match.group(1)
                        if direction not in directions:
                            directions[direction] = []
                        directions[direction].append(anatomy)

        return directions

    def is_sentence_normal(self, sentence):
        """Determine if individual sentence indicates normal/no abnormal status"""
        sentence = sentence.strip().lower()
        if not sentence:
            return True  # Empty sentence considered normal

        print(f"      Analyzing sentence: '{sentence[:50]}...'")

        # Check for strong normal indicators
        for indicator in self.strong_normal_indicators:
            if indicator in sentence:
                print(f"        ✓ Found strong normal indicator: '{indicator}'")
                return True

        # Split sentence by commas into segments
        segments = [seg.strip() for seg in sentence.split(',')]

        for i, segment in enumerate(segments):
            # Check segments containing "no" (case insensitive)
            segment_lower = segment.lower()
            if 'no ' in segment_lower or segment_lower.startswith('no'):
                print(f"        Checking 'no' segment: '{segment}'")

                # Find position of "no", analyze from "no" onwards (case insensitive)
                no_pos = segment_lower.find('no ')
                if no_pos == -1:
                    no_pos = 0 if segment_lower.startswith('no') else -1

                if no_pos >= 0:
                    # Content from "no" to end of segment (use original segment to preserve case)
                    if no_pos == 0:
                        no_content = segment.strip()
                    else:
                        no_content = segment[no_pos:].strip()

                    # Check if this segment is very short (only 1-2 words), if so continue merging next segment
                    words_in_no_content = no_content.split()
                    if len(words_in_no_content) <= 2 and i < len(segments) - 1:
                        # Merge next segment
                        next_segment = segments[i + 1].strip()
                        no_content += " " + next_segment
                        print(f"        Merged next segment: '{no_content}'")

                    # Check if "no" content indicates normal
                    if self.is_no_phrase_normal(no_content):
                        print(f"        ✓ 'no' segment indicates normal: '{no_content}'")
                        return True

        # Check other normal patterns
        normal_patterns = [
            r'within\s+normal\s+limits',
            r'unremarkable',
            r'negative\s+for',
            r'clear\s+of',
            r'free\s+of'
        ]

        for pattern in normal_patterns:
            if re.search(pattern, sentence):
                print(f"        ✓ Matched normal pattern: '{pattern}'")
                return True

        print(f"        ✗ Sentence may contain abnormal information")
        return False

    def is_no_phrase_normal(self, no_phrase):
        """Determine if phrases containing 'no' indicate normal status"""
        no_phrase = no_phrase.lower().strip()

        print(f"          Analyzing 'no' phrase: '{no_phrase}'")

        # Check predefined "no" patterns
        for pattern in self.no_patterns:
            if pattern in no_phrase:
                print(f"          ✓ Matched predefined pattern: '{pattern}'")
                return True

        # Check "no + abnormal vocabulary" patterns
        abnormal_terms = [
            'abnormalities', 'abnormality', 'lesions', 'lesion', 'masses', 'mass',
            'nodules', 'nodule', 'tumors', 'tumor', 'pathology', 'disease',
            'findings', 'changes', 'enhancement', 'enlargement', 'calcification',
            'inflammation', 'infection', 'fracture', 'dislocation', 'hemorrhage',
            'fluid', 'air', 'pneumothorax', 'effusion', 'consolidation', 'stones',
            'obstruction', 'distension', 'bleeding', 'swelling', 'edema'
        ]

        # Check various "no + abnormal vocabulary" combinations
        for term in abnormal_terms:
            patterns_to_check = [
                f"no {term}",
                f"no obvious {term}",
                f"no significant {term}",
                f"no evidence of {term}",
                f"no signs of {term}",
                f"no apparent {term}",
                f"no visible {term}",
                f"no free {term}",  # For "no free fluid" type expressions
                f"no {term} or",  # For "no fluid or air" type expressions
                f"no {term} is seen",
                f"no {term} are seen"
            ]

            for pattern in patterns_to_check:
                if pattern in no_phrase:
                    print(f"          ✓ Matched 'no + abnormal vocabulary' pattern: '{pattern}'")
                    return True

        # Special handling: Check if it's "no [adjective] [abnormal vocabulary]" pattern
        # Like: "no free fluid", "no active bleeding", "no acute changes"
        adjectives = ['free', 'active', 'acute', 'chronic', 'significant', 'obvious', 'apparent', 'visible', 'clear',
                      'definite']

        for adj in adjectives:
            for term in abnormal_terms:
                pattern = f"no {adj} {term}"
                if pattern in no_phrase:
                    print(f"          ✓ Matched 'no + adjective + abnormal vocabulary' pattern: '{pattern}'")
                    return True

        # Check if contains vocabulary indicating normal status (even without abnormal vocabulary)
        # Like: "no abnormalities", "no pathology" etc.
        normal_indicators_after_no = [
            'abnormalities', 'abnormality', 'pathology', 'disease', 'findings',
            'changes', 'problems', 'issues', 'concerns', 'complications'
        ]

        for indicator in normal_indicators_after_no:
            if f"no {indicator}" in no_phrase:
                print(f"          ✓ Matched 'no + normal indicator' pattern: 'no {indicator}'")
                return True

        print(f"          ✗ No normal patterns matched")
        return False

    def is_normal_report(self, caption):
        """
        Improved normal report judgment logic:
        1. First split by periods into sentences
        2. Analyze whether each sentence is in normal status
        3. Special rule: If last sentence contains no/No, treat that sentence as no abnormalities
        4. Enhanced rule: If "no" or "No" is in segment after last comma, also treat as last sentence
        5. Only when all sentences are normal status, judge as normal report
        """
        if not caption or len(caption.strip()) < 5:
            return True  # Too short reports treated as normal

        print(f"    📋 Starting report normality analysis...")

        # Split by periods into sentences
        sentences = [s.strip() for s in caption.split('.') if s.strip()]

        if not sentences:
            return True  # No valid sentences treated as normal

        print(f"    Split into {len(sentences)} sentences")

        normal_sentence_count = 0

        for i, sentence in enumerate(sentences):
            is_last_sentence = (i == len(sentences) - 1)

            # Special rule: If last sentence contains no/No, treat that sentence as no abnormalities
            # Enhanced version: Also check last segment after comma
            if is_last_sentence:
                sentence_lower = sentence.lower()
                no_in_sentence = 'no ' in sentence_lower or sentence_lower.startswith('no')

                if no_in_sentence:
                    # Further check: If sentence has commas, ensure "no" is after last comma
                    if ',' in sentence:
                        last_comma_pos = sentence.rfind(',')
                        after_last_comma = sentence[last_comma_pos + 1:].strip().lower()

                        # If "no" is after last comma, only this part is treated as normal
                        # Rest needs normal analysis
                        if 'no ' in after_last_comma or after_last_comma.startswith('no'):
                            print(f"      Sentence {i + 1} (last sentence): 🔍 Detected 'no' segment after last comma")

                            # Analyze part before comma
                            before_last_comma = sentence[:last_comma_pos].strip()
                            print(f"        Before comma: '{before_last_comma}'")
                            print(f"        After comma: '{sentence[last_comma_pos + 1:].strip()}'")

                            # Part before comma analyzed with normal logic
                            before_comma_normal = self.is_sentence_normal(before_last_comma)

                            if before_comma_normal:
                                print(
                                    f"        ✅ Entire sentence normal (before comma normal + after comma 'no' segment)")
                                normal_sentence_count += 1
                            else:
                                print(
                                    f"        ⚠️ Entire sentence abnormal (before comma has abnormal info, despite 'no' after comma)")
                            continue
                        else:
                            # "no" not after last comma, process with normal logic
                            print(
                                f"      Sentence {i + 1} (last sentence): 🔍 'no' not after last comma, analyze with normal logic")
                    else:
                        # No comma in sentence, directly apply last sentence rule
                        print(f"      Sentence {i + 1} (last sentence): ✅ Normal (last sentence with 'no' rule)")
                        normal_sentence_count += 1
                        continue

            # Regular sentence analysis
            is_normal = self.is_sentence_normal(sentence)
            if is_normal:
                normal_sentence_count += 1
                print(f"      Sentence {i + 1}: ✅ Normal")
            else:
                print(f"      Sentence {i + 1}: ⚠️ Potentially abnormal")

        # Only when all sentences are normal, judge as normal report
        all_normal = (normal_sentence_count == len(sentences))

        print(f"    Normal sentences: {normal_sentence_count}/{len(sentences)}")
        print(f"    📊 Final judgment: {'✅ Normal report' if all_normal else '⚠️ Abnormal report'}")

        return all_normal

    def generate_anatomical_prompts(self, category):
        """Generate anatomical structure detection prompts for normal reports"""
        if category not in self.category_vocabularies:
            category = 'Abdominal'

        vocab = self.category_vocabularies[category]

        # Prioritize anatomy-specific vocabulary
        prompts = []
        prompts.extend(vocab['anatomy_specific'][:4])  # Anatomical structures
        prompts.extend([f"normal {term}" for term in vocab['anatomy_specific'][:2]])  # Add "normal" modifier
        prompts.extend([f"healthy {term}" for term in vocab['anatomy_specific'][:2]])  # Add "healthy" modifier

        return prompts[:6]  # Maximum 6 prompts

    def generate_detection_prompts(self, category, positive_caption=None):
        """Generate detection prompts for specific category, optimized based on real statistical data"""
        if category not in self.category_vocabularies:
            category = 'Abdominal'

        vocab = self.category_vocabularies[category]
        prompts = []

        # Check if normal report
        if positive_caption and self.is_normal_report(positive_caption):
            print(f"    🎯 Identified as normal report, using anatomical region prompts")
            return self.generate_anatomical_prompts(category)

        # Extract direction information
        directions = {}
        if positive_caption:
            directions = self.extract_direction_info(positive_caption)
            if directions:
                print(f"    🧭 Extracted direction info: {directions}")

        # 1. Use high-frequency combinations based on statistical frequency (highest priority)
        print(f"    📊 Using statistical data-based high-frequency vocabulary combinations")
        prompts.extend(vocab['high_priority_combinations'][:4])

        # 2. Use suggested specialized prompts
        prompts.extend(vocab['suggested_prompts'][:4])

        # 3. High-priority individual terms
        prompts.extend(vocab['high_priority'][:3])

        # 4. If direction info available, generate direction-related prompts
        if directions and positive_caption:
            direction_prompts = self.generate_direction_prompts(directions, vocab, positive_caption)
            prompts.extend(direction_prompts)

        # 5. If original description available, extract key phrases
        if positive_caption and not self.is_normal_report(positive_caption):
            medical_phrases = self.extract_medical_phrases(positive_caption, vocab)
            prompts.extend(medical_phrases)

        # 6. Deduplicate and limit quantity
        unique_prompts = []
        for prompt in prompts:
            if prompt and prompt not in unique_prompts and len(prompt.strip()) > 2:
                unique_prompts.append(prompt.strip())

        return unique_prompts[:8]  # Maximum 8 prompts

    def generate_fallback_prompts(self, category, is_normal=False):
        """Generate fallback detection prompts - broader anatomical regions"""
        base_prompts = self.fallback_prompts.get(category, ['anatomical structure', 'tissue'])

        if is_normal:
            # Fallback prompts for normal reports
            return base_prompts[:3]
        else:
            # Fallback prompts for abnormal reports
            enhanced_prompts = []
            for prompt in base_prompts[:2]:
                enhanced_prompts.extend([
                    f"abnormal {prompt}",
                    f"{prompt} lesion",
                    f"{prompt} abnormality"
                ])
            return enhanced_prompts[:4]

    def generate_direction_prompts(self, directions, vocab, caption):
        """Generate specialized detection prompts based on direction information"""
        direction_prompts = []

        # Combine directional terms with anatomical structures
        for direction, anatomies in directions.items():
            for anatomy in anatomies:
                # Check if anatomy is in vocabulary table
                all_terms = vocab['high_priority'] + vocab['anatomy_specific']
                if anatomy in [term.lower() for term in all_terms]:
                    direction_prompts.append(f"{direction} {anatomy}")

        # If description has specific lesions, combine with directions
        caption_lower = caption.lower()
        lesion_terms = ['lesion', 'mass', 'nodule', 'tumor', 'abnormality']

        for term in lesion_terms:
            if term in caption_lower:
                for direction in directions.keys():
                    direction_prompts.append(f"{direction} {term}")

        return direction_prompts[:3]

    def extract_medical_phrases(self, caption, vocab):
        """Extract key medical phrases from description"""
        phrases = []

        # Use predefined medical phrases
        caption_lower = caption.lower()
        for phrase in vocab.get('medical_phrases', []):
            if phrase.lower() in caption_lower:
                phrases.append(phrase)

        # Extract "adjective+noun" pattern medical terminology
        import re

        # Common medical adjectives
        medical_adjectives = ['hypodense', 'hyperdense', 'well-defined', 'ill-defined', 'irregular',
                              'homogeneous', 'heterogeneous', 'enhancing', 'non-enhancing']

        # Common medical nouns
        medical_nouns = ['lesion', 'mass', 'nodule', 'tumor', 'cyst', 'calcification', 'enhancement']

        for adj in medical_adjectives:
            for noun in medical_nouns:
                pattern = rf'\b{adj}\s+{noun}\b'
                if re.search(pattern, caption_lower):
                    phrases.append(f"{adj} {noun}")

        return phrases[:2]


def calculate_iou(box1, box2):
    """Calculate IoU (Intersection over Union) of two boxes"""
    x1_1, y1_1, x2_1, y2_1 = box1
    x1_2, y1_2, x2_2, y2_2 = box2

    # Calculate intersection
    x1_inter = max(x1_1, x1_2)
    y1_inter = max(y1_1, y1_2)
    x2_inter = min(x2_1, x2_2)
    y2_inter = min(y2_1, y2_2)

    if x2_inter <= x1_inter or y2_inter <= y1_inter:
        return 0.0

    inter_area = (x2_inter - x1_inter) * (y2_inter - y1_inter)

    # Calculate union
    area1 = (x2_1 - x1_1) * (y2_1 - y1_1)
    area2 = (x2_2 - x1_2) * (y2_2 - y1_2)
    union_area = area1 + area2 - inter_area

    return inter_area / union_area if union_area > 0 else 0.0


def calculate_box_quality_v2(box_area, image_area, confidence):
    """Redesigned quality scoring function - strict quality control matching 0.1 confidence threshold"""
    area_ratio = box_area / image_area

    # Confidence weight (85%) - further increase confidence importance, matching 0.1 threshold
    confidence_score = confidence * 0.85

    # Basic reasonableness weight (12%) - area requirements
    if area_ratio < 0.015:  # Too small (1.5%)
        reasonableness_score = 0.0
    elif area_ratio > 0.6:  # Too large (60%), may include too much background
        reasonableness_score = 0.03
    elif 0.05 <= area_ratio <= 0.4:  # Ideal range
        reasonableness_score = 0.12
    else:  # Other ranges
        reasonableness_score = 0.08

    # Position stability weight (3%) - not at image edges
    position_score = 0.03

    total_score = confidence_score + reasonableness_score + position_score
    return total_score


def calculate_containment_relationship(box1, box2):
    """Calculate containment relationship between two boxes"""
    x1_1, y1_1, x2_1, y2_1 = box1
    x1_2, y1_2, x2_2, y2_2 = box2

    # Check if box1 contains box2
    box1_contains_box2 = (x1_1 <= x1_2 and y1_1 <= y1_2 and x2_1 >= x2_2 and y2_1 >= y2_2)

    # Check if box2 contains box1
    box2_contains_box1 = (x1_2 <= x1_1 and y1_2 <= y1_1 and x2_2 >= x2_1 and y2_2 >= y2_1)

    if box1_contains_box2:
        return 'box1_contains_box2'
    elif box2_contains_box1:
        return 'box2_contains_box1'
    else:
        return 'no_containment'


def calculate_iou_boxes(box1, box2):
    """Calculate IoU of pixel coordinate boxes"""
    x1_1, y1_1, x2_1, y2_1 = box1
    x1_2, y1_2, x2_2, y2_2 = box2

    # Calculate intersection
    x1_inter = max(x1_1, x1_2)
    y1_inter = max(y1_1, y1_2)
    x2_inter = min(x2_1, x2_2)
    y2_inter = min(y2_1, y2_2)

    if x2_inter <= x1_inter or y2_inter <= y1_inter:
        return 0.0

    inter_area = (x2_inter - x1_inter) * (y2_inter - y1_inter)

    # Calculate union
    area1 = (x2_1 - x1_1) * (y2_1 - y1_1)
    area2 = (x2_2 - x1_2) * (y2_2 - y1_2)
    union_area = area1 + area2 - inter_area

    return inter_area / union_area if union_area > 0 else 0.0


def smart_roi_selection_with_direction(boxes, logits, phrases, image_size=(256, 256), directions=None, max_rois=3):
    """
    Intelligent ROI selection: integrated direction filtering, completely solve overlap, achieve true best selection
    """
    if len(boxes) == 0:
        return boxes, logits, phrases

    # Convert to numpy
    if isinstance(boxes, torch.Tensor):
        boxes_np = boxes.cpu().numpy()
        scores = logits.max(dim=1)[0].cpu().numpy() if logits.dim() > 1 else logits.cpu().numpy()
    else:
        boxes_np = boxes
        scores = logits

    w, h = image_size
    candidates = []

    print(f"    🔍 Original detection: {len(boxes_np)} boxes")

    # Step 1: Basic filtering and quality assessment
    for i, (box, score, phrase) in enumerate(zip(boxes_np, scores, phrases)):
        # Convert coordinates to pixels
        if all(0 <= coord <= 1.0 for coord in box):
            x1, y1, x2, y2 = box
            x1_px, y1_px = int(x1 * w), int(y1 * h)
            x2_px, y2_px = int(x2 * w), int(y2 * h)
        else:
            x1_px, y1_px, x2_px, y2_px = map(int, box)

        # Ensure correct coordinate order
        x1_px, x2_px = min(x1_px, x2_px), max(x1_px, x2_px)
        y1_px, y2_px = min(y1_px, y2_px), max(y1_px, y2_px)

        # Calculate box dimensions
        box_w = x2_px - x1_px
        box_h = y2_px - y1_px
        box_area = box_w * box_h
        area_ratio = box_area / (w * h)

        print(f"    Candidate box{i + 1}: {box_w}x{box_h}, area ratio {area_ratio:.3f}, confidence {score:.3f}")

        # Basic filtering - raise quality standards
        if box_w < 15 or box_h < 15:  # Raise minimum size requirement
            print(f"      -> ❌ Filtered: size too small")
            continue

        if score < 0.2:  # Strict confidence requirement, filter all boxes below 0.1
            print(f"      -> ❌ Filtered: confidence too low ({score:.3f} < 0.2)")
            continue

        # Edge detection - avoid selecting boxes too close to edges
        margin = 8  # Increase edge distance, avoid including too much black area
        if (x1_px < margin or y1_px < margin or
                x2_px > w - margin or y2_px > h - margin):
            print(f"      -> ❌ Filtered: too close to edge")
            continue

        # Extreme aspect ratio check
        aspect_ratio = max(box_w, box_h) / min(box_w, box_h)
        if aspect_ratio > 6:  # Lower aspect ratio limit
            print(f"      -> ❌ Filtered: aspect ratio too large ({aspect_ratio:.1f})")
            continue

        # Area reasonableness check - avoid too small or too large boxes
        if area_ratio < 0.01:  # Too small boxes
            print(f"      -> ❌ Filtered: area too small ({area_ratio:.3f})")
            continue
        elif area_ratio > 0.7:  # Too large boxes, may include too much background
            print(f"      -> ❌ Filtered: area too large ({area_ratio:.3f})")
            continue

        # Direction filtering: If direction info available, filter boxes not matching direction
        position_bonus = 0
        if directions:
            position_bonus = calculate_position_bonus(x1_px, y1_px, x2_px, y2_px, w, h, directions, phrase)
            if position_bonus < 0:  # Position clearly doesn't match
                print(f"      -> ❌ Filtered: direction doesn't match")
                continue

        # Calculate quality score
        quality_score = calculate_box_quality_v2(box_area, w * h, score) + position_bonus

        candidates.append({
            'index': i,
            'box': [x1_px, y1_px, x2_px, y2_px],
            'box_norm': box,
            'score': score,
            'phrase': phrase,
            'area': box_area,
            'quality_score': quality_score,
            'center': [(x1_px + x2_px) // 2, (y1_px + y2_px) // 2],
            'width': box_w,
            'height': box_h
        })
        print(f"      -> ✅ Candidate (quality score: {quality_score:.3f})")

    if not candidates:
        print("    ❌ No qualified candidate boxes")
        return torch.empty(0, 4), torch.empty(0), []

    print(f"    📊 Candidate boxes after filtering: {len(candidates)}")

    # Step 2: Sort by quality score
    candidates.sort(key=lambda x: x['quality_score'], reverse=True)

    # Step 3: Stricter NMS, handle containment relationships and overlaps
    final_rois = []
    OVERLAP_THRESHOLD = 0.1  # Lower overlap threshold, stricter overlap avoidance
    MIN_QUALITY_THRESHOLD = 0.2  # Raise minimum quality requirement

    for candidate in candidates:
        # Quality gate check
        if candidate['quality_score'] < MIN_QUALITY_THRESHOLD:
            print(
                f"    Skip low quality box: {candidate['phrase']} quality score {candidate['quality_score']:.3f} < {MIN_QUALITY_THRESHOLD}")
            continue

        is_valid = True
        rois_to_remove = []

        # Check relationship with already selected boxes
        for j, existing in enumerate(final_rois):
            # Calculate containment relationship
            containment = calculate_containment_relationship(candidate['box'], existing['box'])

            if containment == 'box1_contains_box2':
                # Current box contains existing box, choose higher confidence
                if candidate['score'] > existing['score']:
                    print(
                        f"    🔄 Current box contains existing box, current confidence higher: {candidate['phrase']}({candidate['score']:.3f}) > {existing['phrase']}({existing['score']:.3f})")
                    rois_to_remove.append(j)
                else:
                    print(
                        f"    ❌ Current box contains existing box, but confidence lower: {candidate['phrase']}({candidate['score']:.3f}) < {existing['phrase']}({existing['score']:.3f})")
                    is_valid = False
                    break

            elif containment == 'box2_contains_box1':
                # Existing box contains current box, choose higher confidence
                if candidate['score'] > existing['score']:
                    print(
                        f"    🔄 Existing box contains current box, current confidence higher: {candidate['phrase']}({candidate['score']:.3f}) > {existing['phrase']}({existing['score']:.3f})")
                    rois_to_remove.append(j)
                else:
                    print(
                        f"    ❌ Existing box contains current box, but confidence lower: {candidate['phrase']}({candidate['score']:.3f}) < {existing['phrase']}({existing['score']:.3f})")
                    is_valid = False
                    break

            else:
                # No containment relationship, check overlap
                iou = calculate_iou_boxes(candidate['box'], existing['box'])

                if iou > OVERLAP_THRESHOLD:
                    # Has overlap, choose higher confidence
                    if candidate['score'] > existing['score']:
                        print(
                            f"    🔄 Overlapping boxes, current confidence higher: {candidate['phrase']}({candidate['score']:.3f}) > {existing['phrase']}({existing['score']:.3f}) IoU={iou:.3f}")
                        rois_to_remove.append(j)
                    else:
                        print(
                            f"    ❌ Overlapping boxes, confidence lower: {candidate['phrase']}({candidate['score']:.3f}) < {existing['phrase']}({existing['score']:.3f}) IoU={iou:.3f}")
                        is_valid = False
                        break

        if is_valid:
            # Remove replaced boxes
            for idx in sorted(rois_to_remove, reverse=True):
                removed_roi = final_rois.pop(idx)
                print(f"    🗑️ Removed: {removed_roi['phrase']}")

            final_rois.append(candidate)
            print(
                f"    ✅ Selected: {candidate['phrase']} (confidence: {candidate['score']:.3f}, quality score: {candidate['quality_score']:.3f})")

            if len(final_rois) >= max_rois:
                break

    print(f"    🎯 Final ROI count: {len(final_rois)}")

    # Step 4: Convert back to model format
    if final_rois:
        final_boxes = torch.tensor([roi['box_norm'] for roi in final_rois])
        final_scores = torch.tensor([roi['score'] for roi in final_rois])
        final_phrases = [roi['phrase'] for roi in final_rois]

        # Ensure correct dimensions
        if final_boxes.dim() > 2:
            final_boxes = final_boxes.squeeze(1)
        if final_boxes.dim() == 1 and len(final_rois) == 1:
            final_boxes = final_boxes.unsqueeze(0)

        if logits.dim() > 1 and final_scores.dim() == 1:
            final_scores = final_scores.unsqueeze(1)

        return final_boxes, final_scores, final_phrases
    else:
        return torch.empty(0, 4), torch.empty(0), []


def calculate_position_bonus(x1, y1, x2, y2, w, h, directions, phrase):
    """Calculate position bonus/penalty based on direction info - supports combination directions"""
    center_x = (x1 + x2) // 2
    center_y = (y1 + y2) // 2

    bonus = 0
    phrase_lower = phrase.lower()

    # Prioritize combination directions (higher accuracy, larger bonus)
    if 'right_upper' in directions:
        if center_x > w * 0.6 and center_y < h * 0.4:  # Right upper region
            bonus += 0.15  # Combination direction bonus higher
        elif center_x < w * 0.4 or center_y > h * 0.6:  # Clearly not right upper
            return -1

    if 'right_lower' in directions:
        if center_x > w * 0.6 and center_y > h * 0.6:  # Right lower region
            bonus += 0.15
        elif center_x < w * 0.4 or center_y < h * 0.4:  # Clearly not right lower
            return -1

    if 'left_upper' in directions:
        if center_x < w * 0.4 and center_y < h * 0.4:  # Left upper region
            bonus += 0.15
        elif center_x > w * 0.6 or center_y > h * 0.6:  # Clearly not left upper
            return -1

    if 'left_lower' in directions:
        if center_x < w * 0.4 and center_y > h * 0.6:  # Left lower region
            bonus += 0.15
        elif center_x > w * 0.6 or center_y < h * 0.4:  # Clearly not left lower
            return -1

    # If no combination directions, check individual directions
    combination_found = any(combo in directions for combo in ['right_upper', 'right_lower', 'left_upper', 'left_lower'])

    if not combination_found:
        # Check left/right directions
        if 'left' in directions:
            if center_x < w * 0.4:  # In image left side
                bonus += 0.1
            elif center_x > w * 0.6:  # In image right side but labeled as left side
                return -1  # Clearly wrong, direct filter

        if 'right' in directions:
            if center_x > w * 0.6:  # In image right side
                bonus += 0.1
            elif center_x < w * 0.4:  # In image left side but labeled as right side
                return -1  # Clearly wrong, direct filter

        # Check upper/lower directions
        if 'upper' in directions:
            if center_y < h * 0.4:  # In image upper part
                bonus += 0.1
            elif center_y > h * 0.6:  # In image lower part but labeled as upper part
                bonus -= 0.1

        if 'lower' in directions:
            if center_y > h * 0.6:  # In image lower part
                bonus += 0.1
            elif center_y < h * 0.4:  # In image upper part but labeled as lower part
                bonus -= 0.1

    # Check directional terms in phrases (including combination directions)
    if ('right upper' in phrase_lower or 'upper right' in phrase_lower or 'right superior' in phrase_lower):
        if not (center_x > w * 0.6 and center_y < h * 0.4):
            return -1

    if ('right lower' in phrase_lower or 'lower right' in phrase_lower or 'right inferior' in phrase_lower):
        if not (center_x > w * 0.6 and center_y > h * 0.6):
            return -1

    if ('left upper' in phrase_lower or 'upper left' in phrase_lower or 'left superior' in phrase_lower):
        if not (center_x < w * 0.4 and center_y < h * 0.4):
            return -1

    if ('left lower' in phrase_lower or 'lower left' in phrase_lower or 'left inferior' in phrase_lower):
        if not (center_x < w * 0.4 and center_y > h * 0.6):
            return -1

    # Original individual direction checks
    if 'left' in phrase_lower and center_x > w * 0.6:
        return -1
    if 'right' in phrase_lower and center_x < w * 0.4:
        return -1

    return bonus


def adaptive_roi_selection(boxes, logits, phrases, image_size=(256, 256), directions=None):
    """Adaptive ROI selection: dynamically adjust quantity based on detection quality, integrated direction filtering"""
    if len(boxes) == 0:
        return boxes, logits, phrases

    # First perform basic selection
    selected_boxes, selected_logits, selected_phrases = smart_roi_selection_with_direction(
        boxes, logits, phrases, image_size, directions, max_rois=5
    )

    if len(selected_boxes) == 0:
        return selected_boxes, selected_logits, selected_phrases

    # Analyze quality distribution, decide final quantity
    if isinstance(selected_logits, torch.Tensor):
        scores = selected_logits.max(dim=1)[0] if selected_logits.dim() > 1 else selected_logits
        scores_np = scores.cpu().numpy()
    else:
        scores_np = selected_logits

    # Dynamic adjustment strategy
    if len(scores_np) > 0:
        max_score = scores_np[0]  # Already sorted by quality

        # Decide retention quantity based on highest quality score (matching 0.1 confidence threshold)
        if max_score > 0.5:  # High quality detection (confidence usually >0.1)
            keep_count = min(3, len(scores_np))
        elif max_score > 0.35:  # Medium quality detection
            keep_count = min(2, len(scores_np))
        else:  # Low quality detection
            keep_count = 1

        # Quality gap filtering: If quality gap too large, only keep high quality ones
        if len(scores_np) > 1:
            quality_gap = scores_np[0] - scores_np[-1]
            if quality_gap > 0.2:  # Large quality gap
                # Find quality jump point
                for i in range(1, len(scores_np)):
                    if scores_np[0] - scores_np[i] > 0.15:
                        keep_count = min(keep_count, i)
                        break

        print(f"    🎯 Adaptive selection: keep highest quality {keep_count} ROIs")

        # Take highest quality ROIs
        final_boxes = selected_boxes[:keep_count]
        final_logits = selected_logits[:keep_count]
        final_phrases = selected_phrases[:keep_count]

        # Ensure correct dimensions
        if isinstance(final_boxes, torch.Tensor):
            if final_boxes.dim() == 3:
                final_boxes = final_boxes.squeeze(1)
            elif final_boxes.dim() == 1 and keep_count == 1:
                final_boxes = final_boxes.unsqueeze(0)

        if isinstance(final_logits, torch.Tensor):
            if final_logits.dim() == 2 and final_logits.shape[1] == 1:
                final_logits = final_logits.squeeze(1)
            elif final_logits.dim() == 0:
                final_logits = final_logits.unsqueeze(0)

        return final_boxes, final_logits, final_phrases

    return selected_boxes, selected_logits, selected_phrases


def detect_black_regions_and_get_max_roi(image_source, category):
    """
    Detect black regions and generate maximum ROI region excluding black areas
    Improved version: better handling of black backgrounds in medical images
    """
    import cv2
    import numpy as np

    # Convert to grayscale
    if len(image_source.shape) == 3:
        gray = cv2.cvtColor(image_source, cv2.COLOR_BGR2GRAY)
    else:
        gray = image_source

    h, w = gray.shape

    print(f"    🔍 Image size: {w}x{h}")

    # More precise black/extremely dark region detection
    # Use adaptive threshold based on image brightness distribution
    mean_brightness = np.mean(gray)
    std_brightness = np.std(gray)

    # Dynamic threshold: if image is overall darker, use lower threshold
    if mean_brightness < 50:
        threshold_value = max(15, int(mean_brightness * 0.3))
    else:
        threshold_value = max(25, int(mean_brightness * 0.2))

    print(f"    💡 Image mean brightness: {mean_brightness:.1f}, using threshold: {threshold_value}")

    # Detect non-black regions
    _, binary = cv2.threshold(gray, threshold_value, 255, cv2.THRESH_BINARY)

    # Morphological operations, remove noise and fill small holes
    kernel_size = max(3, min(7, min(w, h) // 50))  # Adjust kernel based on image size
    kernel = np.ones((kernel_size, kernel_size), np.uint8)

    # First closing operation to fill internal holes, then opening operation to remove noise
    binary = cv2.morphologyEx(binary, cv2.MORPH_CLOSE, kernel, iterations=2)
    binary = cv2.morphologyEx(binary, cv2.MORPH_OPEN, kernel, iterations=1)

    # Find contours
    contours, _ = cv2.findContours(binary, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)

    if not contours:
        print("    ⚠️ No valid contours detected, using conservative center region")
        return [0.2, 0.2, 0.8, 0.8]

    # Find largest contour (main anatomical structure)
    largest_contour = max(contours, key=cv2.contourArea)
    largest_area = cv2.contourArea(largest_contour)

    print(f"    📊 Largest contour area: {largest_area} ({largest_area / (w * h) * 100:.1f}%)")

    # If largest contour too small, may be detection error, use bounding box of all larger contours
    min_area_threshold = (w * h) * 0.1  # At least 10% of image area

    if largest_area < min_area_threshold:
        print("    🔍 Largest contour area too small, try merging multiple contours")

        # Select all contours with area larger than certain threshold
        valid_contours = [c for c in contours if cv2.contourArea(c) > min_area_threshold * 0.3]

        if valid_contours:
            # Merge bounding boxes of all valid contours
            all_points = np.vstack([c.reshape(-1, 2) for c in valid_contours])
            x, y, contour_w, contour_h = cv2.boundingRect(all_points)
        else:
            # If still no sufficiently large contours, use original largest contour
            x, y, contour_w, contour_h = cv2.boundingRect(largest_contour)
    else:
        # Use largest contour
        x, y, contour_w, contour_h = cv2.boundingRect(largest_contour)

    # Adjust margin strategy based on medical imaging category
    category_margin_factor = {
        'Chest': 0.05,  # Chest images usually have more black background
        'Abdominal': 0.06,  # Abdominal CT has black edges
        'Cranial': 0.04,  # Brain images relatively tight
        'Cardiac': 0.05,  # Heart images
        'Breast': 0.03,  # Breast images
        'Bone and Joint': 0.04,  # Bone and joint images
        'Dental': 0.02,  # Dental images usually tighter
        'Fundus': 0.02,  # Fundus images are circular, margins should be small
        'Pathology Slide': 0.03  # Pathology slides
    }

    margin_factor = category_margin_factor.get(category, 0.05)

    # Calculate margins
    margin_x = max(5, int(contour_w * margin_factor))
    margin_y = max(5, int(contour_h * margin_factor))

    # Ensure margins don't make box exceed image boundaries
    x1 = max(0, x - margin_x)
    y1 = max(0, y - margin_y)
    x2 = min(w, x + contour_w + margin_x)
    y2 = min(h, y + contour_h + margin_y)

    # Verify ROI reasonableness
    roi_w = x2 - x1
    roi_h = y2 - y1
    roi_area = roi_w * roi_h
    roi_area_ratio = roi_area / (w * h)

    print(f"    📦 Detected ROI: {roi_w}x{roi_h} (area ratio: {roi_area_ratio:.3f})")

    # If ROI area too small or too large, make adjustments
    if roi_area_ratio < 0.3:  # Area too small, may be detection error
        print("    🔧 ROI area too small, expanding range")
        center_x, center_y = x + contour_w // 2, y + contour_h // 2
        extend_w = max(contour_w, int(w * 0.4))
        extend_h = max(contour_h, int(h * 0.4))

        x1 = max(0, center_x - extend_w // 2)
        y1 = max(0, center_y - extend_h // 2)
        x2 = min(w, center_x + extend_w // 2)
        y2 = min(h, center_y + extend_h // 2)

    elif roi_area_ratio > 0.9:  # Area too large, may include too much background
        print("    🔧 ROI area too large, reducing range")
        shrink_factor = 0.85
        center_x, center_y = (x1 + x2) // 2, (y1 + y2) // 2
        new_w = int(roi_w * shrink_factor)
        new_h = int(roi_h * shrink_factor)

        x1 = center_x - new_w // 2
        y1 = center_y - new_h // 2
        x2 = center_x + new_w // 2
        y2 = center_y + new_h // 2

    # Convert to normalized coordinates
    x1_norm = max(0.0, min(1.0, x1 / w))
    y1_norm = max(0.0, min(1.0, y1 / h))
    x2_norm = max(0.0, min(1.0, x2 / w))
    y2_norm = max(0.0, min(1.0, y2 / h))

    print(f"    🔍 Final anatomical structure ROI: ({x1}, {y1}) -> ({x2}, {y2})")
    print(f"    🎯 Normalized coordinates: ({x1_norm:.3f}, {y1_norm:.3f}) -> ({x2_norm:.3f}, {y2_norm:.3f})")

    return [x1_norm, y1_norm, x2_norm, y2_norm]


def extract_abnormal_terms_from_report(caption):
    """Extract abnormal feature keywords from report"""
    caption_lower = caption.lower()

    # Common abnormal feature vocabulary
    abnormal_terms = [
        'lesion', 'mass', 'nodule', 'tumor', 'cyst', 'calcification',
        'enhancement', 'enlargement', 'thickening', 'irregular', 'hypodense',
        'hyperdense', 'infiltrate', 'consolidation', 'effusion', 'hemorrhage',
        'infarct', 'ischemia', 'stenosis', 'obstruction', 'fracture', 'dislocation',
        'inflammation', 'infection', 'abscess', 'necrosis', 'edema', 'fibrosis'
    ]

    found_terms = []
    for term in abnormal_terms:
        if term in caption_lower:
            found_terms.append(term)

    return found_terms[:2]  # Return maximum 2 keywords


def generate_intelligent_roi(model, image, category, positive_caption, vocab_manager,
                             box_threshold=0.08, text_threshold=0.04, directions=None):
    """
    Intelligent ROI generation: fixed version - normal reports directly generate anatomical structure ROI
    Optimized version: intelligent prompt generation based on real statistical data
    """
    print(f"    🚀 Starting intelligent ROI generation...")

    # Check if normal report
    is_normal = vocab_manager.is_normal_report(positive_caption)

    # ===== Fixed core logic =====
    if is_normal:
        print(f"    🏥 Normal report - directly generate maximum anatomical structure ROI")
        print(f"    ⭐️ Skip model detection, directly use anatomical structure region")
        # Normal reports directly generate maximum anatomical structure ROI without model detection
        return generate_anatomical_structure_roi(image, category, positive_caption, is_normal)

    # ===== Only abnormal reports undergo model detection =====
    print(f"    ⚠️ Abnormal report - using lesion feature detection")

    # 1. First try direct detection based on report content (abnormal reports only)
    all_detections = []

    # 1.1 Generate detection prompts (abnormal reports only)
    detection_prompts = vocab_manager.generate_detection_prompts(category, positive_caption)
    print(f"    🎯 Detection prompts: {detection_prompts}")

    # 1.2 Use generated prompts for detection
    for prompt_idx, text_prompt in enumerate(detection_prompts):
        print(f"    🔍 Trying prompt {prompt_idx + 1}: '{text_prompt}'")

        try:
            boxes, logits, phrases = predict(
                model=model,
                image=image,
                caption=text_prompt,
                box_threshold=box_threshold,
                text_threshold=text_threshold
            )

            if len(boxes) > 0:
                print(f"      ✅ Detected {len(boxes)} regions")
                for j in range(len(boxes)):
                    all_detections.append({
                        'box': boxes[j],
                        'logit': logits[j],
                        'phrase': f"{text_prompt}" if not phrases or j >= len(phrases) else phrases[j],
                        'prompt': text_prompt
                    })
            else:
                print(f"      ❌ No targets detected")

        except Exception as pred_error:
            print(f"      ⚠️ Detection error: {pred_error}")
            continue

    # 1.3 If detection results available, perform intelligent selection
    if all_detections:
        combined_boxes = torch.stack([det['box'] for det in all_detections])
        combined_logits = torch.stack([det['logit'] for det in all_detections])
        combined_phrases = [det['phrase'] for det in all_detections]

        print(f"    📊 Combined detection results: {len(combined_boxes)} candidate boxes")

        # Apply intelligent selection
        final_boxes, final_logits, final_phrases = adaptive_roi_selection(
            combined_boxes, combined_logits, combined_phrases,
            image_size=(image.shape[2], image.shape[1]), directions=directions
        )

        if len(final_boxes) > 0:
            return final_boxes, final_logits, final_phrases, is_normal

    # 2. If model detection fails, try broader prompts (abnormal reports only)
    print(f"    🔄 Initial detection failed, trying broader anatomical region detection...")
    fallback_prompts = vocab_manager.generate_fallback_prompts(category, is_normal)

    for prompt in fallback_prompts:
        print(f"    🔧 Fallback prompt: '{prompt}'")
        try:
            boxes, logits, phrases = predict(
                model=model, image=image, caption=prompt,
                box_threshold=max(0.1, box_threshold - 0.03),  # Lower threshold
                text_threshold=max(0.1, text_threshold - 0.02)
            )

            if len(boxes) > 0:
                print(f"      ✅ Fallback detection successful: {len(boxes)} regions")
                # Simple selection of highest confidence
                if isinstance(logits, torch.Tensor):
                    scores = logits.max(dim=1)[0] if logits.dim() > 1 else logits
                    best_idx = scores.argmax().item()
                    return boxes[best_idx:best_idx + 1], logits[best_idx:best_idx + 1], [
                        phrases[best_idx] if phrases else prompt], is_normal
        except Exception as e:
            print(f"      ❌ Fallback detection failed: {e}")
            continue

    # 3. Final fallback solution: use maximum anatomical structure region (only when abnormal report detection completely fails)
    print(
        f"    🏗️ Model detection completely failed, use maximum anatomical structure region as potential abnormal region...")
    return generate_anatomical_structure_roi(image, category, positive_caption, is_normal)


def generate_anatomical_structure_roi(image, category, caption, is_normal):
    """
    Maximum anatomical structure ROI generation based on image processing
    Applicable to: 1. Normal reports  2. Abnormal but unable to generate any ROI regions
    """
    print(f"    🏗️ Using maximum anatomical structure region detection...")

    # Convert to numpy format
    if isinstance(image, torch.Tensor):
        image_np = image.permute(1, 2, 0).cpu().numpy()
        image_np = (image_np * 255).astype(np.uint8)
    else:
        image_np = image

    # Detect maximum anatomical structure region (non-black background)
    max_roi_coords = detect_black_regions_and_get_max_roi(image_np, category)

    # Generate semantic annotation
    if is_normal:
        phrase = f"normal {category.lower()} anatomy"
        confidence = 0.75  # Normal reports have slightly higher confidence
        print(f"    ✅ Normal report: generate maximum anatomical structure ROI")
    else:
        # Extract abnormal keywords from report
        abnormal_terms = extract_abnormal_terms_from_report(caption)
        if abnormal_terms:
            phrase = f"region with potential {abnormal_terms[0]}"
        else:
            phrase = f"suspected abnormal region in {category.lower()}"
        confidence = 0.65  # Abnormal but detection failed, confidence slightly lower
        print(
            f"    ⚠️ Abnormal report (detection failed): generate maximum anatomical structure ROI as potential abnormal region")

    # Return standard format
    boxes = torch.tensor([max_roi_coords], dtype=torch.float32)
    scores = torch.tensor([confidence], dtype=torch.float32)
    phrases = [phrase]

    print(f"    🎯 Maximum anatomical structure ROI: {phrase} (confidence: {confidence:.2f})")

    return boxes, scores, phrases, is_normal


def visualize_results(image_source, boxes, logits, phrases, save_path, original_caption, category, is_normal=False):
    """Visualize results and save"""
    try:
        # Copy image
        annotated_frame = image_source.copy()
        h, w = annotated_frame.shape[:2]

        print(f"    🔍 Image size: {w}x{h}")

        if len(boxes) > 0:
            # Manually draw detection boxes
            if isinstance(boxes, torch.Tensor):
                boxes_np = boxes.cpu().numpy()
            else:
                boxes_np = np.array(boxes)

            # Ensure boxes_np is 2D array [N, 4]
            if boxes_np.ndim == 3:
                boxes_np = boxes_np.squeeze(1)  # Remove middle dimension
            elif boxes_np.ndim == 1:
                boxes_np = boxes_np.reshape(1, -1)  # Single box becomes [1, 4]

            print(f"    📦 Number of detection boxes: {len(boxes_np)}")
            print(f"    📊 boxes_np shape: {boxes_np.shape}")

            # Choose colors based on whether it's normal report
            if is_normal:
                colors = [(0, 255, 255), (255, 255, 0),
                          (255, 0, 255)]  # Normal reports use bright colors (yellow, cyan, magenta)
            else:
                colors = [(0, 255, 0), (255, 0, 0), (0, 0, 255), (255, 255, 0), (255, 0, 255), (0, 255, 255)]

            # Draw rectangle for each box
            for i, box in enumerate(boxes_np):
                print(f"    📦 Box{i + 1} original coordinates: {box}")
                print(
                    f"    📊 Box{i + 1} coordinate type: {type(box)}, shape: {box.shape if hasattr(box, 'shape') else 'no shape'}")

                # Ensure box is 1D array
                if box.ndim > 1:
                    box = box.flatten()

                if len(box) != 4:
                    print(f"    ❌ Box{i + 1} coordinate format error, skip")
                    continue

                # Handle coordinate format
                try:
                    # Check if normalized coordinates
                    if np.all((box >= 0) & (box <= 1.0)):
                        x1, y1, x2, y2 = box
                        x1_px = max(0, min(w - 1, int(x1 * w)))
                        y1_px = max(0, min(h - 1, int(y1 * h)))
                        x2_px = max(0, min(w - 1, int(x2 * w)))
                        y2_px = max(0, min(h - 1, int(y2 * h)))
                    else:
                        x1_px = max(0, min(w - 1, int(box[0])))
                        y1_px = max(0, min(h - 1, int(box[1])))
                        x2_px = max(0, min(w - 1, int(box[2])))
                        y2_px = max(0, min(h - 1, int(box[3])))
                except Exception as coord_error:
                    print(f"    ❌ Box{i + 1} coordinate conversion error: {coord_error}")
                    continue

                # Ensure correct coordinate order
                if x1_px > x2_px:
                    x1_px, x2_px = x2_px, x1_px
                if y1_px > y2_px:
                    y1_px, y2_px = y2_px, y1_px

                print(f"    🔍 Box{i + 1} pixel coordinates: ({x1_px}, {y1_px}) -> ({x2_px}, {y2_px})")

                # Check box validity
                box_width = x2_px - x1_px
                box_height = y2_px - y1_px

                if box_width < 5 or box_height < 5:
                    print(f"    ❌ Box{i + 1} too small, skip")
                    continue

                # Select color
                color = colors[i % len(colors)]
                thickness = 3 if is_normal else 2  # Normal report boxes slightly thicker

                # Draw rectangle box
                cv2.rectangle(annotated_frame, (x1_px, y1_px), (x2_px, y2_px), color, thickness)

                # Add corner markers
                cv2.circle(annotated_frame, (x1_px, y1_px), 4, color, -1)
                cv2.circle(annotated_frame, (x2_px, y2_px), 4, color, -1)

                # Add label
                if i < len(phrases) and phrases[i]:
                    label = phrases[i].replace('[SEP]', '').strip()
                    if not label:
                        label = f"roi_{i + 1}"
                else:
                    label = f"roi_{i + 1}"

                # Get confidence
                if isinstance(logits, torch.Tensor):
                    if logits.dim() > 1:
                        conf = logits[i].max().item() if i < len(logits) else 0.0
                    else:
                        conf = logits[i].item() if i < len(logits) else 0.0
                else:
                    conf = 0.0

                # Draw label
                label_text = f"{label}:{conf:.2f}"
                font = cv2.FONT_HERSHEY_SIMPLEX
                font_scale = 0.4
                label_thickness = 1

                # Calculate label position
                (text_width, text_height), _ = cv2.getTextSize(label_text, font, font_scale, label_thickness)

                # Label position strategy
                if y1_px > text_height + 8:
                    label_x = x1_px
                    label_y = y1_px - 3
                    bg_y1 = y1_px - text_height - 8
                    bg_y2 = y1_px - 3
                elif y2_px + text_height + 8 < h:
                    label_x = x1_px
                    label_y = y2_px + text_height + 3
                    bg_y1 = y2_px + 3
                    bg_y2 = y2_px + text_height + 8
                else:
                    label_x = x1_px + 3
                    label_y = y1_px + text_height + 3
                    bg_y1 = y1_px + 3
                    bg_y2 = y1_px + text_height + 8

                # Ensure label doesn't exceed image boundaries
                label_x = max(0, min(w - text_width, label_x))
                bg_x2 = min(w, label_x + text_width)

                # Draw label background
                cv2.rectangle(annotated_frame, (label_x, bg_y1), (bg_x2, bg_y2), color, -1)

                # Draw label text
                cv2.putText(annotated_frame, label_text, (label_x, label_y),
                            font, font_scale, (255, 255, 255), label_thickness)

        # Enlarge display
        display_scale = 1.5
        display_w = int(w * display_scale)
        display_h = int(h * display_scale)

        large_frame = cv2.resize(annotated_frame, (display_w, display_h), interpolation=cv2.INTER_NEAREST)

        # Add title
        text_height = 100
        canvas = np.ones((display_h + text_height, display_w, 3), dtype=np.uint8) * 255
        canvas[text_height:, :] = large_frame

        # Add title text
        font = cv2.FONT_HERSHEY_SIMPLEX
        font_scale = 0.45
        color = (0, 0, 0)
        thickness = 1

        # Display category and report type
        report_type = "Normal Report" if is_normal else "Abnormal Report"
        category_line = f"Category: {category} | Type: {report_type}"
        cv2.putText(canvas, category_line, (8, 18), font, font_scale, (0, 0, 200), thickness)

        # Truncate description text
        max_chars = 80
        display_caption = original_caption[:max_chars] + "..." if len(
            original_caption) > max_chars else original_caption

        # Intelligent line breaking
        if len(display_caption) > 40:
            mid = len(display_caption) // 2
            split_pos = display_caption.rfind(' ', mid - 15, mid + 15)
            if split_pos == -1:
                split_pos = mid
            line1 = display_caption[:split_pos]
            line2 = display_caption[split_pos:].strip()
            lines = [line1, line2]
        else:
            lines = [display_caption]

        for i, line in enumerate(lines[:2]):
            y_pos = 40 + i * 20
            cv2.putText(canvas, line, (8, y_pos), font, 0.4, color, thickness)

        # Add detection info
        if len(boxes) > 0:
            if is_normal:
                info_line = f"Max Anatomical ROI: Statistical data-driven detection for normal reports"
                info_color = (0, 150, 150)
            else:
                info_line = f"Smart Detection: Statistical vocabulary + anatomical structure fallback"
                info_color = (0, 100, 0)

            cv2.putText(canvas, info_line, (8, display_h + text_height - 25), font, 0.35, info_color, thickness)

            # Add algorithm info
            algo_line = "Optimized: Real statistical data + Enhanced vocab management"
            cv2.putText(canvas, algo_line, (8, display_h + text_height - 8), font, 0.3, (100, 100, 100), thickness)

        # Save results
        cv2.imwrite(save_path, canvas)
        print(f"    ✅ Visualization successfully saved: {save_path}")
        return canvas

    except Exception as e:
        print(f"    ❌ Visualization error: {e}")
        import traceback
        traceback.print_exc()
        # Save original image
        try:
            large_orig = cv2.resize(image_source, (int(image_source.shape[1] * 1.5), int(image_source.shape[0] * 1.5)))
            cv2.imwrite(save_path, large_orig)
        except:
            cv2.imwrite(save_path, image_source)
        return image_source


def test_grounding_dino_optimized():
    """Optimized main testing function - fixed normal report detection logic"""
    # Suppress warning messages
    import warnings
    warnings.filterwarnings("ignore", category=FutureWarning)
    warnings.filterwarnings("ignore", category=UserWarning)

    # Configuration parameters
    dataset_root = "/root/autodl-tmp/dataset"
    output_dir = "DINO_optimized_statistical_result"
    model_config = "groundingdino/config/GroundingDINO_SwinT_OGC.py"
    model_weights = "weights/groundingdino_swint_ogc.pth"

    # Set local BERT model path
    local_bert_path = "/root/autodl-tmp/pubmedbert-base-uncased-abstract-local"

    # Detection parameters - precise control matching optimized vocabulary database
    BOX_THRESHOLD = 0.08  # Threshold optimized based on statistical data
    TEXT_THRESHOLD = 0.04  # Raise text threshold
    MAX_BOXES = 6  # Reduce candidate quantity, improve quality
    SAMPLES_PER_FOLDER = 20

    # Create output directory
    os.makedirs(output_dir, exist_ok=True)

    print("🚀 Loading Grounding DINO model...")

    # Temporarily modify BERT model path
    import groundingdino.util.get_tokenlizer as tokenizer_utils
    original_get_model = tokenizer_utils.get_pretrained_language_model

    def custom_get_model(text_encoder_type):
        from transformers import BertModel
        print(f"🤖 Using local BERT model: {local_bert_path}")
        return BertModel.from_pretrained(local_bert_path)

    tokenizer_utils.get_pretrained_language_model = custom_get_model

    # Temporarily disable torch.load security check
    original_load = torch.load

    def safe_load(*args, **kwargs):
        if 'weights_only' in kwargs:
            del kwargs['weights_only']
        return original_load(*args, **kwargs)

    torch.load = safe_load

    try:
        model = load_model(model_config, model_weights)
        print("✅ Model loaded successfully!")
    except Exception as e:
        print(f"❌ Model loading failed: {e}")
        return
    finally:
        tokenizer_utils.get_pretrained_language_model = original_get_model
        torch.load = original_load

    # Initialize optimized vocabulary manager
    vocab_manager = OptimizedMedicalVocabularyManager()

    # Get all subfolders
    subfolders = [d for d in os.listdir(dataset_root)
                  if os.path.isdir(os.path.join(dataset_root, d)) and "Imaging" in d]

    print(f"🔍 Found {len(subfolders)} medical imaging folders")

    total_processed = 0
    total_detected = 0
    total_saved = 0
    normal_reports = 0
    abnormal_reports = 0
    model_detection_success = 0
    anatomical_roi_fallback = 0

    for folder in subfolders:
        folder_path = os.path.join(dataset_root, folder)
        jsonl_file = os.path.join(folder_path, f"{folder}_en.jsonl")
        images_dir = os.path.join(folder_path, "images")

        if not os.path.exists(jsonl_file) or not os.path.exists(images_dir):
            print(f"⚠️ Skip {folder}: missing required files")
            continue

        print(f"\n📂 Processing folder: {folder}")

        # Determine medical imaging category
        category = vocab_manager.get_category_from_folder(folder)
        print(f"  🏷️ Identified category: {category}")

        # Load data
        try:
            data = load_jsonl(jsonl_file)
            print(f"  📊 Loaded {len(data)} English data entries")
        except Exception as e:
            print(f"  ❌ Failed to load English data: {e}")
            continue

        # Select first 20 samples
        samples = data[:min(SAMPLES_PER_FOLDER, len(data))]

        folder_output_dir = os.path.join(output_dir, folder)
        os.makedirs(folder_output_dir, exist_ok=True)

        folder_detected = 0
        folder_saved = 0
        folder_normal = 0
        folder_abnormal = 0
        folder_model_success = 0
        folder_anatomical_fallback = 0

        for i, sample in enumerate(samples):
            try:
                image_name = sample['image']
                positive_caption = sample['report']

                # Build image path
                image_path = os.path.join(images_dir, image_name)
                if not os.path.exists(image_path):
                    print(f"❌ Image does not exist: {image_path}")
                    continue

                print(f"  🔬 Processing {i + 1}/{len(samples)}: {image_name}")
                print(f"    📄 Original description: {positive_caption[:100]}...")

                # Load image
                image_source, image = load_image(image_path)

                # ===== Fix: First check if normal report =====
                is_normal = vocab_manager.is_normal_report(positive_caption)

                if is_normal:
                    print(f"    ✅ Normal report identified - directly generate anatomical structure ROI")
                    folder_normal += 1

                    # Directly generate anatomical structure ROI without model detection
                    boxes, logits, phrases, _ = generate_anatomical_structure_roi(
                        image, category, positive_caption, is_normal
                    )

                    folder_detected += 1
                    folder_anatomical_fallback += 1  # Normal reports all use anatomical structure

                    print(f"    🏥 Normal report: generated maximum anatomical structure ROI")
                    if len(phrases) > 0:
                        conf = logits[0].item() if isinstance(logits, torch.Tensor) else logits[0]
                        print(f"      🎯 Anatomical ROI: {phrases[0]} (confidence: {conf:.3f})")

                else:
                    print(f"    ⚠️ Abnormal report identified - start model detection")
                    folder_abnormal += 1

                    # Extract direction information
                    directions = vocab_manager.extract_direction_info(positive_caption)
                    if directions:
                        print(f"    🧭 Direction info: {directions}")

                    # Use optimized intelligent ROI generation (abnormal reports only)
                    boxes, logits, phrases, _ = generate_intelligent_roi(
                        model=model,
                        image=image,
                        category=category,
                        positive_caption=positive_caption,
                        vocab_manager=vocab_manager,
                        box_threshold=BOX_THRESHOLD,
                        text_threshold=TEXT_THRESHOLD,
                        directions=directions
                    )

                    # Determine if maximum anatomical structure region fallback strategy was used
                    if len(phrases) > 0:
                        first_phrase = phrases[0].lower()
                        if ('region with potential' in first_phrase or
                                'suspected abnormal region' in first_phrase):
                            folder_anatomical_fallback += 1
                            print(
                                f"    🏗️ Abnormal report: fallback to maximum anatomical structure region (potential abnormal region)")
                        else:
                            folder_model_success += 1
                            print(f"    🎯 Abnormal report: model detection successful")

                    if len(boxes) > 0:
                        folder_detected += 1
                        print(f"    ⚠️ Abnormal report: detected {len(boxes)} lesion ROI regions")

                        for j, phrase in enumerate(phrases):
                            if isinstance(logits, torch.Tensor):
                                if logits.dim() == 1:
                                    conf = logits[j].item() if j < len(logits) else 0.0
                                else:
                                    conf = logits[j].max().item() if j < len(logits) else 0.0
                            else:
                                conf = logits[j] if j < len(logits) else 0.0
                            print(f"      🎯 Lesion ROI{j + 1}: {phrase} (confidence: {conf:.3f})")
                    else:
                        print("    ❌ Abnormal report generated no ROI regions")

                # Generate visualization results and save
                if len(boxes) > 0:
                    try:
                        output_filename = f"{folder}_{i + 1:03d}_{image_name}"
                        output_path = os.path.join(folder_output_dir, output_filename)

                        visualize_results(image_source, boxes, logits, phrases, output_path,
                                          positive_caption, category, is_normal)
                        print(f"    💾 Results saved: {output_filename}")
                        folder_saved += 1

                    except Exception as viz_error:
                        print(f"    ❌ Visualization failed: {viz_error}")
                else:
                    print("    ❌ No ROI regions generated, skip saving")

                total_processed += 1

            except Exception as e:
                print(f"    ❌ Processing failed: {e}")
                continue

        total_detected += folder_detected
        total_saved += folder_saved
        normal_reports += folder_normal
        abnormal_reports += folder_abnormal
        model_detection_success += folder_model_success
        anatomical_roi_fallback += folder_anatomical_fallback

        print(f"  📊 {folder} completed:")
        print(f"    Detection successful: {folder_detected}/{len(samples)}")
        print(f"    Save successful: {folder_saved}")
        print(f"    Normal reports: {folder_normal}, Abnormal reports: {folder_abnormal}")
        print(
            f"    Model detection successful: {folder_model_success}, Anatomical structure fallback: {folder_anatomical_fallback}")

    print(f"\n🎉 === Optimized Intelligent Normal/Abnormal Report Analysis Testing Complete ===")
    print(f"📊 Total processed samples: {total_processed}")
    print(f"✅ Successfully generated ROI: {total_detected}")
    print(f"💾 Actually saved samples: {total_saved}")
    print(f"🏥 Normal reports: {normal_reports} (directly generate anatomical structure ROI)")
    print(
        f"⚠️ Abnormal reports: {abnormal_reports} (intelligent lesion detection based on high-frequency vocabulary combinations)")
    print(f"🎯 Model detection successful: {model_detection_success}")
    print(f"🏗️ Maximum anatomical structure fallback: {anatomical_roi_fallback}")

    if total_processed > 0:
        print(f"📈 ROI generation success rate: {total_detected / total_processed * 100:.1f}%")
        print(f"💾 Save success rate: {total_saved / total_processed * 100:.1f}%")
        print(f"🎯 Model detection success rate: {model_detection_success / total_processed * 100:.1f}%")
        print(f"🏗️ Anatomical structure fallback rate: {anatomical_roi_fallback / total_processed * 100:.1f}%")
    else:
        print("📊 Various success rates: 0.0% (no samples processed)")

    print(f"\n🚀 === Core Optimizations ===")
    print(
        f"✅ Fixed normal report detection logic (normal reports directly generate anatomical ROI, no model detection)")
    print(
        f"✅ Integrated real statistical data vocabulary database (based on 1060 terms and 431 vocabulary combinations)")
    print(
        f"✅ Intelligent prompt generation based on high-frequency vocabulary combinations (such as hyperintense lesion and other high-frequency combinations)")
    print(f"✅ Improved normal/abnormal report judgment logic (sentence-level analysis)")
    print(f"✅ Unified maximum anatomical structure region fallback strategy")
    print(f"✅ Normal reports: direct anatomical structure ROI generation (no model detection overhead)")
    print(f"✅ Abnormal reports: lesion detection based on statistical frequency + potential abnormal region fallback")
    print(f"✅ Completely removed hard coding, intelligent region detection based on image processing")
    print(f"✅ Retained excellent quality control and direction filtering algorithms")
    print(f"🔍 Results saved in: {output_dir}")


def test_normal_report_detection():
    """Test normal report detection functionality fix effect"""
    print("🧪 === Testing Normal Report Detection Functionality ===")

    # Initialize vocabulary manager
    vocab_manager = OptimizedMedicalVocabularyManager()

    # Test cases
    test_cases = [
        {
            "report": "The axial CT scan shows no obvious masses or stones in the abdomen. The liver, gallbladder, pancreas, spleen, and kidneys appear unremarkable. The bowel loops demonstrate normal gas pattern and no signs of obstruction or significant distension. No free fluid or air is seen within the peritoneal cavity.",
            "expected": True,
            "description": "Normal report starting with capital No"
        },
        {
            "report": "The chest X-ray shows clear lung fields. no pneumothorax or pleural effusion is identified. The heart size is normal.",
            "expected": True,
            "description": "Normal report starting with lowercase no"
        },
        {
            "report": "There is a large mass in the liver measuring 5cm. The lesion shows enhancement on contrast study.",
            "expected": False,
            "description": "Clearly abnormal report"
        },
        {
            "report": "Normal study. No abnormalities detected.",
            "expected": True,
            "description": "Brief normal report"
        },
        {
            "report": "The patient shows signs of pneumonia with consolidation in the right lower lobe. No other abnormalities seen.",
            "expected": False,
            "description": "Mixed report (has abnormal and normal parts)"
        }
    ]

    print(f"📊 Total {len(test_cases)} test cases\n")

    passed = 0
    failed = 0

    for i, case in enumerate(test_cases):
        print(f"🔬 Test case {i + 1}: {case['description']}")
        print(f"   📄 Report: {case['report']}")

        result = vocab_manager.is_normal_report(case['report'])
        expected = case['expected']

        if result == expected:
            print(f"   ✅ Passed: expected={expected}, actual={result}")
            passed += 1
        else:
            print(f"   ❌ Failed: expected={expected}, actual={result}")
            failed += 1
        print()

    print(f"📈 Test results: {passed}/{len(test_cases)} passed")
    print(f"✅ Pass rate: {passed / len(test_cases) * 100:.1f}%")

    if failed == 0:
        print("🎉 All test cases passed! Fix successful!")
    else:
        print(f"⚠️ Still {failed} test cases failed, need further optimization")


if __name__ == "__main__":
    # Can run tests separately
    import sys

    if len(sys.argv) > 1 and sys.argv[1] == "test":
        test_normal_report_detection()
    else:
        test_grounding_dino_optimized()