import os
import shutil
import xml.etree.ElementTree as ET

# Paths
original_image_dir = '/path/to/imagenet/ILSVRC/Data/CLS-LOC/val'
annotations_dir = '/path/to/imagenet/ILSVRC/Annotations/CLS-LOC/val'
output_image_dir = '/path/to/imagenet/ILSVRC/Data/CLS-LOC/val'

# Ensure the output directory exists
if not os.path.exists(output_image_dir):
    os.makedirs(output_image_dir)

def parse_annotation(annotation_path):
    try:
        tree = ET.parse(annotation_path)
        root = tree.getroot()
        classes = set()
        # Find all <object> tags and extract the class names
        for obj in root.findall('object'):
            object_name = obj.find('name').text
            classes.add(object_name)
        return classes
    except Exception as e:
        print(f"Error parsing {annotation_path}: {e}")
        return set()

def organize_images():
    # List all XML files
    xml_files = [f for f in os.listdir(annotations_dir) if f.endswith('.xml')]
    
    for xml_file in xml_files:
        image_file = xml_file.replace('.xml', '.JPEG')
        annotation_path = os.path.join(annotations_dir, xml_file)
        image_path = os.path.join(original_image_dir, image_file)
        
        # Parse annotation to get all class names
        class_names = parse_annotation(annotation_path)
        if not class_names:
            print(f"Skipping image {image_file} due to missing class names.")
            continue
        
        # Move image to each class directory
        for class_name in class_names:
            class_dir = os.path.join(output_image_dir, class_name)
            if not os.path.exists(class_dir):
                os.makedirs(class_dir)
            
            # Check if the image exists before copying
            if os.path.exists(image_path):
                shutil.copy(image_path, os.path.join(class_dir, image_file))
            else:
                print(f"Image {image_file} does not exist, skipping.")

if __name__ == "__main__":
    organize_images()
