import shutil
import random
from pathlib import Path

random.seed(42)


src_root = Path("./")
domains = ["Caltech101", "LabelMe", "SUN09", "VOC2007"]


train_root = src_root / "train"
test_root = src_root / "test"


for folder in [train_root, test_root]:
    if folder.exists():
        shutil.rmtree(folder)
    folder.mkdir(parents=True)


for domain in domains:
    category_to_images = {}
    domain_path = src_root / domain


    for class_dir in domain_path.iterdir():
        if not class_dir.is_dir():
            continue
        category = class_dir.name
        images = list(class_dir.glob("*.*"))
        images = [img for img in images if img.suffix.lower() in ['.jpg', '.jpeg', '.png']]


        if category not in category_to_images:
            category_to_images[category] = []
        category_to_images[category].extend(images)


    for category, image_list in category_to_images.items():
        random.shuffle(image_list)
        n_total = len(image_list)
        n_test = int(n_total * 0.25)
        test_images = image_list[:n_test]
        train_images = image_list[n_test:]


        domain_name = domain.split("/")[0]


        train_class_dir = train_root / domain_name / category
        test_class_dir = test_root / domain_name / category

        train_class_dir.mkdir(parents=True, exist_ok=True)
        test_class_dir.mkdir(parents=True, exist_ok=True)


        for img in train_images:
            shutil.copy(img, train_class_dir / img.name)
        for img in test_images:
            shutil.copy(img, test_class_dir / img.name)


print("down")
