import os

import torch
import torch.utils.data
import torchvision.datasets as datasets

from torch.utils.data import Subset
import numpy as np


class SUN397:
    def __init__(
        self,
        preprocess,
        location: str = os.path.expanduser("~/data"),
        batch_size: int = 32,
        num_workers: int = 0,
    ):
        # Data loading code
        traindir = os.path.join(location, "sun397", "train")
        valdir = os.path.join(location, "sun397", "test")

        assert os.path.isdir(traindir), f"Train directory not found: {traindir}"
        self.train_dataset = datasets.ImageFolder(traindir, transform=preprocess)
        self.train_loader = torch.utils.data.DataLoader(
            self.train_dataset,
            shuffle=True,
            batch_size=batch_size,
            num_workers=num_workers,
        )

        self.test_dataset = datasets.ImageFolder(valdir, transform=preprocess)
        self.test_loader = torch.utils.data.DataLoader(self.test_dataset, batch_size=batch_size, num_workers=num_workers)
        self.test_loader_shuffle = torch.utils.data.DataLoader(self.test_dataset, shuffle=True, batch_size=batch_size, num_workers=num_workers)
        idx_to_class = dict((v, k) for k, v in self.train_dataset.class_to_idx.items())
        #print("idx_to_class:", idx_to_class)
        self.classnames = [idx_to_class[i][2:].replace("_", " ") for i in range(len(idx_to_class))]
        #print("sun397 classnames:", self.classnames)

        n_total = len(self.test_dataset)
        n_sample = n_total // 4 # 取四分之一
        indices = np.random.choice(n_total, n_sample, replace=False)  # 随机且不重复
        subset = Subset(self.test_dataset, indices)
        self.test_loader_subset = torch.utils.data.DataLoader(subset, batch_size=batch_size, num_workers=num_workers)
        self.test_loader_subset_shuffle = torch.utils.data.DataLoader(subset, shuffle=True, batch_size=batch_size, num_workers=num_workers)
