import os
from src.dataset_processing.common.config.base_configs import BaseDatasetConfig
from src.dataset_processing.common.enums.dataset_types import DatasetType

def get_data_path(path):
    value = os.environ.get(path)
    if not value:
        raise ValueError(f"Required environment variable '{path}' is missing or empty in .env file")
    return value

data_path = get_data_path('DATA_PATH')

class BaseDatasetManager:
    """Base class for dataset managers implementing common functionality"""
    
    def __init__(self, cache_base_dir: str = data_path):
        self.cache_base_dir = cache_base_dir
        self._initialize_cache_dirs()
    
    def _initialize_cache_dirs(self):
        """Initialize cache directories for different dataset types"""
        for dataset_type in DatasetType:
            cache_dir = self._get_cache_dir(dataset_type)
            os.makedirs(cache_dir, exist_ok=True)
    
    def _get_cache_dir(self, dataset_type: DatasetType) -> str:
        """Get cache directory for specific dataset type"""
        return os.path.join(self.cache_base_dir, dataset_type.name.lower(), "processed")
    
    def _get_cache_path(self, config: BaseDatasetConfig) -> str:
        """Generate cache path for dataset configuration"""
        merged_suffix = "_merged" if config.is_merged else ""
        filename = (f"{config.dataset_name}_pert-{config.perturbation_type}_intensity-{config.perturbation_intensity}{merged_suffix}.csv")
        return os.path.join(self._get_cache_dir(config.dataset_type), filename)
