"""GPU optimization module for Expected GradCAM.

This module provides optimized implementations for GPU acceleration:
- Batched path integration (IG, EG)
- Automatic Mixed Precision (AMP) management
- Memory estimation and management
- Multi-GPU support (DataParallel, DDP)

Optimizations achieve ~3-5x speedup over sequential implementations.
"""

from __future__ import annotations

from expected_gradcam.gpu.amp_context import (
    AMPContext,
    amp_autocast,
    get_amp_dtype,
    is_amp_available,
)
from expected_gradcam.gpu.batched_ops import (
    BatchedExpectedGradients,
    BatchedIntegratedGradients,
    FullyBatchedExpectedGradients,
    compute_optimal_weights_batched,
)
from expected_gradcam.gpu.memory import (
    MemoryEstimator,
    estimate_batch_size,
    get_available_memory,
    get_optimal_batch_size,
)
from expected_gradcam.gpu.multi_gpu import (
    MultiGPUWrapper,
    get_device_count,
    is_multi_gpu_available,
    setup_distributed,
)

__all__ = [
    # Batched operations
    "BatchedIntegratedGradients",
    "BatchedExpectedGradients",
    "FullyBatchedExpectedGradients",
    "compute_optimal_weights_batched",
    # AMP
    "AMPContext",
    "amp_autocast",
    "is_amp_available",
    "get_amp_dtype",
    # Memory
    "MemoryEstimator",
    "estimate_batch_size",
    "get_available_memory",
    "get_optimal_batch_size",
    # Multi-GPU
    "MultiGPUWrapper",
    "is_multi_gpu_available",
    "get_device_count",
    "setup_distributed",
]
