import torch.nn as nn

class LeNet(nn.Module):
    """
    LeNet convolutional neural network implementation.

    The network is two conv -> ReLU -> max-pool stages followed by an
    adaptive average pool to a fixed 5x5 grid and a three-layer
    fully-connected classifier (400 -> 120 -> 84 -> num_classes).

    Because of the adaptive pool, the classifier input size does not depend
    on the spatial size of the input image. For a 28x28 input the second
    stage already produces a 5x5 map.

    Args:
        num_classes (int): Number of output classes. Default is 10.
        in_channels (int): Number of input channels. Default is 1.
    """
    def __init__(self, num_classes: int = 10, in_channels: int = 1) -> None:
        super().__init__()
        self.num_classes = num_classes

        # NOTE: the ReLUs in the conv stages are deliberately NOT in-place.
        # forward() hands the raw convolution outputs back to the caller when
        # return_activations=True; an in-place ReLU would overwrite those
        # tensors and the caller would silently receive rectified values.
        self.conv1 = nn.Sequential(
            nn.Conv2d(in_channels, 6, kernel_size=5, padding=2),
            nn.ReLU(inplace=False),
            nn.MaxPool2d(kernel_size=2, stride=2)
        )

        self.conv2 = nn.Sequential(
            nn.Conv2d(6, 16, kernel_size=5),
            nn.ReLU(inplace=False),
            nn.MaxPool2d(kernel_size=2, stride=2)
        )

        # Force a 5x5 spatial grid so the flattened feature size is fixed.
        self.adaptive_pool = nn.AdaptiveAvgPool2d((5, 5))
        feature_size = 16 * 5 * 5

        # In-place ReLU is safe here: the intermediate Linear outputs are
        # never exposed outside this Sequential.
        self.fc = nn.Sequential(
            nn.Flatten(),
            nn.Linear(feature_size, 120),
            nn.ReLU(inplace=True),
            nn.Linear(120, 84),
            nn.ReLU(inplace=True),
            nn.Linear(84, num_classes)
        )

        self._initialize_weights()

    def forward(self, x, return_activations: bool = False):
        """
        Forward pass of the network.

        Args:
            x (torch.Tensor): Input tensor; the first convolution expects
                ``in_channels`` channels in dimension 1.
            return_activations (bool): Whether to return intermediate activations. Default is False.

        Returns:
            torch.Tensor or tuple: Output tensor, or tuple of (output, activation1, activation2) if return_activations is True.
            ``activation1`` and ``activation2`` are the outputs of the first
            and second convolution layers *before* ReLU and pooling.
        """
        # Run each stage layer by layer so the raw convolution output can be
        # captured before the non-linearity is applied.
        conv, relu, pool = self.conv1
        activation1 = conv(x)
        x = pool(relu(activation1))

        conv, relu, pool = self.conv2
        activation2 = conv(x)
        x = pool(relu(activation2))

        x = self.adaptive_pool(x)
        x = self.fc(x)

        if return_activations:
            return (x, activation1, activation2)
        return x

    def _initialize_weights(self) -> None:
        """Initialize network weights using appropriate initialization strategies.

        Conv2d weights use Kaiming-normal (fan_out, ReLU); Linear weights use
        a normal distribution with mean 0 and std 0.01. All biases present
        are set to zero.
        """
        for m in self.modules():
            if isinstance(m, nn.Conv2d):
                nn.init.kaiming_normal_(m.weight, mode='fan_out', nonlinearity='relu')
                if m.bias is not None:
                    nn.init.constant_(m.bias, 0)
            elif isinstance(m, nn.Linear):
                nn.init.normal_(m.weight, 0, 0.01)
                # Guard like the Conv2d branch so bias-free layers are tolerated.
                if m.bias is not None:
                    nn.init.constant_(m.bias, 0)
