import torch
import torch.nn as nn


class NLinear(nn.Module):
    """
    Normalization-Linear.

    The last time step of each input window is subtracted from the window,
    a linear layer is applied along the time axis, and the subtracted value
    is added back to the result.
    """

    def __init__(self, configs, individual=False):
        """
        Args:
            configs: object exposing ``task_name``, ``seq_len``, ``enc_in``
                and, for forecasting tasks, ``pred_len``. For the
                'classification' task ``num_class`` is read as well (when
                present) to size the classification head.
            individual: if True, one linear layer is created per channel;
                otherwise a single layer is shared by all channels.
        """
        super().__init__()
        self.task_name = configs.task_name
        self.seq_len = configs.seq_len
        # These tasks produce an output as long as the input window.
        if self.task_name in ('classification', 'anomaly_detection', 'imputation'):
            self.pred_len = configs.seq_len
        else:
            self.pred_len = configs.pred_len

        self.channels = configs.enc_in
        self.individual = individual
        if self.individual:
            self.Linear = nn.ModuleList(
                [nn.Linear(self.seq_len, self.pred_len) for _ in range(self.channels)]
            )
        else:
            self.Linear = nn.Linear(self.seq_len, self.pred_len)
            # To visualize the weights, the shared layer can be initialised
            # with a uniform averaging kernel:
            # self.Linear.weight = nn.Parameter((1/self.seq_len)*torch.ones([self.pred_len,self.seq_len]))

        # classification() needs a head mapping the flattened encoder output
        # (pred_len * channels features, with pred_len == seq_len for this
        # task) to class scores. It is created after the temporal layers so
        # their random initialisation is unaffected, and only when configs
        # actually provides the number of classes.
        num_class = getattr(configs, 'num_class', None)
        if self.task_name == 'classification' and num_class is not None:
            self.projection = nn.Linear(self.channels * self.seq_len, num_class)

    def encoder(self, x):
        """
        Apply last-value normalisation followed by the temporal linear map.

        Args:
            x: tensor of shape [Batch, Input length, Channel].

        Returns:
            Tensor of shape [Batch, Output length, Channel].
        """
        # The subtracted last step is detached, so no gradient flows
        # through the normalisation offset.
        seq_last = x[:, -1:, :].detach()
        x = x - seq_last
        if self.individual:
            # Allocate directly on the input's device/dtype instead of
            # building the buffer on CPU and copying it over.
            output = x.new_zeros((x.size(0), self.pred_len, x.size(2)))
            for i, layer in enumerate(self.Linear):
                output[:, :, i] = layer(x[:, :, i])
            x = output
        else:
            # nn.Linear acts on the last axis: move time there and back.
            x = self.Linear(x.permute(0, 2, 1)).permute(0, 2, 1)
        return x + seq_last  # [Batch, Output length, Channel]

    def forecast(self, x_enc):
        """Return the encoder output for a forecasting task."""
        return self.encoder(x_enc)

    def imputation(self, x_enc):
        """Return the encoder output for the imputation task."""
        return self.encoder(x_enc)

    def anomaly_detection(self, x_enc):
        """Return the encoder output for the anomaly-detection task."""
        return self.encoder(x_enc)

    def classification(self, x_enc):
        """
        Flatten the encoder output and project it with ``self.projection``.

        Returns:
            Tensor of shape (batch_size, num_classes).
        """
        enc_out = self.encoder(x_enc)
        # (batch_size, seq_length * channels)
        output = enc_out.reshape(enc_out.shape[0], -1)
        # (batch_size, num_classes)
        return self.projection(output)

    def forward(self, x_enc, x_mark_enc, x_dec, x_mark_dec, mask=None):
        """
        Dispatch on ``self.task_name``.

        Only ``x_enc`` is used; the remaining arguments are accepted but
        ignored. Returns None when the task name is not recognised.
        """
        if self.task_name in ('long_term_forecast', 'short_term_forecast'):
            dec_out = self.forecast(x_enc)
            return dec_out[:, -self.pred_len:, :]  # [B, L, D]
        if self.task_name == 'imputation':
            return self.imputation(x_enc)  # [B, L, D]
        if self.task_name == 'anomaly_detection':
            return self.anomaly_detection(x_enc)  # [B, L, D]
        if self.task_name == 'classification':
            return self.classification(x_enc)  # [B, N]
        return None

    def compute_expert_l1_loss(self):
        """
        Sum, over the trainable parameters of ``self.Linear``, of each
        parameter tensor's mean absolute value (L1 norm / element count).
        """
        # Accumulate on the model's own device; picking 'cuda' whenever it
        # is available breaks CPU models and models on non-default GPUs.
        device = next(self.parameters()).device
        loss = torch.zeros((), device=device)
        for param in self.Linear.parameters():
            if param.requires_grad:
                # Out-of-place add keeps the autograd graph free of
                # in-place modifications.
                loss = loss + torch.norm(param, p=1) / param.numel()
        return loss

    def compute_expert_entropy(self):
        """
        Compute the entropy of the ``self.Linear`` parameters, treating the
        absolute values of each trainable parameter tensor as a probability
        distribution. The per-tensor entropies are summed.
        """
        entropy = torch.zeros((), device=next(self.parameters()).device)
        eps = 1e-10
        for param in self.Linear.parameters():
            if not param.requires_grad:
                continue
            # reshape (unlike view) also handles non-contiguous parameters.
            abs_weights = torch.abs(param.reshape(-1))
            weight_sum = torch.sum(abs_weights)
            if weight_sum < eps:
                continue  # skip zero-weight layers
            prob = abs_weights / (weight_sum + eps)
            # eps inside the log guards against log(0) for zero weights.
            entropy = entropy - torch.sum(prob * torch.log(prob + eps))
        return entropy
