from typing import List

import torch
import torch.nn as nn

from greatx.defense import GUARDDUAL as GUARDDUALLayer
from greatx.nn.layers import GCNConv, Sequential, activations
from greatx.utils import wrapper


class GUARDDUAL(nn.Module):
    r"""Graph Convolution Network (GCN) with dual-threshold :class:`greatx.defense.GUARDDUAL`

    A dual-threshold variant of GNNGUARD that uses conservative thresholds
    during training and balanced thresholds during testing for better
    robustness without sacrificing training stability.

    The network is a stack of ``guard -> GCNConv -> [BatchNorm1d] ->
    activation -> guard -> Dropout`` groups (one group per entry of
    :obj:`hids`), followed by a final :class:`GCNConv` output layer.
    Every guard layer recomputes ``(edge_index, edge_weight)`` from the
    current node features before the next convolution.

    Parameters
    ----------
    in_channels : int,
        the input dimensions of model
    out_channels : int,
        the output dimensions of model
    hids : List[int], optional
        the number of hidden units for each hidden layer,
        by default [16]
    acts : List[str], optional
        the activation function for each hidden layer,
        by default ['relu']
    dropout : float, optional
        the dropout ratio of model, by default 0.5
    bn: bool, optional
        whether to use :class:`BatchNorm1d` after the convolution layer,
        by default False
    normalize : bool, optional
        forwarded as ``normalize`` to every :class:`GCNConv` layer,
        by default True
    bias : bool, optional
        whether to use bias in the layers, by default True
    dataset_name : str, optional
        name of the dataset to load appropriate dual thresholds,
        by default 'cora'
    train_mask : torch.Tensor, optional
        forwarded to every guard layer at construction time,
        by default None. Can be (re)assigned later with
        :meth:`set_split_info`.
    val_mask : torch.Tensor, optional
        forwarded to every guard layer at construction time,
        by default None. Can be (re)assigned later with
        :meth:`set_split_info`.

    Examples
    --------
    >>> # GUARDDUAL with one hidden layer for Cora dataset
    >>> model = GUARDDUAL(100, 10, dataset_name='cora')

    >>> # GUARDDUAL with two hidden layers for CiteSeer dataset
    >>> model = GUARDDUAL(100, 10, hids=[32, 16], acts=['relu', 'elu'], dataset_name='citeseer')

    See also
    --------
    :class:`greatx.defense.GUARDDUAL`
    :class:`greatx.nn.models.supervised.GNNGUARD`
    :class:`greatx.nn.models.supervised.GCN`
    """
    # NOTE(review): the list defaults below are only read, never mutated, in
    # this constructor. They are kept as literals because how the `wrapper`
    # decorator treats `hids`/`acts` defaults is not visible from this file.
    @wrapper
    def __init__(self, in_channels: int, out_channels: int,
                 hids: List[int] = [16], acts: List[str] = ['relu'],
                 dropout: float = 0.5, bn: bool = False,
                 normalize: bool = True, bias: bool = True,
                 dataset_name: str = 'cora', train_mask: torch.Tensor = None,
                 val_mask: torch.Tensor = None):

        super().__init__()
        self.dataset_name = dataset_name
        self.train_mask = train_mask
        self.val_mask = val_mask

        def make_guard():
            # All guard layers share one configuration. They are built with
            # `add_self_loops=True`, which is why every GCNConv below is
            # built with `add_self_loops=False`.
            return GUARDDUALLayer(dataset_name=dataset_name,
                                  add_self_loops=True,
                                  train_mask=train_mask, val_mask=val_mask)

        # The stack always starts with a guard layer acting on the raw input.
        input_guard = make_guard()
        conv = [input_guard]

        # Plain-list handle on the guard layers so that split information and
        # the train/eval flag can be pushed to them directly. The same
        # objects also live inside `self.conv`.
        self.guard_layers = [input_guard]

        for hid, act in zip(hids, acts):
            conv.append(
                GCNConv(in_channels, hid, bias=bias, add_self_loops=False,
                        normalize=normalize))
            if bn:
                conv.append(nn.BatchNorm1d(hid))
            conv.append(activations.get(act))

            # Re-evaluate the graph on the hidden representation before it is
            # consumed by the next convolution.
            hidden_guard = make_guard()
            conv.append(hidden_guard)
            self.guard_layers.append(hidden_guard)

            conv.append(nn.Dropout(dropout))
            in_channels = hid

        # Output layer.
        conv.append(
            GCNConv(in_channels, out_channels, add_self_loops=False, bias=bias,
                    normalize=normalize))
        self.conv = Sequential(*conv)

    def set_split_info(self, train_mask: torch.Tensor, val_mask: torch.Tensor):
        """Store the split masks on the model and forward them to every
        guard layer.

        Parameters
        ----------
        train_mask : torch.Tensor
            passed to each guard layer's ``set_split_info``
        val_mask : torch.Tensor
            passed to each guard layer's ``set_split_info``
        """
        self.train_mask = train_mask
        self.val_mask = val_mask
        for guard_layer in self.guard_layers:
            guard_layer.set_split_info(train_mask, val_mask)

    def reset_parameters(self):
        """Reset the parameters of the underlying layer stack."""
        self.conv.reset_parameters()

    def train(self, mode: bool = True):
        """Set the module's training flag and mirror it onto every guard
        layer through ``set_training_mode``.

        :meth:`eval` is routed through this method as ``train(False)``, so
        this is the single place where guard layers are switched.

        Parameters
        ----------
        mode : bool, optional
            ``True`` for training mode, ``False`` for evaluation mode,
            by default True

        Returns
        -------
        GUARDDUAL
            ``self``
        """
        super().train(mode)
        for guard_layer in self.guard_layers:
            guard_layer.set_training_mode(mode)
        return self

    def eval(self):
        """Switch the model and all guard layers to evaluation mode.

        Returns
        -------
        GUARDDUAL
            ``self``
        """
        # `nn.Module.eval()` is `self.train(False)`, and `train` above already
        # updates every guard layer; delegating directly avoids notifying the
        # guard layers twice.
        return self.train(False)

    def forward(self, x, edge_index, edge_weight=None):
        """Run the layer stack on node features ``x`` and graph
        ``edge_index``.

        ``edge_weight`` is accepted for interface compatibility, but the
        first layer of the stack is always a guard layer whose output
        replaces both ``edge_index`` and ``edge_weight``; a caller-supplied
        ``edge_weight`` therefore never reaches a convolution.

        Returns
        -------
        The output of the final :class:`GCNConv` layer.
        """
        for layer in self.conv:
            if isinstance(layer, GUARDDUALLayer):
                # Guard layers do not transform `x`; they only produce the
                # graph used by the following convolution(s).
                edge_index, edge_weight = layer(x, edge_index)
            elif isinstance(layer, GCNConv):
                x = layer(x, edge_index, edge_weight)
            else:
                # BatchNorm1d / activation / Dropout act on features only.
                x = layer(x)
        return x

    def extra_repr(self) -> str:
        return f"dataset_name={self.dataset_name}"