
import torch
import torch.nn as nn
from torch.nn.parameter import Parameter
import numpy as np
import torch.nn.functional as F
from torch_geometric.nn import GCNConv,GraphConv,GatedGraphConv,ResGatedGraphConv
from torch_geometric.nn import GINEConv
import torch
import torch.nn as nn
from torch.nn.utils.rnn import pad_sequence
import torch.nn.functional as F
from torchvision.ops import focal_loss
#from torch_geometric.transforms  import NormalizeFeatures
import networkx as nx
import matplotlib.pyplot as plt
#from torchmetrics.functional import auroc
from torchmetrics import AUROC,AveragePrecision
import dgl.nn as dglnn
import torch
import torch.nn as nn
from dgl.nn import GINConv as DW_GINConv
import torch.nn.functional as F
#from torch_geometric.nn import GINConv, global_add_pool,GCN2Conv,GATConv
from torch_geometric.data import Data
def positive_negtive_processing(matrix,type="0"):
   if type =="0":
       pos_counts = (matrix > 0).sum(dim=0)
       neg_counts = (matrix < 0).sum(dim=0)
       mask = neg_counts > pos_counts
       #print(mask)
       matrix[:, mask] = -matrix[:, mask]
   if type =="1":
       pos_sum = torch.where(matrix > 0, matrix, torch.tensor(0., dtype=matrix.dtype)).sum(dim=0)
       neg_sum = torch.where(matrix < 0, matrix, torch.tensor(0., dtype=matrix.dtype)).sum(dim=0)
       mask = (-neg_sum) > pos_sum
       #print(mask)
       #print(matrix[:, mask].shape)
       matrix[:, mask] = -matrix[:, mask]   
   if type=="2":
       pos_matrix = torch.where(matrix > 0, matrix, torch.tensor(0., dtype=matrix.dtype))
       pos_norm = torch.norm(pos_matrix, p=2, dim=0)
       neg_matrix = torch.where(matrix < 0, matrix, torch.tensor(0., dtype=matrix.dtype))
       neg_norm = torch.norm(neg_matrix, p=2, dim=0) 
       mask = neg_norm > pos_norm
       #print(mask)
       matrix[:, mask] = -matrix[:, mask]
   return matrix

class GIN(torch.nn.Module):
    def __init__(self, in_feats, hidden_feats, out_feats):
        super(GIN, self).__init__()

        # MLP for GINConv
        mlp1 = nn.Sequential(
            nn.Linear(in_feats, hidden_feats),
            nn.SELU(),
            nn.LayerNorm(hidden_feats),
            nn.Linear(hidden_feats, hidden_feats),
        )
        mlp2 = nn.Sequential(
            nn.Linear(hidden_feats, hidden_feats),
            nn.SELU(),
            nn.LayerNorm(hidden_feats),
            nn.Linear(hidden_feats, hidden_feats),
        )
        mlp3 = nn.Sequential(
            nn.Linear(hidden_feats, hidden_feats),
            nn.SELU(),
            nn.LayerNorm(hidden_feats),
            nn.Linear(hidden_feats, out_feats)
        )

        self.hidden_ln1 = nn.LayerNorm(hidden_feats)
        self.hidden_ln2 = nn.LayerNorm(hidden_feats)

        # Define GIN layers
        self.conv1 = GINEConv(mlp1)
        self.conv2 = GINEConv(mlp2)
        self.conv3 = GINEConv(mlp3)

    def forward(self, data):
        x, edge_index, edge_weight = data.x, data.edge_index, data.edge_attr

        x = F.silu(self.hidden_ln1(self.conv1(x, edge_index, edge_weight)))
        x = F.silu(self.hidden_ln2(self.conv2(x, edge_index, edge_weight))) + x  # skip connection
        x = self.conv3(x, edge_index, edge_weight)
        return x

class NLayerGIN(torch.nn.Module):
    def __init__(self, in_feats, hidden_feats, out_feats, n_layers=3,dp=0.2):
        super(NLayerGIN, self).__init__()

        self.n_layers = n_layers

        # MLP for GINConv
        mlp1 = nn.Sequential(
            nn.Linear(in_feats, hidden_feats),
            nn.SELU(),
            nn.BatchNorm1d(hidden_feats),
            #nn.LayerNorm(hidden_feats),
            nn.Linear(hidden_feats, hidden_feats),
        )
        self.conv1 = GINEConv(mlp1,edge_dim=1)
        self.hidden_ln1 = nn.LayerNorm(hidden_feats)

        self.hidden_gins = nn.ModuleList()
        self.hidden_lns = nn.ModuleList()
        for _ in range(n_layers-2):
            mlp_ = nn.Sequential(
                nn.Linear(hidden_feats, hidden_feats),
                nn.SELU(),
                nn.BatchNorm1d(hidden_feats),
                #nn.LayerNorm(hidden_feats),
                nn.Linear(hidden_feats, hidden_feats),
            )
            conv = GINEConv(mlp_,edge_dim=1)
            self.hidden_gins.append(conv)
            self.hidden_lns.append(nn.LayerNorm(hidden_feats))

        mlp_out = nn.Sequential(
            nn.Linear(hidden_feats, hidden_feats),
            nn.SELU(),
            nn.BatchNorm1d(hidden_feats),
            #nn.LayerNorm(hidden_feats),
            nn.Linear(hidden_feats, out_feats),
        )
        self.conv_out = GINEConv(mlp_out,edge_dim=1)

    def forward(self, x, edge_index, edge_weight):
        #x, edge_index, edge_weight = data.x, data.edge_index, data.edge_attr

        x = F.silu(self.hidden_ln1(self.conv1(x, edge_index, edge_weight)))
        for i in range(self.n_layers - 2):
            x = F.selu(self.hidden_lns[i](self.hidden_gins[i](x, edge_index, edge_weight)))+x
        x = self.conv_out(x, edge_index, edge_weight)
        return x


class GCN_layer(nn.Module):
    

    def __init__(self,inputs_shape,outputs_shape):
        super(GCN_layer, self).__init__()


        self.W=Parameter(torch.rand(inputs_shape,outputs_shape),requires_grad=True)
        self.bias = Parameter(torch.rand(outputs_shape),requires_grad=True)

    
    def forward(self,Adj_matrix,input_features):
        
        
        A=(Adj_matrix).type(torch.LongTensor)
        
        assert A.shape[0]==A.shape[1]
        I=torch.eye(A.shape[0])
        
        A_hat=A+I
        
        D=torch.sum(A_hat,axis=0)
        
        D=torch.diag(D)
        
        D_inv=torch.inverse(D)
                
        A_hat = torch.mm(torch.mm(D_inv,A_hat),D_inv)
        
        aggregate=torch.mm(A_hat,input_features)
        
        propagate=torch.mm(aggregate,self.W)+self.bias     
                
        
        return propagate

class GCN(nn.Module):
    

    def __init__(self,inputs_shape,outputs_shape,n_classes,activation='Relu'):
        super(GCN, self).__init__()

        self.layer1=GCN_layer(inputs_shape,outputs_shape)
        self.layer2=GCN_layer(outputs_shape,n_classes)
        
        
        if activation =='Tanh':
            self.activation = nn.Tanh()
        elif activation=='Sigmoid':
            self.activation = nn.Sigmoid()
        elif activation=='Softmax':
            self.activation=nn.Softmax()
        elif activation=='Relu':
            self.activation=nn.ReLU()
    
        self.softmax=nn.Softmax()
        
    
    def forward(self,Adj_matrix,input_features):
        
        x=self.layer1(Adj_matrix,input_features)
        x=self.activation(x) 
        x=self.layer2(Adj_matrix,x)  
        
        return x


class TransformerNodeEncoder(nn.Module):
    #@staticmethod
    def __init__(self, d_model,num_encoder_layers,nhead,dim_feedforward,transformer_dropout,transformer_activation):
        super(TransformerNodeEncoder,self).__init__()

        self.d_model = d_model
        self.num_layer = num_encoder_layers
        # Creating Transformer Encoder Model
        encoder_layer = nn.TransformerEncoderLayer(
            d_model, nhead, dim_feedforward, transformer_dropout, transformer_activation,batch_first=True
        )
        encoder_norm = nn.LayerNorm(d_model)
        self.transformer = nn.TransformerEncoder(encoder_layer, num_encoder_layers, encoder_norm)

    def forward(self,inputs,mask):
        if mask !=None:
         transformer_out = self.transformer(inputs,src_key_padding_mask=mask)  
        else:
         transformer_out = self.transformer(inputs)  
        return transformer_out

class GCNTS(nn.Module):
    

    def __init__(self,inputs_shape,outputs_shape,n_classes,activation='Relu'):
        super(GCNTS, self).__init__()

        self.layer1=GCN_layer(inputs_shape,outputs_shape)
        self.layer2=GCN_layer(outputs_shape,n_classes)
        
        
        if activation =='Tanh':
            self.activation = nn.Tanh()
        elif activation=='Sigmoid':
            self.activation = nn.Sigmoid()
        elif activation=='Softmax':
            self.activation=nn.Softmax()
        elif activation=='Relu':
            self.activation=nn.ReLU()
    
        self.softmax=nn.Softmax()
        
    
    def forward(self,Adj_matrix,input_features):
        
        x=self.layer1(Adj_matrix,input_features)
        x=self.activation(x) 
        x=self.layer2(Adj_matrix,x)
        x=self.softmax(x)     
        
        return x
    

class GCN_geo(nn.Module):
    def __init__(self, gcn_in_channels, gcn_hidden_channels, gcn_out_channels):
        super(GCN_geo, self).__init__()
        # 第一层 GCNConv
        self.conv1 = GCNConv(gcn_in_channels,gcn_hidden_channels,improved=True)#3,'mean')#,aggr="mean")
        self.layernorm1=nn.LayerNorm(gcn_hidden_channels)
        # 第二层 GCNConv
        self.conv2 = GCNConv(gcn_hidden_channels,gcn_hidden_channels,improved=True)#,3,'mean')#aggr="mean")
        self.layernorm2=nn.LayerNorm(gcn_hidden_channels)
        self.conv3=GCNConv(gcn_hidden_channels,gcn_out_channels,improved=True)#,3,'mean')#,aggr="mean")
        #self.layernorm3=nn.LayerNorm(gcn_hidden_channels)

    def forward(self,x,edge_index, edge_attr):
       x = F.selu(self.layernorm1((self.conv1(x, edge_index, edge_attr))))
       x = F.selu(self.layernorm2((self.conv2(x, edge_index, edge_attr))))
       x=self.conv3(x, edge_index, edge_attr)
       return x  # 返回节点的输出，通常用于节点分类或其他任务
    
class GAT(nn.Module):
    def __init__(self, gcn_in_channels, gcn_hidden_channels, gcn_out_channels):
        super(GAT, self).__init__()
        # 第一层 GCNConv
        self.conv1 = GATConv(gcn_in_channels,gcn_hidden_channels,1,edge_dim=1)#3,'mean')#,aggr="mean")
        self.layernorm1=nn.LayerNorm(gcn_hidden_channels)
        # 第二层 GCNConv
        self.conv2 = GATConv(gcn_hidden_channels,gcn_hidden_channels,1,edge_dim=1)#,3,'mean')#aggr="mean")
        self.layernorm2=nn.LayerNorm(gcn_hidden_channels)
        self.conv3=GATConv(gcn_hidden_channels,gcn_out_channels,1,edge_dim=1)#,3,'mean')#,aggr="mean")
        #self.layernorm3=nn.LayerNorm(gcn_hidden_channels)

    def forward(self,x,edge_index, edge_attr):
       x = F.selu(((self.conv1(x, edge_index, edge_attr))))
       #x = F.selu(self.layernorm2((self.conv2(x, edge_index, edge_attr))))
       x=self.conv3(x, edge_index, edge_attr)
       return x  # 返回节点的输出，通常用于节点分类或其他任务
    
class MLP(nn.Module):
    def __init__(self, input_dim, hidden_dim, output_dim, num_layers):
        super(MLP, self).__init__()
        
        # 定义一个列表来存储每一层的网络层
        layers = []
        
        # 输入层到第一层隐藏层
        layers.append(nn.Linear(input_dim, hidden_dim))
        layers.append(nn.LayerNorm(hidden_dim))
        #layers.append(nn.BatchNorm1d(hidden_dim)),
        layers.append(nn.ELU())
        #layers.append(nn.LayerNorm(hidden_dim))
        
        # 生成中间的隐藏层
        for i in range(num_layers - 1):
            #print(i)
            layers.append(nn.Linear(hidden_dim//(2**(i)), hidden_dim//(2**(i+1))))
            layers.append(nn.LayerNorm(hidden_dim//(2**(i+1))))
            #layers.append(nn.BatchNorm1d(hidden_dim//(2**(i+1))))
            layers.append(nn.ELU())
            #layers.append(nn.LayerNorm(hidden_dim//(2**(i+1))))
            #layers.append(nn.LayerNorm(hidden_dim))
        
        # 最后一层从隐藏层到输出层
        layers.append(nn.Linear(hidden_dim//(2**(num_layers-1)), output_dim))
        
        # 使用nn.Sequential按顺序执行每一层
        self.model = nn.Sequential(*layers)
    
    def forward(self, x):
        return self.model(x)


class MLP_ne(nn.Module):
    def __init__(self, input_dim, hidden_dim, output_dim, num_layers):
        super(MLP_ne, self).__init__()
        
        # 定义一个列表来存储每一层的网络层
        layers = []
        
        # 输入层到第一层隐藏层
        layers.append(nn.Linear(input_dim, hidden_dim))
        #layers.append(nn.LayerNorm(hidden_dim))
        #layers.append(nn.BatchNorm1d(hidden_dim)),
        layers.append(nn.SELU())
        #layers.append(nn.LayerNorm(hidden_dim))
        
        # 生成中间的隐藏层
        for i in range(num_layers - 1):
            #print(i)
            layers.append(nn.Linear(hidden_dim//(2**(i)), hidden_dim//(2**(i+1))))
            #layers.append(nn.LayerNorm(hidden_dim//(2**(i+1))))
            #layers.append(nn.BatchNorm1d(hidden_dim//(2**(i+1))))
            layers.append(nn.SELU())
            #layers.append(nn.LayerNorm(hidden_dim//(2**(i+1))))
            #layers.append(nn.LayerNorm(hidden_dim))
        
        # 最后一层从隐藏层到输出层
        layers.append(nn.Linear(hidden_dim//(2**(num_layers-1)), output_dim))
        
        # 使用nn.Sequential按顺序执行每一层
        self.model = nn.Sequential(*layers)
    
    def forward(self, x):
        return self.model(x)
    
class GNN(nn.Module):
    def __init__(self, gcn_in_channels, gcn_hidden_channels, gcn_out_channels,TF_num_encoder_layers,TF_nhead,TF_dim_feedforward,TF_transformer_dropout,TF_transformer_activation,lamda=0.1):
        super(GNN, self).__init__()
        # 第一层 GCNConv
        self.conv_set=[]
        self.lamda=lamda
        self.conv1 =GAT(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv2 =GAT(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv3= GAT(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        #self.conv4= GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        #self.conv5= GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv_set.append(self.conv1)
        self.conv_set.append(self.conv2)
        self.conv_set.append(self.conv3)
        self.MLP_classification=MLP(gcn_out_channels*3,256,1,3)
        self.MLP_graph_percent=MLP(gcn_out_channels*3,512,1,3)
        #self.conv_set.append(self.conv4)
        #self.conv_set.append(self.conv5)
        #print(self.conv_set[0])
        #self.TF=TransformerNodeEncoder(d_model=gcn_out_channels*3,num_encoder_layers=TF_num_encoder_layers,nhead=TF_nhead,dim_feedforward=TF_dim_feedforward,transformer_dropout=TF_transformer_dropout,transformer_activation=TF_transformer_activation)
        self.certrion=torch.nn.BCELoss(reduce='sum')
        #self.certrion=torch.nn.CrossEntropyLoss(reduction="sum")#weight=torch.tensor([1,10]).float()
        #self.certrion=focal_loss.sigmoid_focal_loss()


    def forward(self, datas):
      outputs=None
      i=0
      for data in [datas.x_1,datas.x_2,datas.x_3]:#,datas.x_4[0],datas.x_5[0]]:
        #data=data[0]
        #NormalizeFeatures(data)
        x, edge_index, edge_attr = data.x.to(torch.float), data.edge_index.to(torch.int64), data.edge_attr.to(torch.float)
        mus = torch.mean(x, dim=0)
        sds = torch.std(x, dim=0)
        #print(sds.shape)
        sds[sds == 0] = 1
        #x=positive_negtive_processing(x,"0")
        #x= (x-mus)/sds
        #print(data)
        #print(f'Weight max: {data.edge_attr.max()}, min: {data.edge_attr.min()} mean: {torch.mean(data.edge_attr)}')
        # 第一层图卷积 + ReLU 激
        #print(edge_index.shape)
        x=self.conv_set[i](x,edge_index,edge_attr)
        if outputs==None:
            outputs=x
        else:
            outputs=torch.concat([outputs,x],dim=1)
            #print(outputs.shape)
        #x = F.softmax(x, dim=1)
        i+=1
      return outputs  # 返回节点的输出，通常用于节点分类或其他任务
    def multi_forward(self,datas):
        loss=0
        roc=[]
        outputs=[]
        ys=[]
        for i in range (0,len(datas)):
            data=datas[i]
            #print(data)
            out=self.forward(data)
            #out=F.selu(out)
            #print(out.shape)
            outputs.append(out)
            y=data.x_1.y.float()
            ys.append(y)
            percent=y.sum()/len(y)*100
            #prercent_loss=(percent-y_hat)**2
            #print(y_hat.shape)
        #outputs=torch.cat(outputs)
        valid_outputs=torch.cat(outputs)
        outputs=self.MLP_classification(valid_outputs)
        valid_outputs=torch.sigmoid(outputs)
        ys=torch.concat(ys)
        #print(ys.shape)
        #print(valid_outputs.shape)
        loss=self.certrion(torch.squeeze(valid_outputs,dim=1),ys)
        #print(loss)
        #loss=focal_loss.sigmoid_focal_loss(torch.squeeze(valid_outputs,dim=1),ys,alpha=0.1,gamma=2,reduction='sum')
        #auroc = AUROC(task="binary")
        #roc=auroc(F.softmax(valid_outputs,dim=1),ys)
            #average_precision = AveragePrecision(task="binary")
        return loss,valid_outputs,ys

    
    def train_test(self,datas):
      outputs=None
      i=0
      for data in [datas.x_1[0],datas.x_2[0],datas.x_3[0]]:#,datas.x_4[0],datas.x_5[0]]:
        #data=data[0]
        #NormalizeFeatures(data)
        x, edge_index, edge_attr = data.x.to(torch.float), data.edge_index.to(torch.int64), data.edge_attr.to(torch.float)
        mus = torch.mean(x, dim=0)
        sds = torch.std(x, dim=0)
        #print(sds.shape)
        sds[sds == 0] = 1
        #x=positive_negtive_processing(x,"0")
        #x= (x-mus)/sds
        #print(data)
        #print(f'Weight max: {data.edge_attr.max()}, min: {data.edge_attr.min()} mean: {torch.mean(data.edge_attr)}')
        # 第一层图卷积 + ReLU 激
        x=self.conv_set[i](x,edge_index,edge_attr)
        if outputs==None:
            outputs=x
        else:
            outputs=torch.concat([outputs,x],dim=1)
            #print(outputs.shape)
        #x = F.softmax(x, dim=1)
        i+=1
      x=self.MLP_classification(outputs)
      #x=F.softmax(x,dim=1)
      x=F.sigmoid(x)
      #print(x.shape)
      return x #返回节点的输出，通常用于节点分类或其他任务
class GCN_TF(nn.Module):
    def __init__(self, gcn_in_channels, gcn_hidden_channels, gcn_out_channels,TF_num_encoder_layers,TF_nhead,TF_dim_feedforward,TF_transformer_dropout,TF_transformer_activation,lamda=0.1):
        super(GCN_TF, self).__init__()
        # 第一层 GCNConv
        self.conv_set=[]
        self.lamda=lamda
        self.conv1 =GAT(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv2 =GAT(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv3= GAT(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        #self.conv4= GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        #self.conv5= GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv_set.append(self.conv1)
        self.conv_set.append(self.conv2)
        self.conv_set.append(self.conv3)
        self.MLP_classification=MLP(gcn_out_channels*3,256,1,3)
        self.MLP_graph_percent=MLP(gcn_out_channels*3,512,1,3)
        #self.conv_set.append(self.conv4)
        #self.conv_set.append(self.conv5)
        #print(self.conv_set[0])
        self.TF=TransformerNodeEncoder(d_model=gcn_out_channels*3,num_encoder_layers=TF_num_encoder_layers,nhead=TF_nhead,dim_feedforward=TF_dim_feedforward,transformer_dropout=TF_transformer_dropout,transformer_activation=TF_transformer_activation)
        self.certrion=torch.nn.BCELoss(reduce='sum')
        #self.certrion=torch.nn.CrossEntropyLoss(reduction="sum")#weight=torch.tensor([1,10]).float()
        #self.certrion=focal_loss.sigmoid_focal_loss()


    def forward(self, datas):
      outputs=None
      i=0
      for data in [datas.x_1,datas.x_2,datas.x_3]:#,datas.x_4[0],datas.x_5[0]]:
        #data=data[0]
        #NormalizeFeatures(data)
        x, edge_index, edge_attr = data.x.to(torch.float), data.edge_index.to(torch.int64), data.edge_attr.to(torch.float)
        mus = torch.mean(x, dim=0)
        sds = torch.std(x, dim=0)
        #print(sds.shape)
        sds[sds == 0] = 1
        #x=positive_negtive_processing(x,"0")
        #x= (x-mus)/sds
        #print(data)
        #print(f'Weight max: {data.edge_attr.max()}, min: {data.edge_attr.min()} mean: {torch.mean(data.edge_attr)}')
        # 第一层图卷积 + ReLU 激
        #print(edge_index.shape)
        x=self.conv_set[i](x,edge_index,edge_attr)
        if outputs==None:
            outputs=x
        else:
            outputs=torch.concat([outputs,x],dim=1)
            #print(outputs.shape)
        #x = F.softmax(x, dim=1)
        i+=1
      #print(outputs.shape)
      #outputs=torch.unsqueeze(outputs,dim=0)
      #print(outputs.shape)
      #x=self.TF(outputs)
      #print(x.shape)
      #x=F.silu(outputs)
      #print(x.shape)
      #x=torch.squeeze(x,dim=0)
      #out=self.MLP_classification(x)
      #y_hat=self.MLP_graph_percent(torch.sum(x,dim=0))
      #out=F.sigmoid(out)
      return outputs  # 返回节点的输出，通常用于节点分类或其他任务
    def multi_forward(self,datas):
        loss=0
        roc=[]
        outputs=[]
        ys=[]
        for i in range (0,len(datas)):
            data=datas[i]
            #print(data)
            out=self.forward(data)
            #out=F.selu(out)
            #print(out.shape)
            outputs.append(out)
            y=data.x_1.y.float()
            ys.append(y)
            percent=y.sum()/len(y)*100
            #prercent_loss=(percent-y_hat)**2
            #print(y_hat.shape)
        #outputs=torch.cat(outputs)
        padded_outputs=pad_sequence(outputs,batch_first=True,padding_value=-1)
        attention_mask = torch.all(padded_outputs == -1, dim=-1)
        outputs = self.TF(padded_outputs, attention_mask)
        #outputs=self.TF(out,None)
        valid_outputs = outputs[~attention_mask]
        outputs=self.MLP_classification(valid_outputs)
        valid_outputs=torch.sigmoid(outputs)
        ys=torch.concat(ys)
        #print(ys.shape)
        #print(valid_outputs.shape)
        loss=self.certrion(torch.squeeze(valid_outputs,dim=1),ys)
        #print(loss)
        #loss=focal_loss.sigmoid_focal_loss(torch.squeeze(valid_outputs,dim=1),ys,alpha=0.1,gamma=2,reduction='sum')
        #auroc = AUROC(task="binary")
        #roc=auroc(F.softmax(valid_outputs,dim=1),ys)
            #average_precision = AveragePrecision(task="binary")
        return loss,valid_outputs,ys

    
    def train_test(self,datas):
      outputs=None
      i=0
      for data in [datas.x_1[0],datas.x_2[0],datas.x_3[0]]:#,datas.x_4[0],datas.x_5[0]]:
        #data=data[0]
        #NormalizeFeatures(data)
        x, edge_index, edge_attr = data.x.to(torch.float), data.edge_index.to(torch.int64), data.edge_attr.to(torch.float)
        mus = torch.mean(x, dim=0)
        sds = torch.std(x, dim=0)
        #print(sds.shape)
        sds[sds == 0] = 1
        X_min = x.min(dim=0, keepdim=True).values  # 计算最小值
        X_max = x.max(dim=0, keepdim=True).values  # 计算最大值
        x=(x-X_min)/(X_max-X_min)
        #x=positive_negtive_processing(x,"0")
        #x= (x-mus)/sds
        #print(data)
        #print(f'Weight max: {data.edge_attr.max()}, min: {data.edge_attr.min()} mean: {torch.mean(data.edge_attr)}')
        # 第一层图卷积 + ReLU 激
        x=self.conv_set[i](x,edge_index,edge_attr)
        if outputs==None:
            outputs=x
        else:
            outputs=torch.concat([outputs,x],dim=1)
            #print(outputs.shape)
        #x = F.softmax(x, dim=1)
        i+=1
      outputs=torch.unsqueeze(outputs,dim=0)
      #outputs=F.selu(outputs)
      x=self.TF(outputs,None)
      #x=F.silu(x)
      x=torch.squeeze(x,dim=0)
      x=self.MLP_classification(x)
      #x=F.softmax(x,dim=1)
      x=F.sigmoid(x)
      #print(x.shape)
      return x #返回节点的输出，通常用于节点分类或其他任务
    

class GCNpariTF(nn.Module):
    def __init__(self, gcn_in_channels, gcn_hidden_channels, gcn_out_channels,TF_num_encoder_layers,TF_nhead,TF_dim_feedforward,TF_transformer_dropout,TF_transformer_activation):
        super(GCNpariTF, self).__init__()
        # 第一层 GCNConv
        self.conv_set=[]
        self.conv1 = GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv2 = GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv3= GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        #self.conv4= GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        #self.conv5= GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv_set.append(self.conv1)
        self.conv_set.append(self.conv2)
        self.conv_set.append(self.conv3)
        #self.conv_set.append(self.conv4)
        #self.conv_set.append(self.conv5)
        #print(self.conv_set[0])
        self.TF1=TransformerNodeEncoder(d_model=gcn_in_channels,num_encoder_layers=TF_num_encoder_layers,nhead=TF_nhead,dim_feedforward=TF_dim_feedforward,transformer_dropout=TF_transformer_dropout,transformer_activation=TF_transformer_activation)
        self.TF2=TransformerNodeEncoder(d_model=gcn_in_channels,num_encoder_layers=TF_num_encoder_layers,nhead=TF_nhead,dim_feedforward=TF_dim_feedforward,transformer_dropout=TF_transformer_dropout,transformer_activation=TF_transformer_activation)
        self.TF3=TransformerNodeEncoder(d_model=gcn_in_channels,num_encoder_layers=TF_num_encoder_layers,nhead=TF_nhead,dim_feedforward=TF_dim_feedforward,transformer_dropout=TF_transformer_dropout,transformer_activation=TF_transformer_activation)
        self.TFset=[]
        self.TFset.append(self.TF1)
        self.TFset.append(self.TF2)
        self.TFset.append(self.TF3)
        self.last_layer1=nn.Linear((gcn_out_channels+gcn_in_channels)*3,512)
        self.last_layer2=nn.Linear(512,gcn_out_channels)
        self.last_layer3=nn.Linear(gcn_out_channels,gcn_out_channels//2)
        self.last_layer4=nn.Linear(gcn_out_channels//2,1)
        #self.certrion=torch.nn.CrossEntropyLoss()
        self.certrion=torch.nn.BCEWithLogitsLoss()

    def forward(self, datas):
      outputs=None
      i=0
      all_outputs=None
      for data in [datas.x_1,datas.x_2,datas.x_3]:#,datas.x_4[0],datas.x_5[0]]:
        #data=data[0]
        #NormalizeFeatures(data)
        x, edge_index, edge_attr = data.x, data.edge_index.to(torch.int64), data.edge_attr
        mus = torch.mean(x, dim=0)
        sds = torch.std(x, dim=0)
        #print(sds.shape)
        sds[sds == 0] = 1
        #x= (x-mus)/sds
        #print(data)
        #print(f'Weight max: {data.edge_attr.max()}, min: {data.edge_attr.min()} mean: {torch.mean(data.edge_attr)}')
        # 第一层图卷积 + ReLU 激
        gcn_outputs=self.conv_set[i](x,edge_index,edge_attr)
        #print(gcn_outputs.shape)
        tf_outputs=torch.squeeze(self.TFset[i](torch.squeeze(x,dim=0)),dim=0)
        #print(tf_outputs.shape)
        outputs=torch.concat([gcn_outputs,tf_outputs],dim=1)
        if all_outputs==None:
            all_outputs=outputs
        else:
            all_outputs=torch.concat([all_outputs,outputs],dim=1)
        i+=1
      #print(all_outputs.shape)
      #x=F.silu(all_outputs)
      x=F.elu(self.last_layer1(all_outputs))
      x=F.elu(self.last_layer2(x))
      x=F.elu(self.last_layer3(x))
      x=(self.last_layer4(x))
      x=torch.squeeze(x,dim=0)
        #x=F.sigmoid(x)
      return x,data.y # 返回节点的输出，通常用于节点分类或其他任务
    def multi_forward(self,datas):
        loss=0
        roc=[]
        all_roc=[]
        for i in range (0,len(datas)):
            data=datas[i]
            #print(data)
            out,y=self.forward(data)
            out=torch.squeeze((out),dim=1).to(float)
            #print(out.shape)
            #print(data.x_1.y.shape)
            loss+=self.certrion(out,data.x_1.y.to(float))
            auroc = AUROC(task="binary")
            all_roc.append(auroc(out,y))
            #average_precision = AveragePrecision(task="binary")a
        roc=sum(all_roc)/len(all_roc)
        #print(sum(all_roc)/len(all_roc))
        return loss,roc

    def test(self,datas):
      outputs=None
      i=0
      for data in [datas.x_1,datas.x_2,datas.x_3]:#,datas.x_4[0],datas.x_5[0]]:
        #data=data[0]
        #NormalizeFeatures(data)
        x, edge_index, edge_attr = data.x, data.edge_index, data.edge_attr
        mus = torch.mean(x, dim=0)
        sds = torch.std(x, dim=0)
        #print(sds.shape)
        sds[sds == 0] = 1
       # x= (x-mus)/sds
        #print(data)
        #print(f'Weight max: {data.edge_attr.max()}, min: {data.edge_attr.min()} mean: {torch.mean(data.edge_attr)}')
        # 第一层图卷积 + ReLU 激
        x=self.conv_set[i](x,edge_index,edge_attr)
        if outputs==None:
            outputs=x
        else:
            outputs=torch.concat([outputs,x],dim=1)
            #print(outputs.shape)
        #x = F.softmax(x, dim=1)
        i+=1
      print(outputs.shape)
      x=self.TF(outputs)
      x=F.silu(x)
      x=F.silu(self.last_layer1(x))
      x=F.silu(self.last_layer2(x))
      x=F.silu(self.last_layer3(x))
      x=(self.last_layer4(x))
        #x=F.sigmoid(x)
      return x  # 返回节点的输出，通常用于节点分类或其他任务
    
    def train_test(self,datas):
      outputs=None
      i=0
      all_outputs=None
      for data in [datas.x_1[0],datas.x_2[0],datas.x_3[0]]:#,datas.x_4[0],datas.x_5[0]]:
        #data=data[0]
        #NormalizeFeatures(data)
        x, edge_index, edge_attr = data.x, data.edge_index.to(torch.int64), data.edge_attr
        mus = torch.mean(x, dim=0)
        sds = torch.std(x, dim=0)
        #print(sds.shape)
        sds[sds == 0] = 1
        #x= (x-mus)/sds
        gcn_outputs=self.conv_set[i](x,edge_index,edge_attr)
        tf_outputs=torch.squeeze(self.TFset[i](torch.squeeze(x,dim=0)),dim=0)
        outputs=torch.concat([gcn_outputs,tf_outputs],dim=1)
        if all_outputs==None:
            all_outputs=outputs
        else:
            all_outputs=torch.concat([all_outputs,outputs],dim=1)
        i+=1
      #x=F.silu(all_outputs)
      x=F.elu(self.last_layer1(all_outputs))
      x=F.elu(self.last_layer2(x))
      x=F.elu(self.last_layer3(x))
      x=(self.last_layer4(x))
      x=torch.squeeze(x,dim=0)
      #x=F.softmax(x,dim=1)
      return x  # 返回节点的输出，通常用于节点分类或其他任务


class GCN_KDE(nn.Module):
    def __init__(self, gcn_in_channels, gcn_hidden_channels, gcn_out_channels,TF_num_encoder_layers,TF_nhead,TF_dim_feedforward,TF_transformer_dropout,TF_transformer_activation):
        super(GCN_KDE, self).__init__()
        # 第一层 GCNConv
        self.conv_set=[]
        self.conv1 = GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv2 = GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv3= GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        #self.conv4= GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        #self.conv5= GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv_set.append(self.conv1)
        self.conv_set.append(self.conv2)
        self.conv_set.append(self.conv3)
        #self.conv_set.append(self.conv4)
        #self.conv_set.append(self.conv5)
        #print(self.conv_set[0])
        self.TF=TransformerNodeEncoder(d_model=gcn_out_channels*3,num_encoder_layers=TF_num_encoder_layers,nhead=TF_nhead,dim_feedforward=TF_dim_feedforward,transformer_dropout=TF_transformer_dropout,transformer_activation=TF_transformer_activation)
        self.last_layer1=nn.Linear(gcn_out_channels*3,512)
        self.bn1=nn.LayerNorm(512)
        self.last_layer2=nn.Linear(512,gcn_out_channels)
        self.bn2=nn.LayerNorm(gcn_out_channels)
        self.last_layer3=nn.Linear(gcn_out_channels,gcn_out_channels//2)
        self.bn3=nn.LayerNorm(gcn_out_channels//2)
        self.last_layer4=nn.Linear(gcn_out_channels//2,1)
        #self.certrion=torch.nn.CrossEntropyLoss()
        self.certrion=torch.nn.BCELoss()

    def forward(self, datas):
      outputs=None
      i=0
      for data in [datas.x_1,datas.x_2,datas.x_3]:#,datas.x_4[0],datas.x_5[0]]:
        #data=data[0]
        #NormalizeFeatures(data)
        x, edge_index, edge_attr = data.x, data.edge_index.to(torch.int64), data.edge_attr
        mus = torch.mean(x, dim=0)
        sds = torch.std(x, dim=0)
        #print(sds.shape)
        sds[sds == 0] = 1
        #x= (x-mus)/sds
        #print(data)
        #print(f'Weight max: {data.edge_attr.max()}, min: {data.edge_attr.min()} mean: {torch.mean(data.edge_attr)}')
        # 第一层图卷积 + ReLU 激
        x=self.conv_set[i](x,edge_index,edge_attr)
        if outputs==None:
            outputs=x
        else:
            outputs=torch.concat([outputs,x],dim=1)
            #print(outputs.shape)
        #x = F.softmax(x, dim=1)
        i+=1
      x=outputs
      #print(outputs.shape)
      #outputs=torch.unsqueeze(outputs,dim=0)
      #print(outputs.shape)
      #x=self.TF(outputs)
      #print(x.shape)
      #x=F.silu(outputs)
      #print(x.shape)
      #x=torch.squeeze(x,dim=0)
      #x=F.silu(self.bn1(self.last_layer1(x)))
      #x=F.silu(self.bn2(self.last_layer2(x)))
      #x=F.silu(self.bn3(self.last_layer3(x)))
      #x=(self.last_layer4(x))
      #x=torch.squeeze(x,dim=0)
      #x=F.sigmoid(x)
      return x  # 返回节点的输出，通常用于节点分类或其他任务
    def multi_forward(self,datas):
        loss=0
        roc=[]
        for i in range (0,len(datas)):
            data=datas[i]
            labels=data.x_1.y
            #print(data)
            out=self.forward(data)
            dists=torch.cdist(out,out,p=2)
            ex=torch.exp(-dists**2/(torch.mean(dists)**2))
            densities=torch.sum(ex,dim=1)/len(labels)
            loss_0 = (labels == 0).float() * (-densities)
            loss_1 = (labels == 1).float() * densities
            #out=torch.squeeze((out),dim=1).to(float)
            #print(out.shape)
            loss+=loss_0.sum()/len(loss_0)+loss_1.sum()/len(loss_1)
            #print(data.x_1.y.shape)
            #auroc = AUROC(task="binary")
            #average_precision = AveragePrecision(task="binary")
        return loss,0

    
    def train_test(self,datas):
      outputs=None
      i=0
      for data in [datas.x_1[0],datas.x_2[0],datas.x_3[0]]:#,datas.x_4[0],datas.x_5[0]]:
        #data=data[0]
        #NormalizeFeatures(data)
        x, edge_index, edge_attr = data.x, data.edge_index.to(torch.int64), data.edge_attr
        mus = torch.mean(x, dim=0)
        sds = torch.std(x, dim=0)
        #print(sds.shape)
        sds[sds == 0] = 1
        #x= (x-mus)/sds
        #print(data)
        #print(f'Weight max: {data.edge_attr.max()}, min: {data.edge_attr.min()} mean: {torch.mean(data.edge_attr)}')
        # 第一层图卷积 + ReLU 激
        x=self.conv_set[i](x,edge_index,edge_attr)
        if outputs==None:
            outputs=x
        else:
            outputs=torch.concat([outputs,x],dim=1)
            #print(outputs.shape)
        #x = F.softmax(x, dim=1)
        i+=1
      #outputs=torch.unsqueeze(outputs,dim=0)
      x=outputs
      #x=self.TF(outputs)
      #x=F.silu(x)
      #x=torch.squeeze(x,dim=0)
      #x=F.silu(self.bn1(self.last_layer1(x)))
      #x=F.silu(self.bn2(self.last_layer2(x)))
      #x=F.silu(self.bn3(self.last_layer3(x)))
      #x=(self.last_layer4(x))
      #x=torch.squeeze(x,dim=0)
      #x=F.sigmoid(x)
      dists=torch.cdist(x,x,p=2)
      ex=torch.exp(-dists**2/(torch.mean(dists)**2))
      densities=torch.sum(ex,dim=1)
       #     labels=data.x_1.y
      return densities  # 返回节点的输出，通常用于节点分类或其他任务

class DW_GAT(nn.Module):
    def __init__(self, in_size, hid_size, out_size, heads=4, n_transformer=5):
        super().__init__()
        self.n_transformer = n_transformer
        self.gat_layers = nn.ModuleList()
        # two-layer GAT
        self.gat_layers.append(
            dglnn.GATConv(
                in_size,
                hid_size,
                heads,
                residual=True
                ,
                feat_drop=0.1,
                attn_drop=0.1,
                activation=F.elu,
            )
        )
        for i in range(n_transformer-2):
            self.gat_layers.append(
                dglnn.GATConv(
                    hid_size * heads,
                    hid_size,
                    heads,
                    residual=True,
                    feat_drop=0.1,
                    attn_drop=0.1,
                    activation=F.elu,
                )
            )
        self.gat_layers.append(
            dglnn.GATConv(
                hid_size * heads,
                out_size,
                heads,
                residual=True,
                feat_drop=0.1,
                attn_drop=0.1,
                activation=None,
            )
        )
    def forward(self, g, inputs):
        h = inputs
        for i, layer in enumerate(self.gat_layers):
            h = layer(g, h, edge_weight=g.edata['weight'])
            # h = layer(g, h, edge_weight=None)
            if i == self.n_transformer - 1:  # last layer
                h = h.mean(1)
            else:  # other layer(s)
                h = h.flatten(1)
        return h


class DW_NLayerGIN(nn.Module):
    def __init__(self, in_feats, hidden_feats, out_feats, n_layers=3):
        super(DW_NLayerGIN, self).__init__()

        self.n_layers = n_layers

        # MLP for GINConv
        mlp1 = nn.Sequential(
            nn.Linear(in_feats, hidden_feats),
            nn.ELU(),
            #nn.BatchNorm1d(hidden_feats),
            nn.Linear(hidden_feats, hidden_feats),
        )
        self.conv1 = DW_GINConv(mlp1, aggregator_type='sum',learn_eps=True)
        self.hidden_ln1 = nn.LayerNorm(hidden_feats)

        self.hidden_gins = nn.ModuleList()
        self.hidden_lns = nn.ModuleList()
        for i in range(n_layers-2):
            mlp_ = nn.Sequential(
                nn.Linear(hidden_feats, hidden_feats),
                nn.ELU(),
                #nn.BatchNorm1d(hidden_feats),
                nn.Linear(hidden_feats, hidden_feats),
                #
            )
            conv = DW_GINConv(mlp_, aggregator_type='sum',learn_eps=True)
            # self.hidden_gins.append(
            #     nn.Sequential(conv, nn.LayerNorm(hidden_feats))
            # )
            self.hidden_gins.append(conv)
            self.hidden_lns.append(nn.LayerNorm(hidden_feats))

        mlp_out = nn.Sequential(
            nn.Linear(hidden_feats, hidden_feats),
            nn.ELU(),
            #nn.BatchNorm1d(hidden_feats),
            nn.Linear(hidden_feats, out_feats)
        )
        self.conv_out = DW_GINConv(mlp_out, aggregator_type='sum',learn_eps=True)

        # self.hidden_ln_out = nn.LayerNorm(hidden_feats)

    def forward(self, g, features):
        x = (self.conv1(g, features, edge_weight=g.edata['weight']))
        outputs=x
        x=F.elu(self.hidden_ln1(x))
        # x = self.hidden_ln1(self.conv1(g, features, edge_weight=g.edata['weight']))
        for i in range(self.n_layers - 2):
            x = (self.hidden_gins[i](g, x, edge_weight=g.edata['weight'])) #+ x
            #outputs=torch.concat([outputs,x],dim=1)
            x=F.elu(self.hidden_lns[i](x))
            # x = self.hidden_lns[i](self.hidden_gins[i](g, x, edge_weight=g.edata['weight'])) #+ x
        x = self.conv_out(g, x, edge_weight=g.edata['weight'])
        #outputs=torch.concat([outputs,x],dim=1)
        #print(outputs.shape)
        #print(x.shape)
        # x = F.silu(self.hidden_ln2(self.conv3(g, x, edge_weight=g.edata['weight']))) + x
        # x = self.fc(x)
        return x

class DW_GCN(nn.Module):
    def __init__(self, in_feats, hidden_feats, out_feats, n_layers=3):
        super(DW_GCN, self).__init__()
        self.conv_set=[]
        self.n_layers = n_layers
        self.in_feats=in_feats
        self.hidden_feats=hidden_feats
        self.out_feats=out_feats
        self.GIN=DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,4,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)
        self.conv1 =DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,4,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv2 =DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,4,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv3= DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,4,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv4= DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,4,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv5= DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,4,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv_set.append(self.conv1)
        self.conv_set.append(self.conv2)
        self.conv_set.append(self.conv3)
        self.conv_set.append(self.conv4)
        self.conv_set.append(self.conv5)
        self.MLP_classification=MLP(out_feats*5,256,1,3)
        self.certrion=torch.nn.BCELoss(reduction='mean')
        #self.certrion=torch.nn.CrossEntropyLoss(reduction="sum")#weight=torch.tensor([1,10]).float()
        #self.certrion=focal_loss.sigmoid_focal_loss()
    def forward(self, datas):
      outputs=None
      i=0
      for data in [datas.x_1,datas.x_2,datas.x_3,datas.x_4,datas.x_5]:
        #data=data[0]
        #NormalizeFeatures(data)
        g=data
        features=g.ndata['emb']
        #x=positive_negtive_processing(x,"0")
        #x= (x-mus)/sds
        x=self.conv_set[i](g,features)
        #print(data)
        #print(f'Weight max: {data.edge_attr.max()}, min: {data.edge_attr.min()} mean: {torch.mean(data.edge_attr)}')
        # 第一层图卷积 + ReLU 激
        #print(edge_index.shape)
        if outputs==None:
            outputs=x
        else:
            outputs=torch.concat([outputs,x],dim=1)
            #print(outputs.shape)
        #x = F.softmax(x, dim=1)
        i+=1
      return outputs  # 返回节点的输出，通常用于节点分类或其他任务
    def multi_forward(self,datas):
        loss=0
        roc=[]
        outputs=[]
        ys=[]
        for i in range (0,len(datas)):
            data=datas[i]
            #print(data)
            out=self.forward(data)
            #out=F.selu(out)
            #print(out.shape)
            outputs.append(out)
            y=data.x_1.ndata['y'].float()
            ys.append(y)
            percent=y.sum()/len(y)*100
            #prercent_loss=(percent-y_hat)**2
            #print(y_hat.shape)
        #outputs=torch.cat(outputs)
        valid_outputs=torch.cat(outputs)
        outputs=self.MLP_classification(valid_outputs)
        valid_outputs=torch.sigmoid(outputs)
        ys=torch.concat(ys)
        loss=self.certrion(torch.squeeze(valid_outputs,dim=1),ys)
        return loss,valid_outputs,ys
    
    def train_test(self,datas):
      outputs=None
      i=0
      for data in [datas.x_1[0],datas.x_2[0],datas.x_3[0],datas.x_4[0],datas.x_5[0]]:
        #data=data[0]
        #NormalizeFeatures(data)
        g=data
        features=g.ndata['emb']
        #x=positive_negtive_processing(x,"0")
        #x= (x-mus)/sds
        x=self.conv_set[i](g,features)
        #mus = torch.mean(x, dim=0)
        #sds = torch.std(x, dim=0)
        #print(sds.shape)
        #sds[sds == 0] = 1
        #x=positive_negtive_processing(x,"0")
        #x= (x-mus)/sds
        #print(data)
        #print(f'Weight max: {data.edge_attr.max()}, min: {data.edge_attr.min()} mean: {torch.mean(data.edge_attr)}')
        # 第一层图卷积 + ReLU 激
        #x=self.conv_set[i](x,edge_index,edge_attr)
        if outputs==None:
            outputs=x
        else:
            outputs=torch.concat([outputs,x],dim=1)
            #print(outputs.shape)
        #x = F.softmax(x, dim=1)
        i+=1
      x=self.MLP_classification(outputs)
      #x=F.softmax(x,dim=1)
      x=F.sigmoid(x)
      #print(x.shape)
      return x #返回节点的输出，通常用于节点分类或其他任务
    

class DW_GCNTF(nn.Module):
    def __init__(self, in_feats, hidden_feats, out_feats, TF_num_encoder_layers=2,TF_nhead=4,TF_act='relu',TF_dim_feedforward=2048,n_layers=3,positive_processing=None,lamda=0.1):
        super(DW_GCNTF, self).__init__()
        self.conv_set=[]
        self.n_layers = n_layers
        self.in_feats=in_feats
        self.TF_num_encoder_layers=TF_num_encoder_layers
        self.TF_nhead=TF_nhead
        self.TF_dim_feedforward=TF_dim_feedforward
        self.TF_act=TF_act
        self.hidden_feats=hidden_feats
        self.out_feats=out_feats
        self.lamda=lamda
        self.positive_processing=positive_processing
        #.GIN=DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)
        self.conv1 =DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv2 =DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv3= DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv4= DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv5= DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv_set.append(self.conv1)
        self.conv_set.append(self.conv2)
        self.conv_set.append(self.conv3)
        self.conv_set.append(self.conv4)
        self.conv_set.append(self.conv5)
        self.TF=TransformerNodeEncoder(d_model=self.out_feats*5,num_encoder_layers=TF_num_encoder_layers,nhead=TF_nhead,dim_feedforward=TF_dim_feedforward,transformer_dropout=0.1,transformer_activation=TF_act)
        self.MLP_classification=MLP(self.out_feats*5,128,2,3)
        self.MLP_percent=MLP(self.out_feats*5,128,1,3)
        self.MLP_sign=MLP_ne(self.out_feats,self.out_feats,self.out_feats,2)
        #self.certrion=torch.nn.BCELoss(reduction='mean')
        self.certrion=torch.nn.CrossEntropyLoss(reduction="mean",label_smoothing=0.2)
        #self.certrion=focal_loss.sigmoid_focal_loss()
    def forward(self, datas):
      outputs=None
      i=0
      for data in [datas.x_1,datas.x_2,datas.x_3,datas.x_4,datas.x_5]:
        #data=data[0]
        #NormalizeFeatures(data)
        g=data
        x=g.ndata['emb']
        x=x[:,:self.in_feats]
        #print(x.shape)
        if self.positive_processing is not None:
          x=positive_negtive_processing(x,self.positive_processing)
        #x= (x-mus)/sds
        X_min = x.min(dim=0, keepdim=True).values  # 计算最小值
        X_max = x.max(dim=0, keepdim=True).values  # 计算最大值
        #x=(x-X_min)
        x=self.conv_set[i](g,x)
        #neg_x=self.conv_set[i](g,-x)
        #x=self.MLP_sign(pos_x+neg_x)
        #print(data)
        #print(f'Weight max: {data.edge_attr.max()}, min: {data.edge_attr.min()} mean: {torch.mean(data.edge_attr)}')
        # 第一层图卷积 + ReLU 激
        #print(edge_index.shape)
        if outputs==None:
            outputs=x
        else:
            outputs=torch.concat([outputs,x],dim=1)
            #print(outputs.shape)
        #x = F.softmax(x, dim=1)
        i+=1
      outputs=torch.unsqueeze(outputs,dim=0)
      #print(outputs.shape)
      outputs=self.TF(outputs,mask=None)
      outputs=torch.squeeze(outputs,dim=0)
      return outputs  # 返回节点的输出，通常用于节点分类或其他任务
    def multi_forward(self,datas):
        loss=0
        roc=[]
        outputs=[]
        ys=[]
        for i in range (0,len(datas)):
            data=datas[i]
            #print(data)
            out=self.forward(data)
            #out=F.selu(out)
            #print(out.shape)
            outputs.append(out)
            y=data.x_1.ndata['y'].long()
            ys.append(y)
            percent=y.sum()/len(y)*100
            #print(percent)
            #prercent_loss=(percent-y_hat)**2
            #print(y_hat.shape)
        #outputs=torch.cat(outputs)
        #valid_outputs=torch.cat(outputs)
        #padded_outputs=pad_sequence(outputs,batch_first=True,padding_value=-0.01)
        #attention_mask = torch.all(padded_outputs == -0.01, dim=-1)
        #outputs = self.TF(padded_outputs, attention_mask)
        #valid_outputs = outputs[~attention_mask]
        #graph_feature=torch.unsqueeze(torch.sum(valid_outputs,dim=0),dim=0)
        #print(valid_outputs.shape)
        outputs=torch.concat(outputs)
        outputs=self.MLP_classification(outputs)
        #y_hat=self.MLP_percent(graph_feature)
        y_hat=0
        #valid_outputs=F.sigmoid(outputs)
        ys=torch.concat(ys)
        #percent=torch.sum(ys)//len(ys)*100
        #print(percent)
        pred_percent=(y_hat-percent)**2
        #print(outputs.shape)
        #print(ys.shape)
        #loss=self.certrion(torch.squeeze(valid_outputs,dim=1),ys)#bce
        loss=self.certrion(outputs,ys)+pred_percent*self.lamda
        valid_outputs=F.softmax(outputs,dim=1)
        return loss,pred_percent,valid_outputs[:,1],ys
    
    def train_test(self,datas):
      outputs=None
      i=0
      for data in [datas.x_1[0],datas.x_2[0],datas.x_3[0],datas.x_4[0],datas.x_5[0]]:
        #data=data[0]
        #NormalizeFeatures(data)
        g=data
        x=g.ndata['emb']
        #print(x.shape[0])
        x=x[:,:self.in_feats]
        #print(x.shape)
        if self.positive_processing is not None:
          x=positive_negtive_processing(x,self.positive_processing)
        #features=positive_negtive_processing(features,"1")
        #x=positive_negtive_processing(x,"0")
        #x= (x-mus)/sds
        X_min = x.min(dim=0, keepdim=True).values  # 计算最小值
        X_max = x.max(dim=0, keepdim=True).values  # 计算最大值
        #x=(x-X_min)
        x=self.conv_set[i](g,x)
        #neg_x=self.conv_set[i](g,-x)
        #x=pos_x+neg_x
        #x=self.MLP_sign(pos_x+neg_x)
        #mus = torch.mean(x, dim=0)
        #sds = torch.std(x, dim=0)
        #print(sds.shape)
        #sds[sds == 0] = 1
        #x=positive_negtive_processing(x,"0")
        #x= (x-mus)/sds
        #print(data)
        #print(f'Weight max: {data.edge_attr.max()}, min: {data.edge_attr.min()} mean: {torch.mean(data.edge_attr)}')
        # 第一层图卷积 + ReLU 激
        #x=self.conv_set[i](x,edge_index,edge_attr)
        if outputs==None:
            outputs=x
        else:
            outputs=torch.concat([outputs,x],dim=1)
            #print(outputs.shape)
        #x = F.softmax(x, dim=1)
        i+=1
      outputs=torch.unsqueeze(outputs,dim=0)
      x=self.TF(outputs,None)
      x=torch.squeeze(x,dim=0)
      #print(x.shape)
      x=self.MLP_classification(x)
      x=torch.squeeze(x,dim=0)
      #print(x.shape)
      x=F.softmax(x,dim=1)
      #x=F.sigmoid(x)
      #x=torch.squeeze(x,dim=0)
      #print(x.shape)
      return x[:,1] #返回节点的输出，通常用于节点分类或其他任务
    


class TF_P_GIN(nn.Module):
    def __init__(self, in_feats, hidden_feats, out_feats, TF_num_encoder_layers=2,TF_nhead=4,TF_act='relu',TF_dim_feedforward=2048,n_layers=3,positive_processing=None,lamda=0.1):
        super(TF_P_GIN, self).__init__()
        self.conv_set=[]
        self.TF_set=[]
        self.n_layers = n_layers
        self.in_feats=in_feats
        self.TF_num_encoder_layers=TF_num_encoder_layers
        self.TF_nhead=TF_nhead
        self.TF_dim_feedforward=TF_dim_feedforward
        self.TF_act=TF_act
        self.hidden_feats=hidden_feats
        self.out_feats=out_feats
        self.lamda=lamda
        self.positive_processing=positive_processing
        #.GIN=DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)
        self.conv1 =DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv2 =DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv3= DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv4= DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv5= DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv_set.append(self.conv1)
        self.conv_set.append(self.conv2)
        self.conv_set.append(self.conv3)
        self.conv_set.append(self.conv4)
        self.conv_set.append(self.conv5)
        self.TF1=TransformerNodeEncoder(d_model=self.in_feats,num_encoder_layers=TF_num_encoder_layers,nhead=TF_nhead,dim_feedforward=TF_dim_feedforward,transformer_dropout=0.1,transformer_activation=TF_act)
        self.TF2=TransformerNodeEncoder(d_model=self.in_feats,num_encoder_layers=TF_num_encoder_layers,nhead=TF_nhead,dim_feedforward=TF_dim_feedforward,transformer_dropout=0.1,transformer_activation=TF_act)
        self.TF3=TransformerNodeEncoder(d_model=self.in_feats,num_encoder_layers=TF_num_encoder_layers,nhead=TF_nhead,dim_feedforward=TF_dim_feedforward,transformer_dropout=0.1,transformer_activation=TF_act)
        self.TF4=TransformerNodeEncoder(d_model=self.in_feats,num_encoder_layers=TF_num_encoder_layers,nhead=TF_nhead,dim_feedforward=TF_dim_feedforward,transformer_dropout=0.1,transformer_activation=TF_act)
        self.TF5=TransformerNodeEncoder(d_model=self.in_feats,num_encoder_layers=TF_num_encoder_layers,nhead=TF_nhead,dim_feedforward=TF_dim_feedforward,transformer_dropout=0.1,transformer_activation=TF_act)
        self.TF_set.append(self.TF1)
        self.TF_set.append(self.TF2)
        self.TF_set.append(self.TF3)
        self.TF_set.append(self.TF4)
        self.TF_set.append(self.TF5)
        self.MLP_classification=MLP((self.out_feats+self.in_feats)*5,128,2,3)#self.out_feats+
        self.MLP_percent=MLP((self.out_feats+self.in_feats)*5,8,1,2)
        self.MLP_sign=MLP_ne(self.out_feats,self.out_feats,self.out_feats,2)
        #self.certrion=torch.nn.BCELoss(reduction='mean')
        self.certrion=torch.nn.CrossEntropyLoss(reduction="mean",label_smoothing=0.2)
        #self.certrion=focal_loss.sigmoid_focal_loss()
    def forward(self, datas):
      outputs=None
      i=0
      for data in [datas.x_1,datas.x_2,datas.x_3,datas.x_4,datas.x_5]:
        #data=data[0]
        #NormalizeFeatures(data)
        g=data
        x=g.ndata['emb']
        x=x[:,:self.in_feats]
        #print(x.shape)
        if self.positive_processing is not None:
          x=positive_negtive_processing(x,self.positive_processing)
        #x= (x-mus)/sds
        X_min = x.min(dim=0, keepdim=True).values  # 计算最小值
        X_max = x.max(dim=0, keepdim=True).values  # 计算最大值
        #x=(x-X_min)
        gin_x=self.conv_set[i](g,x)
        tf_x=self.TF_set[i](torch.unsqueeze(x,dim=0),None)
        tf_x=torch.squeeze(x,dim=0)
        #x=tf_x
        #x=gin_x
        x=torch.concat([tf_x,gin_x],dim=1)
        #x=gin_x
        #print(x.shape)
        #neg_x=self.conv_set[i](g,-x)
        #x=self.MLP_sign(pos_x+neg_x)
        #print(data)
        #print(f'Weight max: {data.edge_attr.max()}, min: {data.edge_attr.min()} mean: {torch.mean(data.edge_attr)}')
        # 第一层图卷积 + ReLU 激
        #print(edge_index.shape)
        if outputs==None:
            outputs=x
        else:
            outputs=torch.concat([outputs,x],dim=1)
            #print(outputs.shape)
        #x = F.softmax(x, dim=1)
        i+=1
      return outputs  # 返回节点的输出，通常用于节点分类或其他任务
    def multi_forward(self,datas):
        loss=0
        roc=[]
        outputs=[]
        ys=[]
        for i in range (0,len(datas)):
            data=datas[i]
            #print(data)
            out=self.forward(data)
            #out=F.selu(out)
            #print(out.shape)
            outputs.append(out)
            y=data.x_1.ndata['y'].long()
            ys.append(y)
            percent=y.sum()/len(y)*100
            #print(percent)
            #prercent_loss=(percent-y_hat)**2
            #print(y_hat.shape)
        #outputs=torch.cat(outputs)
        #valid_outputs=torch.cat(outputs)
        #padded_outputs=pad_sequence(outputs,batch_first=True,padding_value=-0.01)
        #attention_mask = torch.all(padded_outputs == -0.01, dim=-1)
        #outputs = self.TF(padded_outputs, attention_mask)
        #valid_outputs = outputs[~attention_mask]
        #graph_feature=torch.unsqueeze(torch.sum(valid_outputs,dim=0),dim=0)
        #print(valid_outputs.shape)
        outputs=torch.concat(outputs)
        #print(outputs.shape)
        outputs=self.MLP_classification(outputs)
        #y_hat=self.MLP_percent(graph_feature)
        y_hat=0
        #valid_outputs=F.sigmoid(outputs)
        ys=torch.concat(ys)
        #percent=torch.sum(ys)//len(ys)*100
        #print(percent)
        pred_percent=(y_hat-percent)**2
        #print(outputs.shape)
        #print(ys.shape)
        #loss=self.certrion(torch.squeeze(valid_outputs,dim=1),ys)#bce
        loss=self.certrion(outputs,ys)+pred_percent*self.lamda
        valid_outputs=F.softmax(outputs,dim=1)
        return loss,pred_percent,valid_outputs[:,1],ys
    
    def train_test(self,datas):
      outputs=None
      i=0
      for data in [datas.x_1[0],datas.x_2[0],datas.x_3[0],datas.x_4[0],datas.x_5[0]]:
        #data=data[0]
        #NormalizeFeatures(data)
        g=data
        x=g.ndata['emb']
        #print(x.shape[0])
        x=x[:,:self.in_feats]
        #print(x.shape)
        if self.positive_processing is not None:
          x=positive_negtive_processing(x,self.positive_processing)
        #features=positive_negtive_processing(features,"1")
        #x=positive_negtive_processing(x,"0")
        #x= (x-mus)/sds
        X_min = x.min(dim=0, keepdim=True).values  # 计算最小值
        X_max = x.max(dim=0, keepdim=True).values  # 计算最大值
        #x=(x-X_min)
        gin_x=self.conv_set[i](g,x)
        tf_x=self.TF_set[i](torch.unsqueeze(x,dim=0),None)
        tf_x=torch.squeeze(x,dim=0)
        #x=tf_x
        #x=gin_x
        x=torch.concat([tf_x,gin_x],dim=1)
        #x=gin_x
        #neg_x=self.conv_set[i](g,-x)
        #x=pos_x+neg_x
        #x=self.MLP_sign(pos_x+neg_x)
        #mus = torch.mean(x, dim=0)
        #sds = torch.std(x, dim=0)
        #print(sds.shape)
        #sds[sds == 0] = 1
        #x=positive_negtive_processing(x,"0")
        #x= (x-mus)/sds
        #print(data)
        #print(f'Weight max: {data.edge_attr.max()}, min: {data.edge_attr.min()} mean: {torch.mean(data.edge_attr)}')
        # 第一层图卷积 + ReLU 激
        #x=self.conv_set[i](x,edge_index,edge_attr)
        if outputs==None:
            outputs=x
        else:
            outputs=torch.concat([outputs,x],dim=1)
            #print(outputs.shape)
        #x = F.softmax(x, dim=1)
        i+=1
      x=self.MLP_classification(outputs)
      x=torch.squeeze(x,dim=0)
      #print(x.shape)
      x=F.softmax(x,dim=1)
      #x=F.sigmoid(x)
      #x=torch.squeeze(x,dim=0)
      #print(x.shape)
      return x[:,1] #返回节点的输出，通常用于节点分类或其他任务


class TF_P_GIN_PP(nn.Module):
    def __init__(self, in_feats, hidden_feats, out_feats, TF_num_encoder_layers=2,TF_nhead=4,TF_act='relu',TF_dim_feedforward=2048,n_layers=3,positive_processing=None,lamda=0.1):
        super(TF_P_GIN_PP, self).__init__()
        self.conv_set=[]
        self.TF_set=[]
        self.n_layers = n_layers
        self.in_feats=in_feats
        self.TF_num_encoder_layers=TF_num_encoder_layers
        self.TF_nhead=TF_nhead
        self.TF_dim_feedforward=TF_dim_feedforward
        self.TF_act=TF_act
        self.hidden_feats=hidden_feats
        self.out_feats=out_feats
        self.lamda=lamda
        self.positive_processing=positive_processing
        #.GIN=DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)
        self.conv1 =DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv2 =DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv3= DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv4= DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv5= DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv_set.append(self.conv1)
        self.conv_set.append(self.conv2)
        self.conv_set.append(self.conv3)
        self.conv_set.append(self.conv4)
        self.conv_set.append(self.conv5)
        self.TF1=TransformerNodeEncoder(d_model=self.in_feats,num_encoder_layers=TF_num_encoder_layers,nhead=TF_nhead,dim_feedforward=TF_dim_feedforward,transformer_dropout=0.1,transformer_activation=TF_act)
        self.TF2=TransformerNodeEncoder(d_model=self.in_feats,num_encoder_layers=TF_num_encoder_layers,nhead=TF_nhead,dim_feedforward=TF_dim_feedforward,transformer_dropout=0.1,transformer_activation=TF_act)
        self.TF3=TransformerNodeEncoder(d_model=self.in_feats,num_encoder_layers=TF_num_encoder_layers,nhead=TF_nhead,dim_feedforward=TF_dim_feedforward,transformer_dropout=0.1,transformer_activation=TF_act)
        self.TF4=TransformerNodeEncoder(d_model=self.in_feats,num_encoder_layers=TF_num_encoder_layers,nhead=TF_nhead,dim_feedforward=TF_dim_feedforward,transformer_dropout=0.1,transformer_activation=TF_act)
        self.TF5=TransformerNodeEncoder(d_model=self.in_feats,num_encoder_layers=TF_num_encoder_layers,nhead=TF_nhead,dim_feedforward=TF_dim_feedforward,transformer_dropout=0.1,transformer_activation=TF_act)
        self.TF_set.append(self.TF1)
        self.TF_set.append(self.TF2)
        self.TF_set.append(self.TF3)
        self.TF_set.append(self.TF4)
        self.TF_set.append(self.TF5)
        self.MLP_classification=MLP((self.out_feats+self.in_feats)*5,128,2,3)#self.out_feats+
        self.MLP_percent=MLP((self.out_feats+self.in_feats)*5,128,1,3)
        self.MLP_sign=MLP_ne(self.out_feats,self.out_feats,self.out_feats,2)
        #self.certrion=torch.nn.BCELoss(reduction='mean')
        self.certrion=torch.nn.CrossEntropyLoss(reduction="mean",label_smoothing=0.2)
        #self.certrion=focal_loss.sigmoid_focal_loss()
    def forward(self, datas):
      outputs=None
      i=0
      for data in [datas.x_1,datas.x_2,datas.x_3,datas.x_4,datas.x_5]:
        #data=data[0]
        #NormalizeFeatures(data)
        g=data
        x=g.ndata['emb']
        x=x[:,:self.in_feats]
        #print(x.shape)
        if self.positive_processing is not None:
          x=positive_negtive_processing(x,self.positive_processing)
        #x= (x-mus)/sds
        X_min = x.min(dim=0, keepdim=True).values  # 计算最小值
        X_max = x.max(dim=0, keepdim=True).values  # 计算最大值
        #x=(x-X_min)
        gin_x=self.conv_set[i](g,x)
        #tf_x=self.TF_set[i](torch.unsqueeze(x,dim=0),None)
        #print(tf_x.shape)
        tf_x=torch.squeeze(x,dim=0)
        #x=tf_x
        #x=gin_x
        x=torch.concat([tf_x,gin_x],dim=1)
        #print(x.shape)
        #neg_x=self.conv_set[i](g,-x)
        #x=self.MLP_sign(pos_x+neg_x)
        #print(data)
        #print(f'Weight max: {data.edge_attr.max()}, min: {data.edge_attr.min()} mean: {torch.mean(data.edge_attr)}')
        # 第一层图卷积 + ReLU 激
        #print(edge_index.shape)
        if outputs==None:
            outputs=x
        else:
            outputs=torch.concat([outputs,x],dim=1)
            #print(outputs.shape)
        #x = F.softmax(x, dim=1)
        i+=1
      return outputs  # 返回节点的输出，通常用于节点分类或其他任务
    def multi_forward(self,datas):
        loss=0
        roc=[]
        outputs=[]
        ys=[]
        for i in range (0,len(datas)):
            data=datas[i]
            #print(data)
            out=self.forward(data)
            #out=F.selu(out)
            #print(out.shape)
            outputs.append(out)
            y=data.x_1.ndata['y'].long()
            ys.append(y)
            percent=y.sum()/len(y)*100
            #print(percent)
            #prercent_loss=(percent-y_hat)**2
            #print(y_hat.shape)
        #outputs=torch.cat(outputs)
        #valid_outputs=torch.cat(outputs)
        #padded_outputs=pad_sequence(outputs,batch_first=True,padding_value=-0.01)
        #attention_mask = torch.all(padded_outputs == -0.01, dim=-1)
        #outputs = self.TF(padded_outputs, attention_mask)
        #valid_outputs = outputs[~attention_mask]
        #graph_feature=torch.unsqueeze(torch.sum(valid_outputs,dim=0),dim=0)
        #print(valid_outputs.shape)
        outputs=torch.concat(outputs)
        #print(outputs.shape)
        #print(outputs.shape)
        #outputs=self.MLP_classification(torch.mean(outputs,dim=1))
        y_hat=self.MLP_percent(torch.mean(outputs,dim=0))
        #valid_outputs=F.sigmoid(outputs)
        ys=torch.concat(ys)
        percent=torch.sum(ys)//len(ys)*100
        #print(percent)
        pred_percent=(y_hat-percent)**2
        #print(outputs.shape)
        #print(ys.shape)
        #loss=self.certrion(torch.squeeze(valid_outputs,dim=1),ys)#bce
        loss=pred_percent
        valid_outputs=F.softmax(outputs,dim=1)
        return loss,pred_percent
    
    def train_test(self,datas):
      outputs=None
      i=0
      for data in [datas.x_1[0],datas.x_2[0],datas.x_3[0],datas.x_4[0],datas.x_5[0]]:
        #data=data[0]
        #NormalizeFeatures(data)
        g=data
        x=g.ndata['emb']
        #print(x.shape[0])
        x=x[:,:self.in_feats]
        #print(x.shape)
        if self.positive_processing is not None:
          x=positive_negtive_processing(x,self.positive_processing)
        #features=positive_negtive_processing(features,"1")
        #x=positive_negtive_processing(x,"0")
        #x= (x-mus)/sds
        X_min = x.min(dim=0, keepdim=True).values  # 计算最小值
        X_max = x.max(dim=0, keepdim=True).values  # 计算最大值
        #x=(x-X_min)
        gin_x=self.conv_set[i](g,x)
        tf_x=self.TF_set[i](torch.unsqueeze(x,dim=0),None)
        tf_x=torch.squeeze(x,dim=0)
        #x=tf_x
        #x=gin_x
        x=torch.concat([tf_x,gin_x],dim=1)
        #neg_x=self.conv_set[i](g,-x)
        #x=pos_x+neg_x
        #x=self.MLP_sign(pos_x+neg_x)
        #mus = torch.mean(x, dim=0)
        #sds = torch.std(x, dim=0)
        #print(sds.shape)
        #sds[sds == 0] = 1
        #x=positive_negtive_processing(x,"0")
        #x= (x-mus)/sds
        #print(data)
        #print(f'Weight max: {data.edge_attr.max()}, min: {data.edge_attr.min()} mean: {torch.mean(data.edge_attr)}')
        # 第一层图卷积 + ReLU 激
        #x=self.conv_set[i](x,edge_index,edge_attr)
        if outputs==None:
            outputs=x
        else:
            outputs=torch.concat([outputs,x],dim=1)
            #print(outputs.shape)
        #x = F.softmax(x, dim=1)
        i+=1
      #x=torch.squeeze(x,dim=0)
      #print(x.shape)
      #x=F.softmax(x,dim=1)
      #x=F.sigmoid(x)
      #x=torch.squeeze(x,dim=0)
      #print(x.shape)
      #print("OUTPUT SHAPE:"+str(x.shape))
      mean_output=torch.mean(outputs,dim=0)
      x=self.MLP_percent(mean_output)
      return x #返回节点的输出，通常用于节点分类或其他任务
    


class G_MLP(nn.Module):
    def __init__(self, in_feats, hidden_feats, out_feats, TF_num_encoder_layers=2,TF_nhead=4,TF_act='relu',TF_dim_feedforward=2048,n_layers=3,positive_processing=None,lamda=0.1):
        super(G_MLP, self).__init__()
        self.conv_set=[]
        self.TF_set=[]
        self.n_layers = n_layers
        self.in_feats=in_feats
        self.TF_num_encoder_layers=TF_num_encoder_layers
        self.TF_nhead=TF_nhead
        self.TF_dim_feedforward=TF_dim_feedforward
        self.TF_act=TF_act
        self.hidden_feats=hidden_feats
        self.out_feats=out_feats
        self.lamda=lamda
        self.positive_processing=positive_processing
        #.GIN=DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)
        self.conv1 =MLP(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv2 =MLP(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv3= MLP(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv4=MLP(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv5= MLP(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv_set.append(self.conv1)
        self.conv_set.append(self.conv2)
        self.conv_set.append(self.conv3)
        self.conv_set.append(self.conv4)
        self.conv_set.append(self.conv5)
        self.MLP_classification=MLP((self.out_feats+self.in_feats)*5,128,2,3)
        self.MLP_percent=MLP((self.out_feats+self.in_feats)*5,8,1,2)
        self.MLP_sign=MLP_ne(self.out_feats,self.out_feats,self.out_feats,2)
        #self.certrion=torch.nn.BCELoss(reduction='mean')
        self.certrion=torch.nn.CrossEntropyLoss(reduction="mean",label_smoothing=0.2)
        #self.certrion=focal_loss.sigmoid_focal_loss()
    def forward(self, datas):
      outputs=None
      i=0
      for data in [datas.x_1,datas.x_2,datas.x_3,datas.x_4]:#,datas.x_5]:
        #data=data[0]
        #NormalizeFeatures(data)
        g=data
        x=g.ndata['emb']
        x=x[:,:self.in_feats]
        #print(x.shape)
        if self.positive_processing is not None:
          x=positive_negtive_processing(x,self.positive_processing)
        #x= (x-mus)/sds
        X_min = x.min(dim=0, keepdim=True).values  # 计算最小值
        X_max = x.max(dim=0, keepdim=True).values  # 计算最大值
        #x=(x-X_min)
        gin_x=self.conv_set[i](x)
        tf_x=self.TF_set[i](torch.unsqueeze(x,dim=0),None)
        #print(tf_x.shape)
        tf_x=torch.squeeze(x,dim=0)
        x=torch.concat([tf_x,gin_x],dim=1)
        #print(x.shape)
        #neg_x=self.conv_set[i](g,-x)
        #x=self.MLP_sign(pos_x+neg_x)
        #print(data)
        #print(f'Weight max: {data.edge_attr.max()}, min: {data.edge_attr.min()} mean: {torch.mean(data.edge_attr)}')
        # 第一层图卷积 + ReLU 激
        #print(edge_index.shape)
        if outputs==None:
            outputs=x
        else:
            outputs=torch.concat([outputs,x],dim=1)
            #print(outputs.shape)
        #x = F.softmax(x, dim=1)
        i+=1
      return outputs  # 返回节点的输出，通常用于节点分类或其他任务
    def multi_forward(self,datas):
        loss=0
        roc=[]
        outputs=[]
        ys=[]
        for i in range (0,len(datas)):
            data=datas[i]
            #print(data)
            out=self.forward(data)
            #out=F.selu(out)
            #print(out.shape)
            outputs.append(out)
            y=data.x_1.ndata['y'].long()
            ys.append(y)
            percent=y.sum()/len(y)*100
            #print(percent)
            #prercent_loss=(percent-y_hat)**2
            #print(y_hat.shape)
        #outputs=torch.cat(outputs)
        #valid_outputs=torch.cat(outputs)
        #padded_outputs=pad_sequence(outputs,batch_first=True,padding_value=-0.01)
        #attention_mask = torch.all(padded_outputs == -0.01, dim=-1)
        #outputs = self.TF(padded_outputs, attention_mask)
        #valid_outputs = outputs[~attention_mask]
        #graph_feature=torch.unsqueeze(torch.sum(valid_outputs,dim=0),dim=0)
        #print(valid_outputs.shape)
        outputs=torch.concat(outputs)
        #print(outputs.shape)
        outputs=self.MLP_classification(outputs)
        #y_hat=self.MLP_percent(graph_feature)
        y_hat=0
        #valid_outputs=F.sigmoid(outputs)
        ys=torch.concat(ys)
        #percent=torch.sum(ys)//len(ys)*100
        #print(percent)
        pred_percent=(y_hat-percent)**2
        #print(outputs.shape)
        #print(ys.shape)
        #loss=self.certrion(torch.squeeze(valid_outputs,dim=1),ys)#bce
        loss=self.certrion(outputs,ys)+pred_percent*self.lamda
        valid_outputs=F.softmax(outputs,dim=1)
        return loss,pred_percent,valid_outputs[:,1],ys
    
    def train_test(self,datas):
      outputs=None
      i=0
      for data in [datas.x_1[0],datas.x_2[0],datas.x_3[0],datas.x_4[0]]:#,datas.x_5[0]]:
        #data=data[0]
        #NormalizeFeatures(data)
        g=data
        x=g.ndata['emb']
        #print(x.shape[0])
        x=x[:,:self.in_feats]
        #print(x.shape)
        if self.positive_processing is not None:
          x=positive_negtive_processing(x,self.positive_processing)
        #features=positive_negtive_processing(features,"1")
        #x=positive_negtive_processing(x,"0")
        #x= (x-mus)/sds
        X_min = x.min(dim=0, keepdim=True).values  # 计算最小值
        X_max = x.max(dim=0, keepdim=True).values  # 计算最大值
        #x=(x-X_min)
        gin_x=self.conv_set[i](x)
        tf_x=self.TF_set[i](torch.unsqueeze(x,dim=0),None)
        tf_x=torch.squeeze(x,dim=0)
        x=torch.concat([tf_x,gin_x],dim=1)
        #neg_x=self.conv_set[i](g,-x)
        #x=pos_x+neg_x
        #x=self.MLP_sign(pos_x+neg_x)
        #mus = torch.mean(x, dim=0)
        #sds = torch.std(x, dim=0)
        #print(sds.shape)
        #sds[sds == 0] = 1
        #x=positive_negtive_processing(x,"0")
        #x= (x-mus)/sds
        #print(data)
        #print(f'Weight max: {data.edge_attr.max()}, min: {data.edge_attr.min()} mean: {torch.mean(data.edge_attr)}')
        # 第一层图卷积 + ReLU 激
        #x=self.conv_set[i](x,edge_index,edge_attr)
        if outputs==None:
            outputs=x
        else:
            outputs=torch.concat([outputs,x],dim=1)
            #print(outputs.shape)
        #x = F.softmax(x, dim=1)
        i+=1
      x=self.MLP_classification(outputs)
      x=torch.squeeze(x,dim=0)
      #print(x.shape)
      x=F.softmax(x,dim=1)
      #x=F.sigmoid(x)
      #x=torch.squeeze(x,dim=0)
      #print(x.shape)
      return x[:,1] #返回节点的输出，通常用于节点分类或其他任务

class DW_GCNTF_KDE(nn.Module):
    def __init__(self, in_feats, hidden_feats, out_feats, TF_num_encoder_layers=2,TF_nhead=4,TF_act='relu',TF_dim_feedforward=2048,n_layers=3,positive_processing=None,lamda=0.1):
        super(DW_GCNTF_KDE, self).__init__()
        self.conv_set=[]
        self.n_layers = n_layers
        self.in_feats=in_feats
        self.TF_num_encoder_layers=TF_num_encoder_layers
        self.TF_nhead=TF_nhead
        self.TF_dim_feedforward=TF_dim_feedforward
        self.TF_act=TF_act
        self.hidden_feats=hidden_feats
        self.out_feats=out_feats
        self.lamda=lamda
        self.positive_processing=positive_processing
        #.GIN=DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)
        self.conv1 =DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv2 =DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv3= DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv4= DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv5= DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#DW_GAT(in_feats,hidden_feats,out_feats,TF_nhead,n_layers)#DW_NLayerGIN(self.in_feats,self.hidden_feats,self.out_feats,self.n_layers)#NLayerGIN(gcn_in_channels, gcn_hidden_channels,gcn_out_channels,6)#GCN_geo(gcn_in_channels, gcn_hidden_channels,gcn_out_channels)
        self.conv_set.append(self.conv1)
        self.conv_set.append(self.conv2)
        self.conv_set.append(self.conv3)
        self.conv_set.append(self.conv4)
        self.conv_set.append(self.conv5)
        self.TF=TransformerNodeEncoder(d_model=self.out_feats*5,num_encoder_layers=TF_num_encoder_layers,nhead=TF_nhead,dim_feedforward=TF_dim_feedforward,transformer_dropout=0.1,transformer_activation=TF_act)
        self.MLP_classification=MLP(self.out_feats*5,128,2,2)
        self.MLP_percent=MLP(self.out_feats*5,128,1,3)
        #self.certrion=torch.nn.BCELoss(reduction='mean')
        self.certrion=torch.nn.CrossEntropyLoss(reduction="mean",label_smoothing=0.1,weight=torch.tensor([1,2]))
        #self.certrion=focal_loss.sigmoid_focal_loss()
    def forward(self, datas):
      outputs=None
      i=0
      for data in [datas.x_1,datas.x_2,datas.x_3,datas.x_4,datas.x_5]:
        #data=data[0]
        #NormalizeFeatures(data)
        g=data
        x=g.ndata['emb']
        #print(x.shape)
        x=x[:,:self.in_feats]
        #print(x.shape)
        if self.positive_processing is not None:
          x=positive_negtive_processing(x,self.positive_processing)
        #x= (x-mus)/sds
        X_min = x.min(dim=0, keepdim=True).values  # 计算最小值
        X_max = x.max(dim=0, keepdim=True).values  # 计算最大值
        #x=(x-X_min)
        x=self.conv_set[i](g,x)
        #print(data)
        #print(f'Weight max: {data.edge_attr.max()}, min: {data.edge_attr.min()} mean: {torch.mean(data.edge_attr)}')
        # 第一层图卷积 + ReLU 激
        #print(edge_index.shape)
        if outputs==None:
            outputs=x
        else:
            outputs=torch.concat([outputs,x],dim=1)
            #print(outputs.shape)
        #x = F.softmax(x, dim=1)
        i+=1
      return outputs  # 返回节点的输出，通常用于节点分类或其他任务
    def multi_forward(self,datas):
        loss=0
        roc=[]
        outputs=[]
        ys=[]
        for i in range (0,len(datas)):
            data=datas[i]
            #print(data)
            out=self.forward(data)
            #out=F.selu(out)
            #print(out.shape)
            outputs.append(out)
            y=data.x_1.ndata['y'].long()
            ys.append(y)
            percent=y.sum()/len(y)*100
            #print(percent)
            #prercent_loss=(percent-y_hat)**2
            #print(y_hat.shape)
        #outputs=torch.cat(outputs)
        #valid_outputs=torch.cat(outputs)
        nn_outputs=torch.cat(outputs)
        #padded_outputs=pad_sequence(outputs,batch_first=True,padding_value=1e-3)
        #attention_mask = torch.all(padded_outputs == 1e-3, dim=-1)
        #outputs = self.TF(padded_outputs, attention_mask)
        #valid_outputs = outputs[~attention_mask]
        #graph_feature=torch.sum(valid_outputs,dim=0)
        #graph_feature=torch.unsqueeze(graph_feature,dim=0)
        #y_hat=self.MLP_percent(graph_feature)
        ##y_hat=0
        pred_percent=torch.zeros(1)
        ys=torch.concat(ys)
        #percent=torch.sum(ys)//len(ys)*100
        #print(percent)
        #pred_percent=(y_hat-percent)**2
        #print(outputs.shape)
        #print(ys.shape)
        ys[ys==0]=-1
        ys[ys==1]=10000
        dists=torch.cdist(nn_outputs,nn_outputs.detach(),p=2)
        sigma=(torch.mean(dists)).detach()
        exp=torch.exp(-dists**2/(2*20**2))
        kde=torch.mean(exp,dim=1)
        #print(kde.shape)
        #print(ys.shape)
        max_min_kde=kde*ys
        loss=torch.mean(kde)
        #loss=self.certrion(torch.squeeze(valid_outputs,dim=1),ys)#bce
        #loss=self.certrion(outputs,ys)+pred_percent*self.lamda
        #valid_outputs=F.softmax(outputs,dim=1)
        ys[ys==-1]=0
        ys[ys==10000]=1
        return loss,pred_percent,kde,ys
    
    def train_test(self,datas):
      outputs=None
      i=0
      for data in [datas.x_1[0],datas.x_2[0],datas.x_3[0],datas.x_4[0],datas.x_5[0]]:
        #data=data[0]
        #NormalizeFeatures(data)
        g=data
        x=g.ndata['emb']
        x=x[:,:self.in_feats]
        #print(x.shape)
        if self.positive_processing is not None:
          x=positive_negtive_processing(x,self.positive_processing)
        #features=positive_negtive_processing(features,"1")
        #x=positive_negtive_processing(x,"0")
        #x= (x-mus)/sds
        X_min = x.min(dim=0, keepdim=True).values  # 计算最小值
        X_max = x.max(dim=0, keepdim=True).values  # 计算最大值
        #x=(x-X_min)
        x=self.conv_set[i](g,x)
        #mus = torch.mean(x, dim=0)
        #sds = torch.std(x, dim=0)
        #print(sds.shape)
        #sds[sds == 0] = 1
        #x=positive_negtive_processing(x,"0")
        #x= (x-mus)/sds
        #print(data)
        #print(f'Weight max: {data.edge_attr.max()}, min: {data.edge_attr.min()} mean: {torch.mean(data.edge_attr)}')
        # 第一层图卷积 + ReLU 激
        #x=self.conv_set[i](x,edge_index,edge_attr)
        if outputs==None:
            outputs=x
        else:
            outputs=torch.concat([outputs,x],dim=1)
            #print(outputs.shape)
        #x = F.softmax(x, dim=1)
        i+=1
      #outputs=torch.unsqueeze(outputs,dim=0)
      #x=self.TF(outputs,None)
      #x=torch.squeeze(x,dim=0)
      dists=torch.cdist(outputs,outputs)
      sigma=torch.mean(dists)
      exp=torch.exp(-dists/(2*20**2))
      kde=torch.mean(exp,dim=1)
      return kde #返回节点的输出，通常用于节点分类或其他任务

