%\documentclass{uai2023} % for initial submission
\documentclass[accepted]{uai2023} % after acceptance, for a revised
% version; also before submission to
% see how the non-anonymous paper
% would look like
%% There is a class option to choose the math font
% \documentclass[mathfont=ptmx]{uai2023} % ptmx math instead of Computer
% Modern (has noticable issues)
% \documentclass[mathfont=newtx]{uai2023} % newtx fonts (improves upon
% ptmx; less tested, no support)
% NOTE: Only keep *one* line above as appropriate, as it will be replaced
%       automatically for papers to be published. Do not make any other
%       change above this note for an accepted version.

%% Choose your variant of English; be consistent
\usepackage[american]{babel}
% \usepackage[british]{babel}

%% Some suggested packages, as needed:
\usepackage{natbib} % has a nice set of citation styles and commands
    \bibliographystyle{plainnat}
    \renewcommand{\bibsection}{\subsubsection*{References}}
\usepackage{mathtools} % amsmath with fixes and additions
% \usepackage{siunitx} % for proper typesetting of numbers and units
\usepackage{booktabs} % commands to create good-looking tables
\usepackage{tikz} % nice language for creating drawings and diagrams

% 
\usepackage{times}
\usepackage{helvet}
\usepackage{courier}
\usepackage{float, graphicx, multirow}
\usepackage{makecell} 
%\usepackage{hyperref}
\usepackage{lipsum}
\usepackage[toc,page]{appendix}
\usepackage{caption}
\usepackage{subcaption}
\usepackage{amsmath,amsfonts,amssymb,amsthm}
\usepackage{amssymb}% http://ctan.org/pkg/amssymb
\usepackage{physics}
\usepackage{pifont}% http://ctan.org/pkg/pifont
\usepackage{tablefootnote}
\newtheorem{theorem}{Theorem}%  meant for continuous numbers
\newtheorem{definition}{Definition}%
\usepackage[colorinlistoftodos]{todonotes}
\newcommand{\STAB}[1]{\begin{tabular}{@{}c@{}}#1\end{tabular}}



%% Provided macros
% \smaller: Because the class footnote size is essentially LaTeX's \small,
%           redefining \footnotesize, we provide the original \footnotesize
%           using this macro.
%           (Use only sparingly, e.g., in drawings, as it is quite small.)

%% Self-defined macros
\newcommand{\swap}[3][-]{#3#1#2} % just an example

\title{Universal Graph Contrastive Learning with a Novel Laplacian Perturbation}

% The standard author block has changed for UAI 2023 to provide
% more space for long author lists and allow for complex affiliations
%
% All author information is authomatically removed by the class for the
% anonymous submission version of your paper, so you can already add your
% information below.
%
% Add authors
\author[1]{\href{mailto:<taewook.ko@snu.ac.kr>?Subject=Your UAI 2023 paper "UGCL"}{Taewook Ko}{}}
\author[1]{Yoonhyuk Choi}
\author[2]{Chong-Kwon Kim}
% Add affiliations after the authors
\affil[1]{%
    Department of Computer Science and Engineering\\
    Seoul National University}
\affil[2]{%
    Research Institute of Energy AI\\
    Korea Institute of Energy Technology}


  
\begin{document}
\maketitle

\begin{abstract}
    Graph Contrastive Learning (GCL) is an effective method for discovering meaningful patterns in graph data. By evaluating diverse augmentations of the graph, GCL learns discriminative representations and provides a flexible and scalable mechanism for various graph mining tasks. This paper proposes a novel contrastive learning framework by introducing Laplacian perturbation.     
    The proposed framework offers a distinct advantage by employing an indirect perturbation method, which provides a more stable approach while maintaining the perturbation effects. Moreover, it exhibits a wide range of applicability by not being restricted to specific graph types.
    We demonstrate that a spectral graph convolution based on the Laplacian successfully extracts representations from diverse graph types. Our extensive experiments on a variety of real-world datasets, covering multiple graph types, show that the proposed model outperforms state-of-the-art baselines in both node classification and link sign prediction tasks.
\end{abstract}

\section{Introduction}\label{sec:intro}
Contrastive learning, which maximizes the mutual information between representations of augmented data, is a widely used method that helps learn discriminative representations from limited labeled data or self-supervised environments \citep{chen2020simple,he2020momentum}. Recently, a growing number of studies have successfully demonstrated the effectiveness of contrastive learning in graph data. These studies, known as Graph Contrastive Learning (GCL), make diverse graph views through several graph perturbation methods such as deleting or adding edges/nodes \citep{you2020graph,zeng2021contrastive}, random-walk sampling \citep{qiu2020gcc}, or masking attributes \citep{zhu2021graph}. On the other hand, JOAO \citep{you2021graph} and AD-GCL \citep{suresh2021adversarial} proposed novel graph encoders for contrastive learning. SimGRACE \citep{xia2022simgrace} added Gaussian noise to graph encoders. 

The majority of prior GCL techniques are designed for specific graph types. Many are confined to unsigned undirected graphs, severely limiting their application domain. Several algorithms that expand the applicability of GCL have been proposed \citep{tong2021directed, shu2021sgcl}. However, each of these extended schemes focuses on a single graph type. For example, DiGCL \citep{tong2021directed} and SGCL \citep{shu2021sgcl} are customized for directed and signed directed graphs, respectively.
Although their approaches are innovative, DiGCL is adequate for dense directed graphs only and SGCL may fail to capture valuable network semantics emanated from the balance theory \citep{heider1946attitudes,holland1971transitivity}.

This paper proposes a novel comprehensive Graph Contrastive Learning algorithm called \textbf{UGCL}\footnote{The source code is available at\\ \url{https://github.com/twko05/UGCL.git}.} (Universal GCL). We devise a new data augmentation scheme based on magnetic Laplacian perturbation. UGCL is applicable to a wide range of graph types, from simple unsigned undirected graphs to signed directed graphs. The magnetic Laplacian \citep{shubin1994discrete,olgiati2017remarks,colin2013magnetic}, initially studied in quantum physics, has recently been applied in graph studies due to its Hermitian properties. \citet{cucuringu2020hermitian,cloninger2017note} used the magnetic Laplacian for clustering in directed graphs. \citet{zhang2021magnet} introduced directed graph convolution based on a magnetic Laplacian. Recent studies \citep{ko2023spectral,fiorini2022sigmanet,he2022msgnn} extended the idea of the magnetic Laplacian to signed graphs by defining a signed magnetic Laplacian. 

The signed magnetic Laplacian captures the structure of the graph by encoding both edge signs and directions with complex values and phases. By adjusting the phase value as a parameter, the Laplacian can be modified, leading us to introduce a Laplacian perturbation method. To the best of our knowledge, this is the first attempt to apply perturbation to the magnetic Laplacian matrix. Unlike the structural perturbation methods that induce abrupt changes to graph structures, phase perturbation enjoys the flexibility of fine adjustments while maintaining the overall graph structure. 

To perform graph convolutions on these augmented views, we introduce a magnetic Laplacian-based spectral convolution layer, inspired by the principles of graph signal processing \citep{defferrard2016convolutional,hammond2011wavelets}. Finally, we maximize the mutual information between the augmented representations by reducing the node-level contrastive loss \citep{zhu2021graph,shu2021sgcl}. We conducted experiments on real-world graph data of various types to demonstrate the effectiveness of our method. The proposed framework outperformed state-of-the-art baselines in node classification and link sign prediction tasks.


The main contributions of this paper are as follows.
\begin{itemize}
\item This paper introduces a novel Universal Graph Contrastive Learning (\textbf{UGCL}). 
\item To the best of our knowledge, this is the first attempt to introduce magnetic Laplacian perturbation.
\item The magnetic Laplacian perturbation enables fine adjustments while keeping the graph topology.
\item The proposed framework has wide applicability and can be applied to various graph types.
\item UGCL demonstrates enhanced graph representation learning on diverse real-world graphs.
\end{itemize}


\section{Related Work}
\subsection{Graph Contrastive Learning}
SimCLR \citep{chen2020simple} and MoCo \citep{he2020momentum} introduced contrastive learning methods for image classification, which have achieved significant success. These works have stimulated numerous subsequent studies aiming to enhance learning efficiency through self-supervised approaches. DGI \citep{velickovic2019deep} and GMI \citep{peng2020graph} are two pioneering attempts that brought the contrastive learning mechanism to graph analysis by measuring the mutual information between graphs and node representations. InfoGraph \citep{sun2019infograph} introduced patch-level representation, while GCC \citep{qiu2020gcc} utilized random-walk sampling to create positive and negative samples. 

These early studies proved the feasibility of contrastive learning in graph representation learning and ignited immense research investigations leading to a plethora of clever graph augmentation techniques \citep{you2020graph,zeng2021contrastive,zhu2021graph,you2021graph} and graph encoding schemes \citep{shu2021sgcl,xia2022simgrace,suresh2021adversarial}. These advancements have led to various application studies including graph clustering \citep{pan2021multi,zhong2021graph}, node embedding \citep{zhu2021graph}, DDI (Drug Drug Interaction) prediction \citep{wang2021multi,li2022geomgcl}, and recommendation \citep{lin2022improving}. 

However, most existing GCL techniques are limited to unsigned undirected graphs. To broaden the scope of the GCL technique, DiGCL \citep{tong2021directed} introduced a contrastive learning method for directed graphs that perturbs the teleport probability of a transition matrix. SGCL \citep{shu2021sgcl} proposed a signed directed contrastive learning method that randomly alters the signs and directions of edges. However, both approaches have limitations and cannot be applied to all graph types. In light of this, this study introduces a novel generalized graph contrastive learning framework with Laplacian matrix perturbation.


\subsection{Hermitian Adjacency Matrix and Magnetic Laplacian}
The traditional adjacency matrix, which utilizes 0s and 1s to encode graph connectivity, possesses the advantageous property of symmetry, allowing for efficient spectral analyses of graphs. However, when it comes to dealing with signed or directed graphs, binary encoding alone proves insufficient for effective representation.
Several studies have proposed to use Hermitian adjacency matrices as an alternative to the traditional adjacency matrix for directed graphs. \citet{liu2015hermitian,guo2017hermitian} encode graph edges using a Hermitian matrix, i.e., a matrix that is equal to its conjugate transpose. Bidirectional edges are encoded as 1, while the two types of unidirectional edges are represented by imaginary numbers ($i$ and $-i$). The plus and minus signs of the imaginary unit distinguish the edge directions. \citet{mohar2020new,cucuringu2020hermitian} used complex numbers with various phases to improve the interpretability of directed adjacency matrices. 

With the Hermitian matrix, we can define a magnetic Laplacian. The magnetic Laplacian, originally used in quantum mechanics for the analyses of charged particles under magnetic flux \citep{shubin1994discrete,olgiati2017remarks,lieb1993fluxes,colin2013magnetic,fanuel2018magnetic}, 
has recently emerged as a flexible and powerful tool for directed graph analyses.
Many algorithms based on the Hermitian matrix were introduced including graph clustering \citep{f2020characterization,cloninger2017note}, community detection \citep{fanuel2017magnetic}, and graph representation learning \citep{furutani2019graph}.
MagNet \citep{zhang2021magnet} proved the PSD (Positive Semi-Definite) property of the proposed directed magnetic Laplacian and introduced a spectral graph convolution for directed graphs. Recently, several studies \citep{ko2023spectral,fiorini2022sigmanet,he2022msgnn,singh2022signed} proposed signed magnetic Laplacians to apply the idea of magnetic Laplacian to signed graphs. 


\section{Problem Formulation}\label{sec:problem}
Let $\mathcal{G} = (V, \mathcal{E})$ be a graph where $V$ is a set of nodes and $\mathcal{E}$ is a set of directed edges. Treating the signed graph as a weighted graph, we use a sign matrix $\textbf{S}$ to denote the sign of edges. The value of $\textbf{S}(u,v)$ is set to $1$ if there exists a positive directed edge from node $u$ to node $v$, $-1$ if there is a negative directed edge, and $0$ if there is no edge from $u$ to $v$. In each direction, a node has one of three possible relationships with another node: \{none, positive, negative\}. This results in nine possible relationships for each node pair, as shown in Figure~\ref{fig:1}(b). The goal of this paper is to discover the latent features of nodes as a low-dimensional embedding vector $z_u \in \mathbb{R}^d$ as:
\begin{equation}
    f(\mathcal{G}) = \mathbf{Z},\label{eq:1}
\end{equation}
where $\mathbf{Z}\in \mathbb{R}^{|V| \times d}$ is a node embedding matrix. Note that we describe the proposed algorithm assuming signed directed graphs, the most generic form of graphs. However, the proposed scheme can be applied to any type of graph with a straightforward modification. 


\section{Magnetic Laplacian}\label{sec:magnetic}
A graph Laplacian ($\textbf{L}=\textbf{D}-\textbf{A}$), where $\textbf{D}$ is a diagonal degree matrix, is a powerful tool to represent graph structure. When the graph is unsigned and undirected, it not only has the positive semi-definite (PSD) property but also has non-negative eigenvalues with associated orthonormal eigenvectors. GCN \citep{kipf2016semi} and ChebyNet \citep{defferrard2016convolutional} proposed spectral graph convolution techniques based on those properties. However, in the case of signed or directed graphs, the presence of complex eigenvalues of the graph Laplacian makes it challenging to satisfy the conditions for spectral convolution in the graph Fourier transform.

Recent studies \citep{ko2023spectral,fiorini2022sigmanet} employed novel signed directed magnetic Laplacian matrices in representing the structure of signed directed graphs. The magnetic Laplacian satisfies the PSD property and is amenable to spectral graph analyses. First of all, we define a complex Hermitian adjacency matrix.  
\begin{equation}
\mathbf{H}^q = \mathbf{A}_s \odot \mathbf{P}^{q},\label{eq:2}
\end{equation}
where $\mathbf{A}_s := \frac{1}{2}(\mathbf{A}+ \mathbf{A}^\intercal)$ is a symmetrized adjacency matrix, $\mathbf{P}^q$ is a phase matrix with complex entries, and $\odot$ denotes element-wise multiplication. The phase matrix is defined as:


\begin{equation}
\textbf{P}^{q}(u,v) := \frac{\text{exp}(i\Theta^{q}(u,v))+ \text{exp}(i\overline{\Theta}^{q}(u,v))}
{\|\text{exp}(i\Theta^{q}(u,v))+ \text{exp}(i\overline{\Theta}^{q}(u,v))\|+\epsilon}.\label{eq:3}
\end{equation}
\begin{equation*}
    \Theta^{q}(u,v)= 
\begin{cases}
    \ q & \ \ \  \ \ \ \text{if} \ \ \ \textbf{S}(u,v)=1\\
    \ \pi+q &  \ \ \   \ \ \ \text{if} \ \ \ \textbf{S}(u,v)=-1\\
    \  i \ \infty & \ \ \   \ \ \  \text{if} \ \ \ \textbf{S}(u,v)=0\\
    \end{cases}
\end{equation*}

\begin{equation*}
    \overline{\Theta}^{q}(u,v)= 
\begin{cases}
    \ -q & \ \ \  \ \ \ \text{if} \ \ \  \textbf{S}(v,u)=1\\
    \ \pi-q & \ \ \  \ \ \ \text{if} \ \ \  \textbf{S}(v,u)=-1\\
    \  i \ \infty & \ \ \  \ \ \ \text{if}  \ \ \ \textbf{S}(v,u)=0\\
    \end{cases}
\end{equation*}

\begin{figure}[t]
  \centering
  \includegraphics[width=\linewidth]{figure_1.PNG}
  \caption{Encoding values of a signed directed graph via complex Hermitian adjacency matrix. The parameter $q$ controls the phase angle. The blue and red arrows indicate positive and negative edges, respectively.}\label{fig:1}
\end{figure}
where $q \in [0, \pi/2]$ is a parameter that controls the encoding phases. The effect of $q$ is described in detail in Section~\ref{sec:theoretical}.
The symmetrized adjacency matrix encodes the node connectivity, while the phase matrix encodes directions and signs of edges with different phase values. Figure~\ref{fig:1} illustrates the edge encoding of the defined Hermitian adjacency matrix. It uniquely encodes all nine node-pair relationships of signed directed graphs. Each relation has a distinct phase and magnitude combination. We can see that $\textbf{H}^q$ is a complex-valued conjugate-symmetric matrix, i.e., a complex Hermitian matrix. We then define the signed directed magnetic Laplacians with the Hermitian adjacency matrix as follows:
\begin{equation}
    \mathbf{L}^{q}_U := \mathbf{D}_s-
    \mathbf{H}^{q} = \mathbf{D}_s- \mathbf{A}_s\odot \mathbf{P}^q,\label{eq:4}
\end{equation}
%We have normalized Laplacian by normalizing Equation 6 with the node degree.
\begin{equation}
    \mathbf{L}^{q}_N := \mathbf{I}-(\mathbf{D}_s^{-\frac{1}{2}} \mathbf{A}_s \mathbf{D}_s^{-\frac{1}{2}})\odot \mathbf{P}^q,\label{eq:5}
\end{equation}
where $\mathbf{D}_s$ is a symmetric degree matrix.
\begin{equation*}
    \textbf{D}_s(u,v) =
\begin{cases}
    \ \sum_{w\in V}\mathbf{A}_s(u,w) & \ \ \  \ \ \ \text{if} \ \ \ u = v     \\
    \  \ \ \ \ \ \ \ \ 0 & \ \ \   \ \ \  \text{if} \ \ \ u \neq v .
    \end{cases}
\end{equation*}

$\mathbf{L}^{q}_U$ and $\mathbf{L}^{q}_N$ are unnormalized and normalized signed directed magnetic Laplacians, respectively. 

\begin{theorem}\label{theorem:1}
    \textbf{The unnormalized and normalized signed directed magnetic Laplacians are positive semi-definite.}
    \begin{equation*}
        x^{\dagger}\textbf{L}_U^q x \geq 0 \quad \text{and} \quad x^{\dagger}\textbf{L}_N^q x \geq 0 \quad \text{for all } x \in \mathbb{C}^n.
    \end{equation*}
\end{theorem}
    
\begin{theorem}\label{theorem:2}
    \textbf{The eigenvalues of the normalized magnetic Laplacians are in the range of $[0, 2]$.}
\end{theorem}
The proofs of the theorems are provided in the Supplementary Material. Because the Laplacians are Hermitian and, by Theorem~\ref{theorem:1}, positive semi-definite, they are diagonalizable by a spectral decomposition with real non-negative eigenvalues. For example, the normalized Laplacian is diagonalized as:
\begin{equation}
    \textbf{L}^{q}_N = \textbf{U}\Lambda\textbf{U}^{\dagger}.\label{eq:6}
\end{equation}
The $k$-th column of the matrix $\mathbf{U}$ is the eigenvector $\mathbf{u}_k$, and $\mathbf{U}^{\dagger}$ is the conjugate transpose of $\mathbf{U}$. $\Lambda$ is a diagonal matrix whose $k$-th diagonal element is the $k$-th eigenvalue, $\Lambda_{k,k} = \lambda_k$. The eigenvalues and eigenvectors contain the structural information of the signed directed graph. We leverage this decomposition to define spectral graph convolution. 



\section{Model Framework}\label{sec:model}
We propose two perturbation stages: structure perturbation and Laplacian perturbation. The structure perturbation directly perturbs the graph data, resulting in a significant perturbation effect. However, it can hinder the convergence of learning. In contrast, the Laplacian perturbation indirectly influences the graph data. It introduces limited alterations while still maintaining effective perturbation effects.

\subsection{Structure Perturbation}
Structure perturbation consists of two types of perturbation: edge sign perturbation and edge direction perturbation. In edge sign perturbation, we randomly alter the signs of edges in a given graph. For instance, we sample $p\%$ of positive edges and change their signs to negative, and do the same to negative edges. Similarly, in edge direction perturbation, we sample $r\%$ of edges and reverse their directions. Random edge perturbation yields a perturbed graph view, $\widetilde{\mathcal{G}} = (V, \widetilde{\mathcal{E}}, \widetilde{\textbf{S}})$. 
Figure~\ref{fig:edge} shows an example of structure perturbation. 

A moderate degree of perturbation can allow the model to learn robust representations from noisy real-world data and uncover relationships that were previously hidden. This can ultimately enhance the model's generalization performance. Many existing studies \citep{you2020graph,zeng2021contrastive,qiu2020gcc,zhu2021graph,you2021graph} solely depend on this kind of structure perturbation. However, excessive perturbation can lead to loss of graph information. The significance of the information in edge signs and directions is acknowledged by the balance and status theories \citep{heider1946attitudes,holland1971transitivity}. A single change in edge sign or direction can lead to violations of balance or status theories in all triads associated with that edge. Even perturbing a few edges can result in a catastrophic disruption to the semantics of the graph. Therefore, we introduce a novel Laplacian perturbation that allows robust alterations to the original graphs. 

\subsection{Laplacian Perturbation}
 The magnetic Laplacian can be modified by adjusting the parameter $q$. By varying the $q$ value, we can obtain different magnetic Laplacian matrices from a given graph structure. With this property, we implement Laplacian perturbation through $q$ variation, selecting $q$ values from the interval $[0, \pi/2]$. Despite the variations of the Laplacian matrix caused by $q$, the underlying graph structure remains unaltered. This technique of Laplacian perturbation is an effective way to augment graphs without distorting the original data. The meaning of Laplacian perturbation is analyzed in Section~\ref{sec:theoretical}.
 
 The overall perturbation procedure of UGCL consists of two steps: structure perturbation and Laplacian perturbation. We create two different perturbed graph views, $\widetilde{\mathcal{G}}_1$ and $\widetilde{\mathcal{G}}_2$, by applying edge-based structure perturbation to the original graph. Then, we obtain the perturbed signed directed magnetic Laplacians, $\widetilde{\textbf{L}}^{q_1}_1$ and $\widetilde{\textbf{L}}^{q_2}_2$, from each of the two structurally perturbed graph views with sampled $q$ values.


\begin{figure}[t]
  \centering
  \includegraphics[width=\linewidth]{edge.PNG}
  \caption{Structure perturbation of a signed directed graph. Dashed edges indicate perturbed edges.}\label{fig:edge}
\end{figure}



\begin{figure*}[t]
  \centering
  \includegraphics[width=0.8\linewidth]{figure_3.PNG}
  \caption{Model overview. Two structurally perturbed graph views are generated, and a perturbed Laplacian is obtained from each of them. The graph encoder is defined with the perturbed Laplacians. Contrastive objectives are calculated after the projection heads.}\label{fig:3}
\end{figure*}



\subsection{Graph Encoder}
\subsubsection{Spectral Convolution via Magnetic Laplacian}
We define a graph encoder with the perturbed Laplacian matrix. The signed directed magnetic Laplacian $\mathbf{L}^q$ is diagonalizable with the eigenvector matrix $\mathbf{U}$ and the diagonal eigenvalue matrix $\Lambda$ thanks to its Hermitian and PSD properties. Several studies on graph convolution \citep{defferrard2016convolutional,hammond2011wavelets} have utilized the eigenvectors as the discrete Fourier modes in graph signal processing. The transformation of graph signals is performed through the graph Fourier transform, 
$\hat{\mathbf{x}}=\mathbf{U}^{\dagger}\mathbf{x}$. 
%Thanks to the unitarity of $\mathbf{U}$, the inverse Fourier transform formula is defined as follows:
%\begin{equation}
% \mathbf{x}=\mathbf{U}\mathbf{\hat{x}}= \sum_{k=1}^{N}\hat{\mathbf{x}}(k)\mathbf{u}_k. 
%\end{equation}
A spectral convolution operation of the graph signal is described as:
\begin{equation}
 \mathbf{g}_\theta \ast \mathbf{x} = \mathbf{U} \mathbf{g}_\theta \mathbf{U}^{\dagger}\mathbf{x},\label{eq:7}
\end{equation}
where $\mathbf{g}_\theta=\operatorname{diag}(\theta)$ is a trainable filter. For efficient calculation, \citet{hammond2011wavelets} proposed a truncated Chebyshev polynomial expansion of the filter as:
\begin{equation}
 \mathbf{g}_{\theta'}(\mathbf{\Lambda})\approx 
 \sum_{k=0}^{K}\theta'_k T_k(\mathbf{\overline{\Lambda}}).\label{eq:8}
\end{equation} 
Here, $T_0(x)=1$, $T_1(x)=x$, and $T_k(x)=2x T_{k-1}(x)-T_{k-2}(x)$ for $k \geq 2$.
%where the $k$ is an expansion order.
$\theta'_k$ are Chebyshev coefficients, and $\mathbf{\overline{\Lambda}}=\frac{2}{\lambda_{max}}\mathbf{\Lambda}-\mathbf{I}$ is a normalized eigenvalue matrix where $\lambda_{max}$ is the largest eigenvalue. Equation~\eqref{eq:7} becomes a simplified form of spectral graph convolution as
\begin{equation}
 \mathbf{g}_{\theta'} \ast \mathbf{x} = 
 \sum_{k=0}^{K}\theta'_k T_k(\mathbf{\overline{L}})\mathbf{x},\label{eq:9}
 \end{equation} 
where $\mathbf{\overline{L}}=\frac{2}{\lambda_{max}}\mathbf{L}-\mathbf{I}$ analogous to $\mathbf{\overline{\Lambda}}$. 


\subsubsection{Spectral Convolution Layer}
We define the spectral convolution layer with the approximated spectral convolution operation in Equation~\eqref{eq:9}. We set the maximum polynomial order $K$ to 1 and assume $\lambda_{max} = 2$ to make it practical. Like GCN \citep{kipf2016semi}, we set $\theta=\theta_0'=-\theta_1'$. Then, the approximated convolution becomes:
\begin{equation}
    \mathbf{g}_{\theta'} \ast \mathbf{x} \approx \theta(\mathbf{I}+(\mathbf{D}^{-\frac{1}{2}}_s \mathbf{A}_s \mathbf{D}^{-\frac{1}{2}}_s) \odot \mathbf{P}^q)\mathbf{x}.\label{eq:10}
\end{equation}

We then apply the following renormalization trick: 
\begin{equation}
\mathbf{I}+(\mathbf{D}^{-\frac{1}{2}}_s \mathbf{A}_s \mathbf{D}^{-\frac{1}{2}}_s)\odot \mathbf{P}^q \to (\mathbf{\overline{D}}^{-\frac{1}{2}}_s \mathbf{\overline{A}}_s \mathbf{\overline{D}}^{-\frac{1}{2}}_s)\odot \mathbf{P}^q,\label{eq:11}
\end{equation}
where $\mathbf{\overline{A}}_s = \mathbf{A}_s+\mathbf{I}$ and $\mathbf{\overline{D}}_s(i,i)=\sum_j{\mathbf{\overline{A}}_s(i,j)}$. The spectral convolution layer is then defined as:
\begin{equation}
  \textbf{X}^{l+1} = 
  (\mathbf{\overline{D}}^{-\frac{1}{2}}_s \mathbf{\overline{A}}_s \mathbf{\overline{D}}^{-\frac{1}{2}}_s\odot \mathbf{P}^q) \mathbf{X}^{l} \mathbf{W}.\label{eq:12}
\end{equation} 
$\textbf{X}^{l+1} \in \mathbb{C}^{|V| \times F}$ denotes the convolved graph signals (representations) after the $l$-th layer; it is complex-valued because the phase matrix $\mathbf{P}^q$ is complex. $\textbf{W} \in \mathbb{R}^{C \times F}$ is a learnable weight matrix, where $C$ and $F$ are the numbers of input and output channels, respectively.  The renormalization trick prevents gradient vanishing and exploding problems. 


\subsubsection{Graph Encoder}
%Graph encoder stacks $L$ layers of the proposed spectral convolution layer and gets output feature matrix, $\mathbf{X}^{(L)}$. 
%The $l$-th layer feature vector $\mathbf{x}^{(l)}$ is defined as:
%\begin{equation}
%  \mathbf{x}_j^{(l)}= \sigma ( \sum_{i=1}^{F_{l-1}} \mathbf{Y}_{ij}^{(l)}\mathbf{x}_i^{(l-1)}+\mathbf{b}_j^{(l)}),
%\end{equation} 
%where $F_{l-1}$ is the channel number of $(l$-1)th layer, The activation function, $\sigma$, is a complex version of ReLU \citep{zhang2021magnet}. 
As the output of the convolution layer has both real and imaginary values, we apply an unwinding operation to concatenate the features in the common domain.
\begin{equation}
    \mathbf{X}_{\text{unwind}}^{(L)} = 
[\text{real}(\mathbf{X}^{(L)}) ||
    \text{imag}(\mathbf{X}^{(L)}) \otimes (-i)].\label{eq:13}
\end{equation} 
A fully connected layer after unwinding finally yields the node representations as 
\begin{equation}
    \textbf{Z} = \sigma(\mathbf{X}_{\text{unwind}}^{(L)}\mathbf{W}^{(L+1)} + \mathbf{B}^{(L+1)}).\label{eq:14}
\end{equation}
$\textbf{Z} \in \mathbb{R}^{|V| \times d}$ is an augmented node representation. 
%The augmented two graph views are fed into the spectral graph encoder and processed as augmented node representations.
Following \citet{jacovi2021contrastive,chen2020big}, we apply a projection head. A non-linear transformation $g(\cdot)$ maps the representations to another latent space that can enhance the discriminative power of contrastive learning. %we used two fully-connected layers.
$\textbf{M}$ is a projected latent of the augmented representation.
\begin{equation}
\textbf{M} = g({\textbf{Z}}).\label{eq:15}
\end{equation}


\subsection{Contrastive Objective}
\subsubsection{Inter-view Loss}
The contrastive objective aims to align the latent representations of the same node while differentiating those of other nodes. Two identical nodes from different graph views are considered an inter-positive pair, while other node pairs are considered inter-negative pairs. For example, a node $u$ from $\widetilde{\mathcal{G}}_1$ and the same node $u$ from $\widetilde{\mathcal{G}}_2$ form an inter-positive pair. On the other hand, the other nodes $\{v \in V : v \neq u\}$ from $\widetilde{\mathcal{G}}_2$ form inter-negative pairs with the node $u$ of $\widetilde{\mathcal{G}}_1$. Even though the nodes in the inter-positive pair come from different graph views, they are the same node. Therefore, we aim to maximize the agreement of the positive-pair latents, $\textbf{m}^{u}_1$ and $\textbf{m}^{u}_2$. For the same reason, we minimize the agreement of the negative-pair latents, $\textbf{m}^{u}_1$ and $\textbf{m}^{v}_2$. The goal of the inter-view objective is to maximize the similarity of positive pairs and minimize the similarity of negative pairs.
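\begin{equation}
  \mathcal{L}_{inter} = -\frac{1}{|V|}\sum_{u \in V} \log\frac{\exp((\textbf{m}^{u}_1 \cdot \textbf{m}^{u}_2)/\tau)}{\sum_{v \in V}\exp((\textbf{m}^{u}_1 \cdot \textbf{m}^{v}_2)/\tau)},\label{eq:16}
\end{equation}
where $\tau$ is a temperature parameter. The negative sign makes $\mathcal{L}_{inter}$ a loss to be minimized: it decreases as the agreement of the positive pairs increases.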



\subsubsection{Intra-view Loss}
While the inter-view loss compares the latent representations of nodes between two distinct graph views, the intra-view loss calculates the discriminative loss within a single graph view. It is essential to differentiate the latent representations of all nodes from each other, as each node possesses unique characteristics. The objective is to make the latent representations of all nodes distinct. The intra-view loss is defined as:
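\begin{equation}
  \mathcal{L}_{intra} = -\frac{1}{K}\sum^{K}_{k=1}\frac{1}{|V|}\sum_{u \in V} \log\frac{1}{\sum_{v \in V, u \neq v}\exp((\textbf{m}^{u}_k \cdot \textbf{m}^{v}_k)/\tau)},\label{eq:17}
\end{equation}
where $k$ indicates the graph view index and $K$ is the number of graph views ($K=2$ in our framework). The negative sign makes $\mathcal{L}_{intra}$ a loss to be minimized: it decreases as the similarity between different nodes within a view decreases. The contrastive loss is the sum of the inter- and intra-view loss functions.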
\begin{equation}
  \mathcal{L}_{contrastive} = \mathcal{L}_{inter}+ \mathcal{L}_{intra}\label{eq:18}
\end{equation}

\subsection{Prediction}
%For model training, we not only use contrastive loss but also utilize label loss. In contrast to the contrastive loss is self-supervised, the label loss is a supervised loss. 
The two augmented graph views are fed into the graph encoders, which produce two node representations, $\textbf{Z}_1$ and $\textbf{Z}_2$. The representations are concatenated and fed into the output layer, which produces the final node embedding as
\begin{equation}
  \textbf{R} = \sigma([\textbf{Z}_1 \parallel \textbf{Z}_2] \textbf{W}^{out}+\textbf{B}^{out}).\label{eq:19}
\end{equation}
The final embedding is utilized for downstream tasks such as predicting the edge sign from $u$ to $v$. The prediction layer is defined as:
\begin{equation}
  \hat{y}_{u,v} = \sigma([\textbf{r}_u||\textbf{r}_v]{\textbf{W}}^{pred}+\textbf{B}^{pred}).\label{eq:20}
\end{equation}
%We define the label loss with the prediction error as:
%\begin{equation}
%\begin{multlined}
%  \mathcal{L}_{label} = -\sum_{{(u,v)}\in {\textbf{S}=1}} y_{u,v} \text{log}\hat{y}_{u,v}  \\
%  -\sum_{{(u,v)}\in {\textbf{S}=-1}}(1-y_{u,v}) \text{log} (1-\hat{y}_{u,v}).
%   \end{multlined}
% \end{equation}
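For semi-supervised learning, the proposed model is trained with the following objective function:
\begin{equation}
  \mathcal{L} = \alpha \mathcal{L}_{contrastive}+ \mathcal{L}_{label},\label{eq:21}
\end{equation}
where $\alpha$ is a weight parameter and $\mathcal{L}_{label}$ is the supervised label loss, i.e., the prediction error of the downstream task measured on the labeled data.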





\section{Theoretical Analysis}\label{sec:theoretical}
\subsection{Meaning of the $q$ value}

The phases of the signed directed magnetic Laplacian are controlled by the parameter $q$. The $q$ value affects the sensitivity to the sign and direction information by determining the phase angle between the real and imaginary axes. When $q$ is small, the phase difference between two reverse edges is small, so the Laplacian places less emphasis on directional information. In the extreme case of $q=0$, direction information is ignored and the model becomes an undirected one.
Conversely, a large $q$ value also decreases the validity of the encoding. When $q=\pi/2$, a positive edge from node $u$ to node $v$ and a negative edge from node $v$ to node $u$ are encoded to the same value. Figure~\ref{fig:high_low} describes the effect of the $q$ value.


\begin{figure}[t]
  \centering
  \includegraphics[width=\linewidth]{high_low_q_5.PNG}
  \caption{Effect of $q$ value.  }\label{fig:high_low}
\end{figure}



\subsection{Analysis of the Laplacian Perturbation}
Direct perturbations to nodes, edges, or attributes of the graph can lead to significant differences between the perturbed graph view and the original graph. In contrast, the proposed Laplacian perturbation, achieved through the variation of the $q$ value, indirectly influences the graph data. Analyzing the exact nature of this perturbation and how it differs from the original graph is challenging. To address this issue, we analyze the impact of Laplacian perturbation on the graph information by quantifying graph entropy. 


\begin{table*}[t]
\centering
\renewcommand{\arraystretch}{1.23}
\resizebox{\textwidth}{!}{%
\begin{tabular}{cc|ccc|cccc|ccc}
\Xhline{2\arrayrulewidth}
&  & \multicolumn{3}{c|}{Signed Convolution} & \multicolumn{4}{c|}{Contrastive Learning} & \multicolumn{3}{c}{Proposed}   \\ \hline
\multicolumn{1}{c|}{Dataset} & Metric & SGCN & SDGNN & SDGCN & DiGCL & GCA & SimGRACE & SGCL & UGCL-S & UGCL-L & UGCL \\   \Xhline{2\arrayrulewidth}

%\multicolumn{1}{c|}{\multirow{4}{*}{Bitcoin-Alpha}} 
\multicolumn{1}{c|}{\multirow{4}{*}{\STAB{\rotatebox[origin=c]{90}{Bitcoin-Alpha}}}}
& AUC & 0.782 & 0.835 & 0.858 & 0.814 & 0.838 & 0.823 & 0.849 & \textbf{0.896} & 0.883 & \underline{0.886} \\
\multicolumn{1}{c|}{} & Macro-F1  & 0.668 & 0.683 & 0.723 & 0.653 & 0.671 & 0.657 & 0.712 & 0.740 & \underline{0.744} & \textbf{0.754}  \\
\multicolumn{1}{c|}{} & Micro-F1  & 0.899 & 0.909 & 0.923 & 0.907 & 0.913 & 0.919  & 0.923 & \underline{0.947} & 0.942 & \textbf{0.949}\\
\multicolumn{1}{c|}{} & Binary-F1  & 0.941 & 0.947 & 0.958 & 0.950 & 0.953 & 0.957 &  0.959 & \textbf{0.973} & 0.969 & \underline{0.971}\\  \hline

\multicolumn{1}{c|}{\multirow{4}{*}{\STAB{\rotatebox[origin=c]{90}{Bitcoin-OTC}}}}
& AUC & 0.832 & 0.879 & 0.887 & 0.852 & 0.868 & 0.859 & 0.893 & \textbf{0.914} & 0.902 & \underline{0.910}\\   
\multicolumn{1}{c|}{} & Macro-F1  & 0.710 & 0.751 & 0.773 & 0.725 & 0.743 & 0.725 & 0.781 & \textbf{0.803} & 0.796 & \underline{0.802} \\
\multicolumn{1}{c|}{} & Micro-F1  & 0.886 & 0.902 & 0.911 & 0.904 & 0.907 & 0.906  & 0.920 & \underline{0.935} & 0.930 & \textbf{0.937}\\
\multicolumn{1}{c|}{} & Binary-F1  & 0.924 & 0.938 & 0.950 & 0.948 & 0.948 & 0.948 & 0.956 &  \underline{0.964} & 0.962 & \textbf{0.965}\\  \hline

\multicolumn{1}{c|}{\multirow{4}{*}{\STAB{\rotatebox[origin=c]{90}{Epinions}}}} & AUC & 0.848 & 0.914 & 0.939 & 0.839 & 0.911 & 0.913 & 0.876 & 0.941 & \textbf{0.943} & \underline{0.942}\\   
\multicolumn{1}{c|}{} & Macro-F1  & 0.741 & 0.831 & 0.850 & 0.726 & 0.814 & 0.812 & 0.798 & 0.861 & \textbf{0.865} & \underline{0.863} \\
\multicolumn{1}{c|}{} & Micro-F1  & 0.893 & 0.912 & 0.925 & 0.887 & 0.913 & 0.915  & 0.909 & \underline{0.934} & \textbf{0.936} & \textbf{0.936}\\
\multicolumn{1}{c|}{} & Binary-F1  & 0.937 & 0.944 & 0.956 & 0.936 & 0.950 & 0.951 & 0.948 & \underline{0.962} & \textbf{0.963} & \textbf{0.963}\\  \hline

\multicolumn{1}{c|}{\multirow{4}{*}{\STAB{\rotatebox[origin=c]{90}{Slashdot}}}} & AUC & 0.740 & 0.849 & 0.886 & 0.813 & 0.870 & 0.865 & 0.783 & \underline{0.900} & 0.891 & \textbf{0.902}\\   
\multicolumn{1}{c|}{} & Macro-F1  & 0.688 & 0.729 & 0.780 & 0.667 & 0.750 & 0.745 & 0.683 & \textbf{0.792} & 0.785 & \underline{0.789} \\
\multicolumn{1}{c|}{} & Micro-F1  & 0.786 & 0.823 & 0.855 & 0.813 & 0.842 & 0.833  & 0.811 & \textbf{0.864} & 0.859 & \underline{0.863}\\
\multicolumn{1}{c|}{} & Binary-F1  & 0.869 & 0.889 & 0.908 & 0.887 & 0.902 & 0.895 & 0.884 & \textbf{0.915} & 0.911 & \underline{0.914}\\  \hline

\Xhline{2\arrayrulewidth}
\end{tabular}%
}
\caption{Link sign prediction performance. \textbf{Bold} and \underline{underline} indicate the best and second-best performance, respectively. The reported scores are averages over ten experiments with different seed sets.}
\label{tab:1}
\end{table*}


Von Neumann entropy is a widely used form to quantify graph entropy.
 \citet{ye2014approximate} introduced the Von Neumann entropy of a directed graph with Laplacian matrix as:
\begin{equation*}
    H(\mathcal{G}_D) = \frac{\text{Tr}[\text{L}]}{|V|}-    \frac{\text{Tr}[\text{L}^2]}{|V|}. 
\end{equation*}
Leveraging the Von Neumann entropy of directed graphs, we derive Theorem~\ref{theorem:3} which states that the entropy of a signed directed graph is less than or equal to the sum of the entropy of a positive edge graph and a negative edge graph.
\begin{theorem} \textbf{Von Neumann Entropy of a Signed Directed Graph} \label{theorem:3}
\begin{equation*}
H(\mathcal{G}) \leq H(\mathcal{G}^+_D) + H(\mathcal{G}^-_D).
\end{equation*}
\end{theorem}
Here, $\mathcal{G}$ is a signed directed graph, and $\mathcal{G}^+_D$ and $\mathcal{G}^-_D$ are the graph with positive edges and the graph with negative edges, respectively. That is, the Von Neumann entropy of a signed directed graph is upper-bounded by the sum of the entropies of these two graphs. This theorem is proved in the Supplementary Material. Then, we quantify the effect of Laplacian perturbation through the change in the Von Neumann entropy caused by varying the $q$ value.
\begin{definition}
    \textbf{Perturbation Error} 
    Given a perturbation term $\Delta q$, we define the perturbation error of the Von Neumann entropy caused by Laplacian perturbation.
    \begin{equation*}
    \Delta H(\mathcal{G},q, \Delta q) = H(\mathcal{G},q) - H(\mathcal{G},q+ \Delta q).
\end{equation*} 
\end{definition} 
\begin{theorem}
    \textbf{Perturbation Error of a Signed Directed Graph} 
\begin{equation*}
\begin{split}
    \Delta H(\mathcal{G}^+_D, q, \Delta q),     \Delta H(\mathcal{G}^-_D, q, \Delta q) \leq \Delta H(\mathcal{G}, q, \Delta q), \\
    \Delta H(\mathcal{G}, q, \Delta q) \leq 
    \Delta H(\mathcal{G}^+_D, q, \Delta q)+
    \Delta H(\mathcal{G}^-_D, q, \Delta q).
\end{split}
\end{equation*}  \label{theorem:4}
\end{theorem}


The perturbation error of a signed directed graph is thus bounded from below and above. We can observe that the graph entropy varies with the $q$ value even though the degree matrix and adjacency matrix are fixed. This perturbation error caused by Laplacian perturbation provides contrastive information of various magnitudes for the encoder. It helps the encoder focus more on the graph structure rather than learning only from the supervised signal. The proof of Theorem~\ref{theorem:4} is in the Supplementary Material.

In this subsection, we investigate the impact of Laplacian perturbation on graphs and infer the resulting variations. This analysis demonstrates the effectiveness of Laplacian perturbation as an alternative method that avoids direct perturbation of the graph structure. By preserving the graph's structural integrity while inducing meaningful perturbations, Laplacian perturbation proves to be highly valuable across various applications.

\begin{table}[t]
\centering
\renewcommand{\arraystretch}{1.2}
\resizebox{\columnwidth}{!}{%
\begin{tabular}{ccccc}
\Xhline{2.5\arrayrulewidth}
Dataset & \# nodes & \# pos edges & \# neg edges & ratio (\%) \\ \hline
Bitcoin-Alpha & 3,783 & 22,650 & 1,536 & 93.7 \\
Bitcoin-OTC & 5,881 & 32,029 & 3,563 & 90.0 \\
Epinions & 131,828 & 717,667 & 123,705 & 85.3 \\
Slashdot & 82,144 & 425,072 & 124,130 & 77.4 \\ \Xhline{2.5\arrayrulewidth}
%Bitcoin-Alpha\tablefootnote{http://www.btc-alpha.com} & 3,783 & 22,650 & 1,536 & 93.7 \\
%Bitcoin-OTC\tablefootnote{http://www.bitcoin-otc.com} & 5,881 & 32,029 & 3,563 & 90.0 \\
%Epinions\tablefootnote{http://www.epinions.com} & 131,828 & 717,667 & 123,705 & 85.3 \\
%Slashdot\tablefootnote{http://www.slashdot.com} & 82,144 & 425,072 & 124,130 & 77.4 \\ \Xhline{2.5\arrayrulewidth}
\end{tabular}%
}
\caption{Dataset statistics.}
\label{tab:dataset}
\end{table}


\section{Experiments}\label{sec:experiment}
To demonstrate the effectiveness and universality of our model, we evaluate it on various graph datasets. We conduct node classification tasks on unsigned undirected graphs and link sign prediction tasks on signed directed graphs. %For details on the datasets, baselines, task settings, and reproducible information, please refer to the Supplemental Material.
%Detail descriptions of the dataset, baseline, task setting, and reproducible information are reported in the Supplement Material. 
Through the experiments, we aim to address the following research questions:
\begin{itemize}
    \item \textbf{RQ1}: Does UGCL have better representation learning ability compared to state-of-the-art baselines?
    \item \textbf{RQ2}: How does UGCL demonstrate its universality across different types of graphs?
    \item \textbf{RQ3}: How do the perturbation methods of UGCL affect the performance?
    \item \textbf{RQ4}: How do the model components of UGCL affect the performance?
\end{itemize}




\subsection{Link Sign Prediction (RQ1)}
\subsubsection{Baselines}
We implemented seven baselines to compare the model performance. There are three signed graph convolution models and four contrastive learning models.
\begin{itemize}
\item \textbf{SGCN} \citep{derr2018signed} defines (un)balanced path based on the balanced theory for neighbor aggregation. 
\item \textbf{SDGNN} \citep{huang2021sdgnn} proposed four weight matrices to aggregate neighbor features by edge types. 
\item \textbf{SDGCN} \citep{ko2023spectral} proposed a magnetic Laplacian to overcome the limitation of graph Laplacian.
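% NOTE(review): the results table (tab:1) names this baseline column ``DiGCL'', not ``GraphCL'' -- confirm which is correct and make the two agree.
\item \textbf{GraphCL} \citep{you2020graph} randomly perturbs graph structures by dropping or adding edges and nodes. 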
\item \textbf{GCA} \citep{zhu2021graph} proposed score-based graph augmentation and node-level contrastive objective.
\item \textbf{SimGRACE} \citep{xia2022simgrace} introduced a graph encoder perturbation rather than graph augmentation to overcome the cumbersome augmentation search.
\item \textbf{SGCL} \citep{shu2021sgcl} is a GCL for signed directed graphs, which perturbs the edge sign and directions.
\end{itemize}

\subsubsection{Experimental Result}
Table~\ref{tab:1} summarizes the link sign prediction results. The results are the average of ten independent experiments. There are two variants of UGCL; UGCL-S is a model with structure perturbation, and UGCL-L is a model with Laplacian perturbation. The results show that UGCL and its variants always perform the best on all datasets and in all metrics. We can infer that the proposed model learns the node representation properly from the signed directed graphs. 

SGCL or SDGCN demonstrates the second-best performance, following the proposed model. SDGCN achieves good performance by leveraging its signed directed spectral convolution, which effectively utilizes the sign and direction of edges. However, its performance is limited in the context of semi-supervised learning. On the other hand, SGCL is a contrastive learning model specifically designed for signed graphs, and its strong performance on most datasets validates the effectiveness of contrastive learning. However, SGCL exhibits poor performance on the Epinions and Slashdot datasets. Although the structure perturbation methods of SGCL and the proposed model share similarities, the proposed model mitigates the drawbacks of structure perturbation by incorporating Laplacian augmentation. Furthermore, UGCL benefits from an advanced spectral graph encoder compared to the simple GNN encoder utilized in SGCL.


\begin{figure*}[t]
  \centering
  \includegraphics[width=0.9\linewidth]{figure_5_2.PNG}
  \caption{Structure perturbation analysis. The x-axis indicates the perturbing ratio.}\label{fig:5}
\end{figure*}

\begin{figure*}[t]
  \centering
  \includegraphics[width=0.9\linewidth]{figure_6_2.PNG}
  \caption{Laplacian perturbation analysis. The x-axis indicates the standard deviation of the Gaussian noise.}\label{fig:6}
\end{figure*}

\subsection{Universality of UGCL (RQ2)}
The signed directed magnetic Laplacian has the capability to represent various graph types. For instance, in the case of vanilla graphs where all edges are assumed to be bidirectional and positive ($\mathbf{S}=1$), the edges are encoded using $\{0, 1\}$, resulting in a Laplacian equivalent to the traditional graph Laplacian. When dealing with unsigned directed graphs, the edges are encoded using $\{0, 1, \frac{1}{2}(\cos q+i\sin q), \frac{1}{2}(\cos q-i\sin q)\}$, which resembles the Laplacian definition in MagNet \citep{zhang2021magnet}. In essence, the traditional graph Laplacian and the Laplacian employed in MagNet can be viewed as special cases of our encoding. Similarly, the signed undirected graph can be handled as well. Consequently, the signed directed magnetic Laplacian proves to be applicable to all graph types, and the Laplacian perturbation method exhibits wide-ranging utility.

To demonstrate the wide applicability of our approach, we conducted a node classification task on different graph types. Due to space limitations, the results are provided in the Supplementary Material. It is worth noting that the proposed UGCL model performs well on both undirected and directed graphs, further highlighting its versatility and effectiveness across different graph types.


\subsection{Perturbation Analysis (RQ3)}
Figure~\ref{fig:5} illustrates the performance variation with respect to the edge perturbation ratio, where Laplacian perturbation is not utilized in this particular experiment. The results indicate that the performance improves initially with a small perturbation ratio, but starts to decline when the ratio exceeds 0.1. This observation highlights the effectiveness of structure perturbation when applied in moderation, while also emphasizing the potential risks associated with excessive perturbation.

Figure~\ref{fig:6} displays the performance variation in response to Laplacian perturbation, where structure perturbation is not employed in this specific experiment. We set $q=\pi/4$ and introduce Gaussian noise with zero mean and varying standard deviations. The x-axis represents the standard deviation of the Gaussian noise. Similar to structure perturbation, performances are low when the standard deviation is zero, indicating no Laplacian perturbation. The results show an initial increase in performance followed by a decrease. Compared to structure perturbation, Laplacian perturbation demonstrates lower sensitivity to the perturbation ratio. This suggests that Laplacian perturbation can provide more stable and robust perturbation effects.

While graph augmentations are essential in contrastive learning, excessively large-scale perturbations can be detrimental to the training process. Structure perturbation provides direct contrastive information, but it runs the risk of compromising the network semantics. On the other hand, Laplacian perturbation offers indirect perturbations to the graph data while maintaining effectiveness. In UGCL, these two augmentation techniques are combined to achieve efficient and stable graph augmentation, striking a balance between informative perturbations and preserving the integrity of the network semantics.

\subsection{Ablation Study (RQ4)}\label{sec:ablation}
We check the effects of UGCL components through ablation studies. Table~\ref{tab:2} shows the Micro-F1 scores, where w/o struct, w/o Lapla, and w/o aug are variants of the perturbation methods. In particular, w/o aug, which turns off both perturbations, shows the lowest performance. As we expected, the model leverages the advantage of contrastive learning. This shows that perturbations are important in our model. w/o contrast is a model with $\alpha=0$, i.e., the model uses the label loss only. Note that this does not mean that the model does not utilize the benefits of contrastive learning: even though the contrastive loss weight is zero, the label loss is calculated with augmented representations of the graph views. w/o proj is a model without a projection head. It is confirmed that the projection head is useful for robust contrastive learning \citep{jacovi2021contrastive,chen2020big}.


\section{Conclusion}\label{sec:conclusion}
This paper proposes UGCL, a graph contrastive learning framework. It incorporates two levels of perturbation, structure and Laplacian. Structure perturbation involves modifying the signs and directions of random edges. Although this perturbation may lead to the loss of graph information, it enhances the noise robustness. Laplacian perturbation changes the phase parameter $q$ during each training iteration. It does not directly impact the graph structure but rather influences the magnetic Laplacian. The efficacy of Laplacian perturbation is verified through both theoretical analysis and empirical experiments. By utilizing the perturbed Laplacian, we define a spectral graph encoder. The proposed framework demonstrates its wide applicability to all graph types. Through extensive evaluations on diverse real-world graphs, the proposed framework consistently demonstrates superior performance compared to other existing approaches. 


\begin{table}[t]
\centering
\renewcommand{\arraystretch}{1.2}
\resizebox{\columnwidth}{!}{%
\begin{tabular}{lcccc}
\Xhline{2.5\arrayrulewidth}
 & Bitcoin-Alpha & Bitcoin-OTC & Epinions & Slashdot \\ \hline
UGCL                     & \textbf{0.949} & \textbf{0.937} & \textbf{0.936} & 0.863 \\
\quad w/o struct  & 0.942 & 0.930 & \textbf{0.936} & 0.859 \\
\quad w/o Lapla  & 0.947 & 0.935 & 0.934 & \textbf{0.864} \\
\quad w/o aug   & 0.919 & 0.913 & 0.920 & 0.853 \\
\quad w/o contrast & 0.940 & 0.931 & 0.929 & 0.855 \\
\quad w/o proj   & 0.942 & 0.932 & 0.931 & 0.858 \\
\Xhline{2.5\arrayrulewidth}
\end{tabular}%
}
\caption{The results of ablation study.}\label{tab:2}
\end{table}

\begin{acknowledgements} 
    This work was supported by the KENTECH Research Grant (202200019A), IITP (No.2021-0-02068, 2023-RS-2022-00156287) grant funded by the Korean government (MSIT), and BK21 Four Intelligence Computing (4199990214639) funded by the National Research
Foundation of Korea (NRF).

\end{acknowledgements}

% References
%\bibliography{uai2023-template}
\bibliography{ko_750}

\end{document}
