%\documentclass{uai2023} % for initial submission
\documentclass[accepted]{uai2023} % after acceptance, for a revised
% version; also before submission to
% see how the non-anonymous paper
% would look like

%% There is a class option to choose the math font
% \documentclass[mathfont=ptmx]{uai2023} % ptmx math instead of Computer
% Modern (has noticable issues)
% \documentclass[mathfont=newtx]{uai2023} % newtx fonts (improves upon
 % ptmx; less tested, no support)
% NOTE: Only keep *one* line above as appropriate, as it will be replaced
%       automatically for papers to be published. Do not make any other
%       change above this note for an accepted version.

%% Choose your variant of English; be consistent
\usepackage[american]{babel}
% \usepackage[british]{babel}

%% Some suggested packages, as needed:
\usepackage{natbib} % has a nice set of citation styles and commands
    \bibliographystyle{plainnat}
    \renewcommand{\bibsection}{\subsubsection*{References}}
\usepackage{mathtools} % amsmath with fixes and additions
% \usepackage{siunitx} % for proper typesetting of numbers and units
\usepackage{booktabs} % commands to create good-looking tables
\usepackage{tikz} % nice language for creating drawings and diagrams

\usepackage{times}
\usepackage{helvet}
\usepackage{courier}
\usepackage{float, graphicx, multirow}
\usepackage{makecell} 
%\usepackage{hyperref}
\usepackage{lipsum}
\usepackage[toc,page]{appendix}
\usepackage{caption}
\usepackage{subcaption}
\usepackage{mathtools}
\usepackage{amsmath,amsfonts,amssymb,amsthm}
\usepackage{amssymb}% http://ctan.org/pkg/amssymb
\usepackage{physics}
\usepackage{pifont}% http://ctan.org/pkg/pifont
\usepackage{tablefootnote}
\newtheorem{theorem}{Theorem}%  meant for continuous numbers
\newtheorem{definition}{Definition}%
\newtheorem{proposition}{Proposition}%
\usepackage[colorinlistoftodos]{todonotes}
\newcommand{\STAB}[1]{\begin{tabular}{@{}c@{}}#1\end{tabular}}


% for cross referencing the main text
% PLEASE ONLY USE xr IN THE SUPPLEMENTARY MATERIAL. 
% In the main paper, hard code any cross-reference to the supplementary material. 
\usepackage{xr} 
%\externaldocument{uai2023-template}
\externaldocument{ko_750}


%% Provided macros
% \smaller: Because the class footnote size is essentially LaTeX's \small,
%           redefining \footnotesize, we provide the original \footnotesize
%           using this macro.
%           (Use only sparingly, e.g., in drawings, as it is quite small.)

%% Self-defined macros
\newcommand{\swap}[3][-]{#3#1#2} % just an example

\title{Universal Graph Contrastive Learning with a Novel Laplacian Perturbation\\(Supplementary Material)}

% The standard author block has changed for UAI 2023 to provide
% more space for long author lists and allow for complex affiliations
%
% All author information is authomatically removed by the class for the
% anonymous submission version of your paper, so you can already add your
% information below.
%
% Add authors
\author[1]{\href{mailto:<taewook.ko@snu.ac.kr>?Subject=Your UAI 2023 paper "UGCL"}{Taewook Ko}{}}
\author[1]{Yoonhyuk Choi}
\author[2]{Chong-Kwon Kim}
% Add affiliations after the authors
\affil[1]{%
    Department of Computer Science and Engineering\\
    Seoul National University}
\affil[2]{%
    Research Institute of Energy AI\\
    Korea Institute of Energy Technology}


\begin{document} 
\onecolumn %% Turn this off if single column is desired for the supplement

\maketitle
%This Supplementary Material should be submitted as a separate file. Please do not append the Supplementary Material to the main paper. 
%Fig. \ref{fig:pitt} and Eq \ref{eq:example} in the main paper can be cross referenced using \texttt{xr}. 

\appendix

\section{Notations}
We provide a summary of the notations used in this paper and their descriptions in the following tables for reader convenience.
\begin{table}[h]
\centering
%\renewcommand{\arraystretch}{1.3}
%\resizebox{\columnwidth}{!}{%
\begin{tabular}{cl}
\Xhline{2.5\arrayrulewidth}
Notation  & Description  \\ \hline
$\mathcal{G}$          &  Graph            \\
$\mathcal{G}^+, \mathcal{G}^-$          &  Positive and negative graph            \\
\textit{V}, \textit{E}           & Node and edge sets    \\
%$          & Edge set      \\
\textbf{S}           & Sign matrix   \\
%$\mathcal{E}^+$, $\mathcal{E}^-$  & Positive and negative edge matrix              \\
\textbf{\textit{Z}}   & Node representation matrix              \\
$\textbf{A}$, $\textbf{A}_s$ & Adjacency matrix and symmetric adjacency matrix \\
$\textbf{D}$, $\textbf{D}_s$ & Degree matrix and symmetric degree matrix \\
\textbf{L} &     Laplacian matrix \\  
$\textbf{L}^{q}$  & Magnetic Laplacian matrix with parameter $q$              \\
$\widetilde{\mathcal{G}}$, $\widetilde{\textbf{L}}^{q}$          &   Structure perturbed graph and perturbed magnetic Laplacian            \\
$\textbf{P}^{q}$ &         Phase matrix           \\
$\textbf{H}^{q}$ &           Complex Hermitian adjacency matrix          \\
$q$ & Phase control parameter \\
\textbf{X} &   Input graph signal             \\
\textbf{M} &   Projected representations             \\
$g$ &   Projection head             \\
\textbf{W, b} &   Learnable weight matrix and bias           \\
\Xhline{2.5\arrayrulewidth}
\end{tabular}%
\caption{Notations used in this paper and their descriptions.}
\label{tab:notation}
\end{table}



\section{Experiment Details}
\subsection{Link Sign Prediction Task}
\subsubsection{Dataset and Metric}
We used four signed-directed graph datasets, Bitcoin-Alpha, Bitcoin-OTC, Epinions, and Slashdot, which are widely used in signed-directed graph research.  
Bitcoin-Alpha\footnote{http://www.btc-alpha.com} and Bitcoin-OTC\footnote{http://www.bitcoin-otc.com} \citep{kumar2016edge} are extracted from Bitcoin trading platforms. Nodes are users, and edges are user relationships. Users can score others on a scale of $-10$ to $+10$. Edges with scores higher than 0 are treated as positive edges, and the others as negative edges. Epinions\footnote{http://www.epinions.com} \citep{guha2004propagation} is a who-trust-whom network crawled from a consumer review site. Users can express trust or distrust in the reviews of other users. Slashdot\footnote{http://www.slashdot.com} \citep{kunegis2009slashdot} is a social network of a user community site where users share new information. Users tag others as friends or foes, and we construct positive and negative edges from this information. 
The preprocessed datasets can be found at the Stanford Network Analysis Project (SNAP)\footnote{https://snap.stanford.edu/data/index.html\#signnets}.
Some papers \citep{li2020learning,derr2018signed} used sub-networks of the originals due to the large network size. We use the whole graph structure for the experiments. In the training phase, we sample positive and negative edges at a ratio of 3:1, but in the validation and test sets, we maintain the natural ratio. This is because the ratio of positive to negative edges is highly unbalanced. If we train a model with 90 percent positive samples, the model can easily improve its performance by simply predicting that all links are positive. Accordingly, we adopt four metrics, AUC, macro-F1, micro-F1, and binary-F1, for unbiased evaluation.


\subsubsection{Implementation Details}
 Since some graph contrastive baselines are intended for self-supervised learning, we train them with the same semi-supervised loss of the proposed model. Moreover, we removed the read-out process of GraphCL and SimGRACE, which are designed for graph embedding. 
 We ran each experiment ten times with different seeds for a fair comparison. The seeds are [0, 10, 20, 30, 40, 50, 60, 70, 80, 90]. We apply early stopping by comparing the training and validation losses. The model parameters with the lowest validation loss are saved during training. If the validation loss goes up consecutively for more than ten epochs, we stop training and evaluate the performance on the test set. 
We follow the hyperparameter settings of the original papers of each model. The node embedding dimension is set to 128 for all the baselines to ensure the same learning capacity. The edges are split into 60:20:20 for training, validation, and test sets. However, we did not use all the positive edges as training instances during the training stage. The structure perturbing ratios $p$ and $r$ are set to 0.1 for all datasets. The magnetic Laplacian phase $q$ is perturbed by adding Gaussian noise with a standard deviation of 0.1. The contrastive loss weight $\alpha$ is set to 0.2. The graph encoder stacks two signed-directed spectral convolution layers. We use the Adam optimizer with learning rate = 0.001 and weight decay = 0.001. All experiments are run 10 times with different seed sets to avoid randomness and get the average score. The experiments are conducted on a Xeon E5-2660 v4 CPU and accelerated with an Nvidia Titan XP 12G GPU. The software is implemented on Ubuntu 16.04 with Python v3.7 and PyTorch v1.12.1.





\subsection{Node Classification Task}
\subsubsection{Dataset and Metric}
Our experiments utilized five datasets, including three directed citation networks (Cora, Citeseer, and Pubmed) and two undirected co-author networks in Computer Science (CS) and Physics. In the citation networks, nodes correspond to scientific publications and edges represent citations, while in the co-author networks, nodes correspond to researchers and edges represent co-author relations, which are bidirectional. All datasets were preprocessed and made available through the DGL library\footnote{https://docs.dgl.ai/}. To evaluate the performance of our models on the node classification task, we used prediction accuracy as our primary metric.

\begin{table}[h]
\centering
\renewcommand{\arraystretch}{1.3}
{%
\begin{tabular}{ccccc}
\Xhline{2.5\arrayrulewidth}
 Dataset &\# node & \# edge &  \# features & \# class \\ \hline
Cora & 2,708 & 10,556 &  1,433 & 7 \\
Citeseer & 3,327 & 9,228 & 3,703  &6 \\
Pubmed &  19,717 & 88,651 & 500  & 3 \\ 
CS &  18,333 & 163,788 & 6,805 & 15 \\ 
Physics & 34,493 & 495,924 &8,415&5  \\
\Xhline{2.5\arrayrulewidth}
\end{tabular}%
}
\caption{Dataset statistics.}
\label{tab:Dataset Statistics}
\end{table}



\subsubsection{Baselines}
We implemented nine baselines to compare the model performance. There are five graph convolution models and four contrastive learning models. 
\begin{itemize}
\item \textbf{GCN} \citep{kipf2016semi} is a spectral graph convolution model with Laplacian matrix.
\item \textbf{GAT} \citep{velivckovic2017graph} is a spatial graph convolution model utilizing attention mechanism. 
\item \textbf{APPNP} \citep{gasteiger2018predict} utilizes PageRank for an efficient propagation scheme.
\item \textbf{MagNet} \citep{zhang2021magnet} defined a magnetic Laplacian for directed graph convolution. 
\item \textbf{DiGCN} \citep{tong2020digraph} is a directed graph convolution with directed Laplacian matrix.
\item \textbf{DiGCL} \citep{tong2021directed} is a graph contrastive model for directed graphs, which perturbs the Directed Laplacian matrix by changing the teleport probability of the transition matrix.
\end{itemize}
    We also used the contrastive learning models \textbf{GraphCL}, \textbf{GCA}, and \textbf{SimGRACE}. 

\subsubsection{Implementation Details}
We followed the same settings as the link-sign prediction experiments, conducting ten runs with different seed sets, applying early stopping criteria, and using the same computing resources. The hyper-parameters used were consistent with those of the original papers. %The results are semi-supervised learning experiments. %$ are trained with 50 to 100 labeled nodes depending on the dataset.

\subsubsection{Prediction Performance}
The proposed UGCL and its variants consistently demonstrate superior performance across various datasets, with the exception of the Pubmed dataset. Despite this, the overall results highlight the wide applicability and effectiveness of UGCL in comparison to other approaches. These findings emphasize the competitive performance of UGCL and its potential as a powerful tool for graph-related tasks.

\begin{table*}[h]
\centering
\renewcommand{\arraystretch}{1.2}
%\resizebox{\textwidth}{!}
{%
\begin{tabular}{c|l|ccc|cc}
\Xhline{2\arrayrulewidth}
\multicolumn{2}{c|}{\multirow{2}{*}{Method}}  & \multicolumn{3}{c|}{Directed} & \multicolumn{2}{c}{Undirected}  \\  \cline{3-7}
\multicolumn{2}{c|}{}  & CORA & CITESEER &  PUBMED & CS & Physics \\ \hline

\multirow{5}{*}{\STAB{\rotatebox[origin=c]{90}{Convolution}}} 
 & GCN   & 0.761 & 0.657 & 0.740  & 0.818 & 0.906  \\
& GAT   & 0.780 & 0.658 & 0.771  & 0.827 & 0.912 \\ 
 & APPNP   & 0.769 & 0.664 & 0.768  & 0.823 & 0.920 \\ %\cline{2-7} 
 & MagNet   & 0.789 & 0.683 & 0.765  & 0.845 & 0.914  \\
 & DiGCN   & 0.770 & 0.669 & 0.776  & 0.857 & 0.914 \\ \hline

\multirow{7}{*}{\STAB{\rotatebox[origin=c]{90}{Contrastive}}}
 & GraphCL   & 0.782 & 0.681 & 0.763  & 0.887 & 0.935 \\ 
 & GCA   & 0.786 & 0.688 & \underline{0.794}  & 0.889 & 0.940  \\ 
 & SimGRACE   & 0.791 & 0.673 & \textbf{0.795}  & 0.897 & 0.941 \\ 
 & DiGCL   & \underline{0.794} & 0.672 & 0.757  & 0.902 & 0.927  \\  \cline{2-7}
 & UGCL  & \textbf{0.796} & \textbf{0.699} & 0.762  & \textbf{0.916} & \textbf{0.955}  \\ 
 & UGCL-S   & 0.787 & 0.658 & 0.764  & 0.893 & \underline{0.951} \\ 
 & UGCL-L   & 0.791 & \underline{0.692} & 0.751  & \underline{0.907} & 0.940  \\ \hline
\Xhline{2\arrayrulewidth}
\end{tabular}%
}
\caption{Node classification performance. \textbf{Bold} and \underline{underline} indicate the best and the second-best performance, respectively. The performances are the average scores of 10 experiments with different seed sets.}
\label{tab:my-table}
\end{table*}




\section{Proof of Theorems}
\begin{theorem} For a signed directed graph $\mathcal{G} = (V, E, \textbf{\textit{S}})$, both the unnormalized and normalized magnetic Laplacians $\textbf{L}_{U}^{q}, \textbf{L}_{N}^{q}$ are positive semi-definite.
\end{theorem}
\textit{proof.} \\ The unnormalized magnetic Laplacian $\textbf{L}_{U}^{q}$ is a Hermitian matrix by its definition. Then, we have Imag($\textbf{x}^{\dagger}\textbf{L}_{U}^{q}\textbf{x}$)=0 where {$\textbf{x} \in \mathbb{C}^N $}. Now we show Real($\textbf{x}^{\dagger}\textbf{L}_{U}^{q}\textbf{x}$) $\geq 0$. The following derivation uses the definitions of $\textbf{D}_s$ and $\textbf{A}_s$.
\begin{flalign*}
& 2\text{Real}(\textbf{x}^{\dagger}\textbf{L}_{U}^{q}\textbf{x}) \\
= & 2\sum_{u,v=1}^{N}{\mathbf{D_s}}(u,v)\mathbf{x}(u)\overline{\mathbf{x}(v)}\\ & - 2\sum_{u,v=1}^{N}{\mathbf{A_s}}(u,v)\mathbf{x}(u)\overline{\mathbf{x}(v)}
\left[
    \frac{\text{cos}(i\Theta^{q}(uv)) + \text{cos}(i\overline{\Theta}^{q}(uv))}
    {\|\text{exp}(i\Theta^{q}(uv)) +\text{exp}
    (i\overline{\Theta}^{q}(uv))\|+ \epsilon}
\right]\\
= & 2\sum_{u=1}^{N}{\mathbf{D_s}}(u,u)\mathbf{x}(u)\overline{\mathbf{x}(u)}\\ & - 2\sum_{u,v=1}^{N}{\mathbf{A_s}}(u,v)\mathbf{x}(u)\overline{\mathbf{x}(v)}
\left[
    \frac{\text{cos}(i\Theta^{q}(uv)) + \text{cos}(i\overline{\Theta}^{q}(uv))}
    {\|\text{exp}(i\Theta^{q}(uv)) +\text{exp}
    (i\overline{\Theta}^{q}(uv))\|+ \epsilon}
\right]\\
\end{flalign*} 
\begin{flalign*}
= & 2\sum_{u,v=1}^{N}{\mathbf{A_s}}(u,v)\abs{\mathbf{x}(u)}^2\\ & - 2\sum_{u,v=1}^{N}{\mathbf{A_s}}(u,v)\mathbf{x}(u)\overline{\mathbf{x}(v)}
\left[
    \frac{\text{cos}(i\Theta^{q}(uv)) + \text{cos}(i\overline{\Theta}^{q}(uv))}
    {\|\text{exp}(i\Theta^{q}(uv)) +\text{exp}
    (i\overline{\Theta}^{q}(uv))\|+ \epsilon}
\right]\\
= & \sum_{u,v=1}^{N}{\mathbf{A_s}}(u,v)\abs{\mathbf{x}(u)}^2 + \sum_{u,v=1}^{N}{\mathbf{A_s}}(u,v)\abs{\mathbf{x}(v)}^2\\ & - 2\sum_{u,v=1}^{N}{\mathbf{A_s}}(u,v)\mathbf{x}(u)\overline{\mathbf{x}(v)}
\left[
    \frac{\text{cos}(i\Theta^{q}(uv)) + \text{cos}(i\overline{\Theta}^{q}(uv))}
    {\|\text{exp}(i\Theta^{q}(uv)) +\text{exp}
    (i\overline{\Theta}^{q}(uv))\|+ \epsilon}
\right]\\
= & \sum_{u,v=1}^{N}{\mathbf{A_s}}(u,v)
\left(
\abs{\mathbf{x}(u)}^2 +\abs{\mathbf{x}(v)}^2 -
2\mathbf{x}(u)\overline{\mathbf{x}(v)}
\left[
    \frac{\text{cos}(i\Theta^{q}(uv)) + \text{cos}(i\overline{\Theta}^{q}(uv))}
    {\|\text{exp}(i\Theta^{q}(uv)) +\text{exp}
    (i\overline{\Theta}^{q}(uv))\|+ \epsilon}
\right]
\right) \\
\geq & \sum_{u,v=1}^{N}{\mathbf{A_s}}(u,v) 
(\abs{\mathbf{x}(u)}^2 +\abs{\mathbf{x}(v)}^2 -
2\abs{\mathbf{x}(u)}\abs{\overline{\mathbf{x}(v)}}) \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \  \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \  \ \ \ \ \ \ \ \ \ \ \ \ \ \\
= & \sum_{u,v=1}^{N}{\mathbf{A_s}}(u,v) 
(\abs{\mathbf{x}(u)}-\abs{\mathbf{x}(v)})^2 \\
\geq & 0.
\end{flalign*} 
Thus, $\textbf{x}^{\dagger}\textbf{L}_{U}^{q}\textbf{x} \geq 0$ for all $\textbf{x} \in \mathbb{C}^N$, i.e., $\textbf{L}_{U}^{q}$ is positive semi-definite.

For the normalized magnetic Laplacian, $\textbf{L}_{N}^{q} = \textbf{D}_{s}^{-1/2}\textbf{L}_{U}^{q}\textbf{D}_{s}^{-1/2}$, we have
%We prove $\textbf{x}^{\dagger}\textbf{L}_{N}^{q}\textbf{x} \geq 0$ for $\textbf{x} \in \mathbb{C}^N $
\begin{flalign*}
\textbf{x}^\dagger\textbf{L}_{N}^{q}\textbf{x} 
& = \textbf{x}^\dagger\textbf{D}_{s}^{-1/2}\textbf{L}_{U}^{q}\textbf{D}_{s}^{-1/2}\textbf{x} \\
& =\textbf{y}^\dagger\textbf{L}_{U}^{q}\textbf{y} \\
& \geq 0.
\end{flalign*} 
where, $\textbf{y}=\textbf{D}_{s}^{-1/2}\textbf{x}$. \\
Thus, both unnormalized and normalized magnetic Laplacians are  positive semi-definite. 

%\subsection{Interval of the Normalized Magnetic Laplacian Eigenvalues}
\begin{theorem} For a signed directed graph $\mathcal{G} = (V, E, \textbf{\textit{S}})$, 
the eigenvalues of the normalized magnetic Laplacian $\textbf{L}_{N}^{q}$ lie in [0, 2].
\end{theorem}
\textit{proof.} \\
$\textbf{L}_{N}^{q}$ has non-negative and real eigenvalues since it is positive semi-definite by Theorem~1. Now, we show the eigenvalues are less than or equal to 2. Here, we use the Courant-Fischer theorem \citep{golub2013matrix},
\begin{flalign*}
\lambda_{N} 
& = \max_{\textbf{x}\neq0} \frac{\textbf{x}^{\dagger}\textbf{L}_{N}^{q}\textbf{x}}{\textbf{x}^{\dagger}\textbf{x}} \\
& = \max_{\textbf{x}\neq0} \frac{\textbf{x}^{\dagger}\textbf{D}_s^{-1/2}\textbf{L}_{U}^{q}\textbf{D}_s^{-1/2}\textbf{x}}{\textbf{x}^{\dagger}\textbf{x}} \\
& = \max_{\textbf{y}\neq0} \frac{\textbf{y}^{\dagger}\textbf{L}_{U}^{q}\textbf{y}}{\textbf{y}^{\dagger}\textbf{D}_{s}\textbf{y}}.
\end{flalign*} 
where, $\textbf{y}=\textbf{D}_{s}^{-1/2}\textbf{x}$. Since $\textbf{D}_s$ is diagonal, 
\begin{equation*}
\textbf{y}^\dagger\textbf{D}_s\textbf{y}=\sum_{u,v=1}^{N}{\textbf{D}_s(u,v)}\textbf{y}(u)\overline{\textbf{y}(v)} = \sum_{u=1}^{N}{\textbf{D}_s(u,u)\abs{\textbf{y}(u)}^2}.
\end{equation*}
Similar to Theorem 1, we have
\begin{flalign*}
&\textbf{y}^\dagger\textbf{L}_U^q\textbf{y}  \\
= & \frac{1}{2}\sum_{u,v=1}^N{\textbf{A}_s}(u,v)
    \left(\abs{\textbf{y}(u)}^2+\abs{\textbf{y}(v)}^2-2\textbf{y}(u)\overline{\textbf{y}(v)}
     \frac{\text{cos}(i\Theta^{q}(uv))+ \text{cos}(i\overline{\Theta}^{q}(uv))}
    {\|\text{exp}(i\Theta^{q}(uv)) + \text{exp}(i\overline{\Theta}^{q}(uv))\|+ \epsilon}
    \right)\\
\leq & \frac{1}{2}\sum_{u,v=1}^N{\textbf{A}_s}(u,v)
    \left(\abs{\textbf{y}(u)}^2+\abs{\textbf{y}(v)}^2+2\abs{\textbf{y}(u)}\abs{\textbf{y}(v)}\right) \\
\leq & \sum_{u,v=1}^N{\textbf{A}_s}(u,v)
    (\abs{\textbf{y}(u)}^2+\abs{\textbf{y}(v)}^2) \\
= & 2\sum_{u,v=1}^N{\textbf{A}_s}(u,v)\abs{\textbf{y}(u)}^2 \qquad  \text{(since}\; \textbf{A}_s \;\text{is symmetric)}\\
= & 2\sum_{u=1}^N{\abs{\textbf{y}(u)}^2}
    \left( \sum_{v=1}^{N}{\textbf{A}_s}(u,v)\right)  \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \  \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \  \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \\ 
= & 2\sum_{u=1}^N{\abs{\textbf{y}(u)}^2\textbf{D}_s(u,u)} \\
= & 2\textbf{y}^{\dagger}\textbf{D}_s\textbf{y}.
\end{flalign*}
Thus,
\begin{equation*}
    \lambda_N = 
     \max_{\textbf{y}\neq0} \frac{\textbf{y}^{\dagger}\textbf{L}_{U}^{q}\textbf{y}}
     {\textbf{y}^{\dagger}\textbf{D}_{s}\textbf{y}} \leq
     \max_{\textbf{y}\neq0} \frac{2\textbf{y}^{\dagger}\textbf{D}_s\textbf{y}}
     {\textbf{y}^{\dagger}\textbf{D}_{s}\textbf{y}} = 2.
\end{equation*}
Finally, the eigenvalues of the normalized magnetic Laplacian lie in $[0, 2]$.









\begin{proposition} Let $\mathcal{G}_1=(V,E_1)$ and $\mathcal{G}_2=(V,E_2)$ be directed graphs on the same vertex set. Then their union $\mathcal{G}=(V,E_1 \cup E_2)$ has entropy $H(\mathcal{G}) \leq H(\mathcal{G}_1) + H(\mathcal{G}_2)$.
\end{proposition}
\textit{proof.} \\ Let $p_1(x,y)$ and $p_2(x,y)$ be the distributions that minimize $I(X\wedge Y)$ for $\mathcal{G}_1$ and $\mathcal{G}_2$, respectively. Then we have a joint distribution with Bayes' rule
\begin{equation*}
    p(x,y_1,y_2)=p(x)\cdot p_1(y_1|x) \cdot p_2(y_2|x).    
\end{equation*}
For a given choice of $X$, observe that $Y_1 \cap Y_2$ contains $X$ and is an independent set in $\mathcal{G}$. Therefore,

\begin{flalign*}
H(\mathcal{G}) & \leq I(X \wedge (Y_1 \cap Y_2)) \\
& \leq I(X \wedge Y_1 , Y_2) \\
& = H(Y_1, Y_2) - H(Y_1,Y_2|X) \\
& = H(Y_1, Y_2) - H(Y_1|X) - H(Y_2|X) \\
& \leq H(Y_1) - H(Y_1|X) + H(Y_2) - H(Y_2|X) \\
& = H(\mathcal{G}_1)+H(\mathcal{G}_2).
\end{flalign*} 



\begin{theorem} The von Neumann entropy of a signed directed graph can be expressed via the entropies of two directed graphs.
\end{theorem}
\textit{proof.} \\ 
For a signed directed graph $\mathcal{G}=(V, E,\mathbf{S})$, we can split it into two directed graphs according to the edge type. Extract the positive edges from $E$ and $\mathbf{S}$, then construct a directed graph with node set $V$. Now we have a positive directed graph $\mathcal{G}^+ = (V, E^+)$. Similarly, we have a negative directed graph $\mathcal{G}^- = (V, E^-)$. Therefore, by Proposition 1,
\begin{equation*}
    H(\mathcal{G}) \leq  H(\mathcal{G}^+)+H(\mathcal{G}^-).
\end{equation*}



\begin{proposition} Let $\mathcal{G}=(V,E)$ and $\mathcal{F}=(V,E')$ be graphs with the same vertex set $V$, where $\mathcal{F}$ is a subgraph of $\mathcal{G}$, i.e., $E' \subset E$. 
Then $H(\mathcal{F}) \leq H(\mathcal{G})$.
\end{proposition}
\textit{proof.} \\ 
If $X, Y$ are random variables achieving $H(\mathcal{G})$, then $Y$ is also an independent set in $\mathcal{F}$. Therefore, $H(\mathcal{F}) \leq I(X \wedge Y) = H(\mathcal{G})$.

\begin{theorem}
    \textbf{Perturbation Error of a Signed Directed Graph} 
\end{theorem}
\textit{proof.} \\ By Definition 1, we have perturbation error of a graph as:
\begin{equation*}
    \Delta H(\mathcal{G},q, \Delta q) = H(\mathcal{G},q) - H(\mathcal{G},q+ \Delta q).
\end{equation*}
Since $H(\mathcal{G},q) \leq H(\mathcal{G}_D^+,q) +H(\mathcal{G}_D^-,q) $ and $H(\mathcal{G},q+ \Delta q) \leq H(\mathcal{G}_D^+,q+ \Delta q) +H(\mathcal{G}_D^-,q+ \Delta q) $, we have the following results. 
\begin{flalign*}
    \Delta H(\mathcal{G},q, \Delta q)  & \leq  H(\mathcal{G}_D^+,q) +H(\mathcal{G}_D^-,q) - H(\mathcal{G}_D^+,q+ \Delta q) - H(\mathcal{G}_D^-,q+ \Delta q)   \\
    & =  H(\mathcal{G}_D^+,q) - H(\mathcal{G}_D^+,q+ \Delta q)
    + H(\mathcal{G}_D^-,q)  - H(\mathcal{G}_D^-,q+ \Delta q)   \\
    & = \Delta H(\mathcal{G}_D^+,q, \Delta q) +\Delta H(\mathcal{G}_D^-,q, \Delta q)
\end{flalign*}
And by Proposition 2, 
\begin{flalign*}
    \Delta H(\mathcal{G}_D^+,q, \Delta q)  & \leq      \Delta H(\mathcal{G},q, \Delta q)\\
    \Delta H(\mathcal{G}_D^-,q, \Delta q)  & \leq      \Delta H(\mathcal{G},q, \Delta q)\\
\end{flalign*}
Therefore, the perturbation error of a signed directed graph is bounded from both below and above. 



\bibliography{ko_750}% uai2023-template}

\end{document}
