\begin{table*}[t]
  \centering
{%\footnotesize 
% \small
\fontsize{8}{9}\selectfont
% \vspace{-7mm}
\caption{%Graph CL under linear probe.
\alg vs baselines. Methods identified with $\dagger$ and $*$ are supervised methods and SSL methods for graphs under heterophily, respectively.
\alg achieves state-of-the-art performance under heterophily and comparable performance under homophily. 
% CL represents graph CL methods. SL represents graph supervised learning methods. -het represents the method focusing on heterophily graphs. 
}\label{tab:benchmark_baselines}
\vspace{-1mm}
{
  \begin{tabular} {c c c c| c c c c c c}
    \toprule
&\multicolumn{3}{c|}{Homophily}&\multicolumn{6}{c}{Heterophily}\\\midrule
&Cora & CiteSeer  & Pubmed& Actor & Chameleon & Squirrel  & Penn94 & Twitch-gamers & Genius \\
\toprule
% \hy{comment}
\multicolumn{1}{c|}{Hom.($\beta$)} & $.83$ & $.71$ & $.79$ & $.09$ & $.23$ & $.19$ & $.48$ & $.56$ & $.51$\\
\multicolumn{1}{c|}{Nodes} & 2,708 & 3,327 & 19,717 & 5,201 & 2,277 & 5,201 & 41,554 & 168,114 & 421,961\\
\multicolumn{1}{c|}{Edges} & 5,278 & 4,676 & 44,324 & 198,493 & 8,854 & 46,998 & 1,362,229 & 6,797,557 & 984,979\\
\multicolumn{1}{c|}{Classes} & 7 & 6 & 3 & 5 & 5 & 5 & 2 & 2 & 2\\
\midrule
\multicolumn{1}{c|}{\textbf{\alg}} & \ul{84.1} $\pm$ 1.0 & 70.1 $\pm$ 0.8 & 84.5 $\pm$ 0.4 & 34.0 $\pm$ 0.2 & \textbf{50.9} $\pm$ 1.0 & \textbf{42.9} $\pm$ 2.6 & \textbf{68.1} $\pm$ 3.5  & \textbf{67.0} $\pm$ 0.9 & \ul{84.3}$\pm$0.1 \\
% \multicolumn{1}{c|}{\textbf{\alg(no-aug)}} & 77.09 $\pm$ 1.7 & 64.34 $\pm$ 1.5 & \textbf{48.04} $\pm$ 3.1 & \textbf{33.44} $\pm$ 1.7 & \textbf{64.21} $\pm$ 11.2\\
\midrule
% \multicolumn{1}{c|}{Raw feature}  & 64.8 & 64.6 & 24.43  \\\midrule
 \multicolumn{1}{c|}{DGI}  & \textbf{84.5} $\pm$ 1.1 & \textbf{71.9}  $\pm$ 0.7 & 86.0 $\pm$ 0.1 & 28.0 $\pm$ 1.4 & 32.6 $\pm$ 2.9 & 38.8 $\pm$ 2.3 & 62.9 $\pm$ 0.4 & 61.5 $\pm$ 0.6 & OOM\\
\multicolumn{1}{c|}{BGRL} & 83.0 $\pm$ 0.7 & 69.8 $\pm$ 0.6 & 80.2 $\pm$ 0.6 & 28.3 $\pm$ 0.9 & 32.6 $\pm$ 4.7 & 35.7 $\pm$ 1.4 & 58.8 $\pm$ 0.6 & 60.9 $\pm$ 0.3 & 76.4$\pm$3.0\\
\multicolumn{1}{c|}{GRACE} & 83.7 $\pm$ 0.7 & 71.4 $\pm$ 1.0 & 86.7$\pm$0.1 & \ul{34.5} $\pm$ 1.1 & 35.4 $\pm$ 3.6 & 36.2 $\pm$ 2.8 & 62.5 $\pm$ 0.4 & 57.1 $\pm$ 0.1 & 	79.6$\pm$2.9 \\\midrule
\multicolumn{1}{c|}{SP-GCL$^*$} & 83.2 $\pm$ 0.1 & 72.0 $\pm$ 0.4 & 79.2 $\pm$ 0.7 & 27.7 $\pm$ 0.7 & 36.5 $\pm$ 1.9 & 33.7 $\pm$ 1.3 & - & 62.0 $\pm$ 0.2 & \textbf{90.1}$^*\!\!$ $\pm$ 0.2 \\
\multicolumn{1}{c|}{HGRL$^*$} & 82.1 $\pm$ 0.8 & 71.0 $\pm$ 0.7 & 84.2 $\pm$ 0.2 & 35.4 $\pm$ 0.9 & 43.9 $\pm$ 1.7 & 38.7 $\pm$ 1.7 & OOM & OOM & OOM \\\midrule\midrule
\multicolumn{1}{c|}{GCN$^\dagger$} & 82.3 $\pm$ 1.2 & 70.2 $\pm$ 0.9 & 86.4 $\pm$ 0.3 & 28.2 $\pm$ 0.4 & 40.9 $\pm$ 4.1 & 39.5 $\pm$ 1.5 & 82.5 $\pm$ 0.3 & 62.2 $\pm$ 0.3 & 87.4 $\pm$ 0.4 \\\midrule
\multicolumn{1}{c|}{MixHop$^\dagger$} & 81.0 $\pm$ 1.6 & 66.4 $\pm$ 1.7 & 85.1 $\pm$ 0.3 & 29.0 $\pm$ 1.0 & 33.8 $\pm$ 1.2 & 33.4 $\pm$ 1.6 & 83.5 $\pm$ 0.7 & 65.6 $\pm$ 0.3 & 90.6 $\pm$ 0.2 \\
\multicolumn{1}{c|}{H2GCN$^\dagger$} & 81.4 $\pm$ 1.2 & 71.8 $\pm$ 0.9 & 85.9 $\pm$ 0.4 & 33.6 $\pm$ 0.8 & 26.8 $\pm$ 3.6 & 35.1 $\pm$ 1.2 & OOM & OOM & OOM \\
\multicolumn{1}{c|}{GloGNN$^\dagger$} & \textbf{{88.3}}$^\dagger\!\!$ $\pm$ 1.1 & \textbf{{77.4}}$^\dagger\!\!$ $\pm$ 1.7 & \textbf{{89.6}}$^\dagger\!\!$ $\pm$ 0.4 & \textbf{{37.4}}$^\dagger\!\!$ $\pm$ 0.8 & 25.9 $\pm$ 3.6 & 35.1 $\pm$ 1.2 & \textbf{{85.6}}$^\dagger\!\!$ $\pm$ 0.4 & 66.4 $\pm$ 0.3 & \textbf{{90.7}}$^\dagger\!\!$ $\pm$ 0.1 \\
\multicolumn{1}{c|}{CPGNN$^\dagger$} & 83.6 $\pm$ 1.3 & 72.0 $\pm$ 0.5 & 86.7 $\pm$ 0.2 & 35.6 $\pm$ 0.9 & 33.0 $\pm$ 3.2 & 30.0 $\pm$ 2.0 & OOM & OOM & OOM \\
\bottomrule
\end{tabular}
}
}%\vspace{-5mm}
\end{table*}
% \vspace{-2mm}
\section{Experiments}%
% \vspace{-1mm}
In this section, we 
evaluate the node representations learned with \alg, under linear probe. We compare \alg with existing graph CL, graph SSL and graph supervised learning methods, and conduct an extensive ablation study to evaluate the effect of each of \alg's components.

\noindent\textbf{Datasets.} 
We consider nine widely used public benchmark datasets with different homophily ratios, $\beta$. The details of the datasets are shown in Sec.~\ref{sec:dataset}. We repeat the experiments 10 times for the smaller benchmark datasets and 3 times for the large real-world datasets, and report the early-stopped average accuracy as the final result. For small graphs, we follow CPGNN \citep{zhu2020graph}, GRACE \citep{zhu2020deep}, and HGRL \citep{chen2022towards} and randomly select 10\% of nodes for training, 10\% of nodes for validation, and 80\% of nodes for testing. For large graphs, following~\citep{lim2021large}, we randomly select 25\% of nodes for training, 25\% of nodes for validation, and 50\% of nodes for testing. %\looseness=-1

\noindent
\textbf{Linear Probe Evaluation.}
For SSL methods, we follow the evaluation protocol used in~\citep{zhu2020deep}. Models are first trained in a self-supervised manner without labels. Then, we feed the final node embeddings into an $\ell_2$-regularized logistic regression classifier to fit the labeled data. 

% \vspace{-0mm}
\vspace{-2mm}
\subsection{Results}
\vspace{-1mm}
\noindent\textbf{\alg vs Self-supervised Baselines.} 
We compare \alg with existing baselines for self-supervised representation learning.
We consider general graph self-supervised learning methods like DGI~\citep{velickovic2019deep}, BGRL~\citep{thakoor2021large}, and GRACE~\citep{zhu2020deep}, as well as graph self-supervised learning methods that focus on learning under heterophily like HGRL~\citep{chen2022towards} and SP-GCL~\citep{wang2022can}. In addition, we include popular general graph supervised learning methods like GCN~\citep{kipf2016semi}, and graph supervised learning methods targeting graphs under heterophily like MixHop, H2GCN, GloGNN, and CPGNN \citep{abu2019mixhop,zhu2020beyond,zhu2021graph,li2022finding}. We record the hyperparameters for our experiments in Sec.~\ref{sec:hype}.
Table~\ref{tab:benchmark_baselines} shows that \alg{} achieves a significant boost on graphs with heterophily and comparable performance on graphs with homophily compared to the popular graph CL methods, showing up to a 7\% performance boost on Chameleon and a 5\% boost on Penn94.
Compared to supervised methods such as H2GCN trained in an end-to-end manner, \alg achieves comparable performance under homophily and superior performance on heterophilic graphs like Chameleon (by 10\%) and Squirrel (by 3\%). This confirms the effectiveness of \alg. 

\begin{figure}[!t]
  \centering
  \begin{subfigure}[b]{0.48\columnwidth}
    \includegraphics[width=\linewidth]{IJCAI/Fig/chameleon_spectrum_updated.png}
    \caption{Chameleon}
    \label{fig:chameleon_spectrum}
  \end{subfigure}
  \hfill
  \begin{subfigure}[b]{0.48\columnwidth}
    \includegraphics[width=\linewidth]{IJCAI/Fig/chameleon_alignment_updated.png}
    \caption{Chameleon}
    \label{fig:chameleon_alignment}
  \end{subfigure}
  \begin{subfigure}[b]{0.48\columnwidth}
    \includegraphics[width=\linewidth]{IJCAI/Fig/citeseer_spectrum_updated.png}
    \caption{Citeseer}
    \label{fig:citeseer_spectrum}
  \end{subfigure}
  \hfill
  \begin{subfigure}[b]{0.48\columnwidth}
    \includegraphics[width=\linewidth]{IJCAI/Fig/citeseer_alignment_updated.png}
    \caption{Citeseer}
    \label{fig:citeseer_alignment}
  \end{subfigure}
  % Shared caption and label for the merged figure
  \vspace{-1mm}
  \caption{GRACE vs \alg representations. (a), (c) distribution of eigenvalues in the representation matrix. (b), (d) alignment of the labels with the eigenvectors of the representation matrix.% In both (a) and (c), the representations exhibit eigenvalues at 1, resulting in an overlap.
  \alg produces higher quality representations with lower rank and higher alignment with the label vector.
  }
  \label{fig:sp_alg_combined}
  \vspace{-4mm}
\end{figure}
\textbf{\alg learns superior representations under heterophily. }\label{sec:spectrum_study}
Next, we compare the quality of representations learned by \alg with that of GRACE, which only uses the low-pass filter for graph CL.
% demonstrate the superiority of \alg in generating meaningful representations for heterophilic graphs by contrasting both the high-pass graph views and the low-pass filtered graph views. 
% This approach differs from traditional GCL methods like GRACE \citep{zhu2020deep}, which utilize only low-pass filtered views. 
We study Chameleon, a popular heterophily dataset~\citep{platonov2023critical}, and Citeseer, a well-known homophily dataset~\citep{yang2016revisiting}. 
% Following %a similar approach to 
% ~\citep{xue2022investigating}, 
% We compare the spectra of representations to evaluate the quality of representations for GRACE and \alg, by comparing the spectrum of their representation matrices.
Fig.~\ref{fig:sp_alg_combined} compares the distribution of normalized eigenvalues of the representation matrices and the alignment of their eigenvectors with the label vector.
Lower-rank representations whose prominent eigenvectors are better aligned with the label vector yield superior performance \citep{xue2022investigating}.
% The representation matrix is the Jacobian of
% that is the Jacobian of the linear probe trained on the learned representations. 
% \hy{after training with \alg, we train a linear model using the learned representations and the available labels to classify the nodes. That is the linear model $f$ can be written as $f=W^TX$, where $X$ are \alg representations and $W$ is the weight of the linear model. For this linear model, the Jacobian matrix is $X$, which includes all partial derivatives of f w.r.t $W$. We conduct a spectral analysis on the Jacobian matrix of \alg, and compare this with GRACE ~\citep{zhu2020deep}. }
% To align the spectra more effectively, we normalize the eigenvalues into the range (0,1). %Fig. \ref{fig:sp_alg_combined} illustrates this comparison. 
Fig. \ref{fig:chameleon_spectrum} 
% compares the distribution of normalized eigenvalues, 
%\alg's representation diminishes the smaller eigenvalues of the Jacobian, leading to
confirms that \alg's representations of Chameleon (heterophily) have a lower-rank structure compared to those of GRACE. %This reduction in noise enhances the output representation. 
Fig. \ref{fig:chameleon_alignment} further confirms %the %superiority of \alg's representation on heterophily graphs by demonstrating 
a strong alignment between the eigenvectors of the representation matrix and the label vector. Both factors contribute to the higher classification accuracy of \alg compared to GRACE. On the other hand, on Citeseer (homophily), \alg exhibits a similar, only slightly higher-rank %Jacobian low-rank structure
% eigen and alignment between the eigenvectors and clean label vectors
spectrum than GRACE. Thus, contrasting the low-pass and high-pass views does not significantly harm performance under homophily. 