\section{Background}
\label{sec:background}
Let \(\mathcal{G} = (V,E,w)\) be a (possibly directed) graph with \(N\) vertices, \(M\) edges and weight function \(w: V \times V \rightarrow \mathbb{R}_{\geq 0}\). For any edge \(e = (u,v) \in E\), we write the weight of \(e\) as \(w_{uv}\) or \(w_e\). For an undirected graph \(\mathcal{G}\), we denote the degree of vertex \(u\) by \(d(u) = \sum_{v \in V} w_{uv}\). If \(\mathcal{G}\) is directed, we define the in-degree and out-degree of vertex \(u\) as \(d_{\text{in}}(u) = \sum_{v \in V} w_{vu}\) and \(d_{\text{out}}(u) = \sum_{v \in V} w_{uv}\). The degree of vertex \(u\) in this case is \(d(u) = d_{\text{in}}(u) + d_{\text{out}}(u)\).
For any two sets \(S,T \subseteq V\), we define the cut value \(w(S,T) = \sum_{\substack{(u,v) \in E \\ u \in S, v \in T}} w_{uv}\) and the volume of \(S \subset V\) as \(\text{vol}(S) = \sum_{u \in S} d(u)\).

We define the conductance of \(\emptyset \ne S \subset V\) as
\[
\Phi(S) = \frac{w(S,V-S)}{\text{vol}(S)}.
\]
A \(k\)-way partition of \(V\) is a collection of \(k\) non-empty subsets \(S_1, \hdots, S_k \subset V\) where \(S_i \cap S_j = \emptyset\) for \(i \neq j\) and \(\bigcup_{i=1}^k S_i = V\).
For undirected graphs, we measure the quality of a partition by the \(k\)-way expansion:
\[
\Phi(S_1,\dots,S_k) = \max_{1 \leq i \leq k} \Phi(S_i).
\]
The \(k\)-way expansion constant of $\mathcal{G}$ \cite{lee2014multiway} is defined as
\[
\rho(k) = \min_{\text{partition } S_1, \hdots, S_k} \Phi(S_1,\dots,S_k).
\]


Spectral clustering leverages eigenvalues and eigenvectors of Hermitian matrices associated with the graph. The adjacency matrix \(A \in \mathbb{R}^{N \times N}\) of an undirected graph \(\mathcal{G} = (V,E,w)\) is defined as $A_{uv} = w_{uv}$ if $(u,v) \in E$ and zero otherwise.
% \[
% A_{uv} = \begin{cases}
% w_{uv} & \text{if } (u,v) \in E, \\
% 0 & \text{otherwise}.
% \end{cases}
% \]
When \(\mathcal{G}\) is directed, we will use the Hermitian adjacency matrix as defined in \cite{cucuringu2020hermitian}:
\begin{equation}
A_{uv} = \begin{cases}
    w_{uv}\exp\left(2 \pi \mathrm{i}/\tilde{k}\right) & \text{ if } u \rightarrow v,  \\
    w_{vu}\exp\left(-2 \pi \mathrm{i}/\tilde{k}\right) & \text{ if } u \leftarrow v, \label{eq:adjdig}\\
    0 & \text{ otherwise}
\end{cases}
\end{equation}
where $\mathrm{i}$ is the imaginary unit and the value \(\tilde{k}\) must be prescribed. Throughout our paper we will assume for simplicity that, for a directed graph, $(u,v) \in E \implies (v,u) \not\in E$.
The following definitions all apply to both undirected and directed graphs using each respective adjacency matrix.

The degree matrix \(D \in \mathbb{R}^{N \times N}\) is a diagonal matrix where each diagonal entry equals the degree of a vertex: $D_{uu} = d(u)$.
The Laplacian matrix \(L \in \mathbb{C}^{N \times N}\) is defined as $L = D - A$, while the normalized Laplacian matrix \(\mathcal{L} \in \mathbb{C}^{N \times N}\) is defined as
$
\mathcal{L} = D^{-1/2} L D^{-1/2} = I - D^{-1/2} A D^{-1/2}$.%,
%where \(I\) is the identity matrix.

We will use \(M \in \mathbb{C}^{N \times N}\) to denote any 
 Hermitian positive semidefinite matrix representation of a graph. We will denote its eigenvectors by \(f_1, \hdots, f_N \in \mathbb{C}^N\) with corresponding eigenvalues \( \lambda_1 \leq \hdots \leq \lambda_N \). We will write the eigendecomposition of $M$ as $M = F \Delta F^*$ with $F=(f_1 \, f_2 \, \cdots \, f_N)$ and $\Delta = \text{diag}(\lambda_1, \hdots, \lambda_N)$.
 
 
% \begin{align*} 
% M = F \Delta F^*, \qquad
% F = \begin{pmatrix}
%     | &  & | \\
%     f_1 & \hdots & f_N \\
%     | &  & |
% \end{pmatrix}, \qquad
% \Delta = \text{diag}(\lambda_1, \hdots, \lambda_N)
% \end{align*}

Given a basis of orthonormal vectors \(g_1, \hdots, g_N \in \mathbb{C}^N\), we denote their Rayleigh quotients by \(\gamma_i = g_i^* M g_i\), with \(\gamma_1 \leq \hdots \leq \gamma_N\). We assemble these vectors in a matrix \(G \in \mathbb{C}^{N \times N}\).

There are many variants of spectral clustering in the literature. Our results are quite general and will apply to most of these variants. For simplicity, we will consider the variant defined in Algorithm~\ref{alg:spectral}, which is the one considered in~\cite{peng2015partitioning}. For undirected graphs, we typically choose $\tilde{k} = k$ and $M = \mathcal{L}$, which has real eigenvectors. The third step of Algorithm~\ref{alg:spectral} (the degree rescaling of $F$) is optional and typically depends on the matrix representation used; for example, it is needed when $M$ is the normalised Laplacian $\mathcal{L}$, but not when $M$ is the combinatorial Laplacian $L$.
\vspace{-0.1cm}
\begin{algorithm}[h!]
\begin{algorithmic}[1]
%\Procedure{Spectral Clustering}{}
    \State \textbf{Input:} $\mathcal{G}=(V,E,w),M \in \mathbb{C}^{|V| \times |V|},k \ge 2,\tilde{k}\le k$
    \State Compute the matrix $F \in \mathbb{C}^{|V| \times \tilde{k}}$ whose columns are the orthonormal eigenvectors $f_1,\dots,f_{\tilde{k}}$ associated to $\lambda_1 \le \cdots \le \lambda_{\tilde{k}}$.
    \State $\tilde{F} \gets D^{-1/2} F$
    \State Minimise the following $k$-means objective:
    \[
        \min_{c_1,\dots,c_k \in \mathbb{C}^{\tilde{k}}} \sum_{u \in V} d(u) \min_{1 \le i \le k} \|\tilde{F}_{u,\colon} - c_i \|_2^2
    \]
    \State \textbf{Output:} partition $A_1,\dots,A_k$ corresponding to the solution of the above $k$-means problem.
\end{algorithmic}
\caption{Spectral Clustering}
\label{alg:spectral}
\end{algorithm}




