\begin{table}[t]
\centering
\caption{Neuron similarity statistics for homogeneously trained networks (GELU activation).
\textbf{Top:} Distances averaged over all neurons.
\textbf{Middle:} Distances averaged over the 80\% of neurons with the smallest distances.
\textbf{Bottom:} Difference between the top and middle blocks (top minus middle), quantifying the contribution of the 20\% most isolated neurons.
Both models were trained on the full MNIST training set.}
\label{tab:neuron_similarity_homogeneous}
\small
\begin{tabular}{@{}l cccc cccc@{}}
\toprule
& \multicolumn{4}{c}{\textbf{Nearest Neighbor Distance}} & \multicolumn{4}{c}{\textbf{Mean Distance to All}} \\
\cmidrule(lr){2-5} \cmidrule(lr){6-9}
& \multicolumn{2}{c}{Within} & \multicolumn{2}{c}{Across} & \multicolumn{2}{c}{Within} & \multicolumn{2}{c}{Across} \\
\cmidrule(lr){2-3} \cmidrule(lr){4-5} \cmidrule(lr){6-7} \cmidrule(lr){8-9}
Layer & A & B & A{\footnotesize$\to$}B & B{\footnotesize$\to$}A & A & B & A{\footnotesize$\to$}B & B{\footnotesize$\to$}A \\
\midrule
\multicolumn{9}{@{}l}{\textit{All neurons}} \\
1 & 33.8 & 34.4 & 32.3 & 32.3 & 58.7 & 60.6 & 59.4 & 59.4 \\
2 & 26.7 & 27.1 & 27.4 & 26.5 & 55.0 & 58.2 & 56.5 & 56.5 \\
3 & 26.1 & 27.4 & 26.8 & 28.4 & 60.4 & 62.9 & 61.7 & 61.7 \\
\midrule
\multicolumn{9}{@{}l}{\textit{80\% least isolated neurons}} \\
1 & 30.7 & 30.9 & 29.2 & 29.3 & 54.6 & 56.0 & 55.6 & 54.6 \\
2 & 24.1 & 23.6 & 24.6 & 23.0 & 51.6 & 54.1 & 53.1 & 52.4 \\
3 & 22.7 & 24.3 & 23.7 & 25.2 & 56.6 & 59.6 & 58.2 & 57.9 \\
\midrule
\multicolumn{9}{@{}l}{\textit{Difference (isolated neuron contribution)}} \\
1 & 3.1 & 3.5 & 3.1 & 3.0 & 4.0 & 4.6 & 3.8 & 4.8 \\
2 & 2.6 & 3.5 & 2.8 & 3.5 & 3.4 & 4.1 & 3.4 & 4.1 \\
3 & 3.3 & 3.1 & 3.1 & 3.2 & 3.8 & 3.3 & 3.5 & 3.8 \\
\bottomrule
\end{tabular}
\end{table}
