% Dataset statistics table: one group of rows per dataset, one row per class label.
% Columns: dataset name, integer class label, diagnosis abbreviation, and WSI counts.
% Only the Appendiceal Cancer rows give separate Site 1 / Site 2 counts; every other
% dataset uses a single count spanning both count columns.
% Requires the booktabs (\toprule, \midrule, \cmidrule, \bottomrule) and multirow packages.
\begin{table}[ht]
\centering
\scriptsize
\caption{Dataset statistics for Appendiceal Cancer, TCGA-NSCLC, TCGA-ESCA and BRACS. WSIs passing quality control are included. For the TCGA cohorts, slides with missing or ambiguous histologic labels were excluded.}
\label{tab:dataset_stats}
% No vertical rules: they do not join cleanly with booktabs' padded horizontal rules.
% @{} strips the outer column padding so the rules end flush with the text.
\begin{tabular}{@{}lclcc@{}}
  \toprule
  \multirow{2}{*}{\textbf{Dataset}} & \multirow{2}{*}{\textbf{Label}} & \multirow{2}{*}{\textbf{Diagnosis}} &
  \multicolumn{2}{c}{\textbf{Number of WSIs}} \\
  % Partial rule groups the two site sub-headers under the spanning header.
  \cmidrule(l){4-5}
  & & & \textbf{Site 1} & \textbf{Site 2} \\
  % -------- Appendiceal Cancer (split by Site) ----------
  \midrule
  \multirow{2}{*}{Appendiceal Cancer}
  & 0 & LAMN & 74 & 22 \\
  & 1 & MAC  & 40 & 5  \\
  % -------- TCGA-NSCLC ----------
  \midrule
  \multirow{2}{*}{TCGA-NSCLC}
  & 0 & LUAD & \multicolumn{2}{c}{496} \\
  & 1 & LUSC & \multicolumn{2}{c}{490} \\
  % -------- TCGA-ESCA ----------
  \midrule
  \multirow{2}{*}{TCGA-ESCA}
  & 0 & EAC  & \multicolumn{2}{c}{63} \\
  & 1 & ESCC & \multicolumn{2}{c}{90} \\
  % -------- BRACS ----------
  \midrule
  \multirow{7}{*}{BRACS}
  & 0 & N    & \multicolumn{2}{c}{34}  \\
  & 1 & PB   & \multicolumn{2}{c}{142} \\
  & 2 & UDH  & \multicolumn{2}{c}{70}  \\
  & 3 & ADH  & \multicolumn{2}{c}{46}  \\
  & 4 & FEA  & \multicolumn{2}{c}{41}  \\
  & 5 & DCIS & \multicolumn{2}{c}{61}  \\
  & 6 & IC   & \multicolumn{2}{c}{132} \\
  \bottomrule
\end{tabular}
\end{table}