\begin{table*}[htbp]
% Slide-level results table.
% Layout: one row per method; for each of the four datasets (CAMELYON16,
% TCGA-NSCLC, PANDA, BRACS) there is a discrimination column (AUC, or
% $\kappa$ for PANDA) and an ACE column, followed by model size (Params, in M)
% and compute (FLOPs, in G).
% Cell format $.xxx_{.yyy}$: main value with a subscripted spread -- presumably
% mean and standard deviation over runs/folds; TODO confirm and state in caption.
% Emphasis: \mathbf = best in column, \underline = second best, computed over
% the active (uncommented) rows only; ties share the same marker.
% NOTE: \ours is not defined in this chunk; it is expected to come from the preamble.
\centering
\small
\setlength{\tabcolsep}{6pt}
% Trailing % keeps the line break from becoming a space inside the scaled box.
\resizebox{\textwidth}{!}{%
\begin{tabular}{lcccccccccc}
\toprule
 & \multicolumn{2}{c}{CAMELYON16}
 & \multicolumn{2}{c}{TCGA-NSCLC}
 & \multicolumn{2}{c}{PANDA}
 & \multicolumn{2}{c}{BRACS}
 & Params & FLOPs \\
\cmidrule(lr){2-3}
\cmidrule(lr){4-5}
\cmidrule(lr){6-7}
\cmidrule(lr){8-9}
& AUC & ACE
& AUC & ACE
& $\kappa$ & ACE
& AUC & ACE
& (M) & (G) \\
\midrule
%
ABMIL~\cite{ilse_attention-based_2018}
& $\mathbf{.987_{.005}}$ & $.036_{.004}$
& $.973_{.009}$ & $.039_{.008}$
& $.910_{.028}$ & $.044_{.015}$
& $\underline{.852_{.025}}$ & $\underline{.175_{.007}}$
& $.660$ & $1.31$ \\
%
CLAM~\cite{lu_data-efficient_2021}
& $\underline{.986_{.004}}$ & $.044_{.027}$
& $.953_{.004}$ & $.056_{.016}$
& $.927_{.025}$ & $.031_{.018}$
& $.850_{.021}$ & $.183_{.011}$
& $.920$ & $1.84$ \\
%
TransMIL~\cite{shao_transmil_2021}
& $.978_{.004}$ & $.044_{.012}$
& $.970_{.012}$ & $.046_{.019}$
& $.911_{.030}$ & $.043_{.021}$
& $.826_{.032}$ & $.186_{.012}$
& $2.67$ & $85.02$ \\
%
DGRMIL~\cite{zhu_dgr-mil_2025}
& $.967_{.018}$ & $.027_{.021}$
& $.974_{.011}$ & $\underline{.038_{.022}}$
& $.933_{.047}$ & $.036_{.025}$
& $.818_{.035}$ & $.186_{.023}$
& $4.34$ & $79.88$ \\
%
% PAMIL ties CLAM on CAMELYON16 AUC (.986), so it shares the second-best
% underline; its PANDA ACE (.026) is the second lowest in that column.
PAMIL~\cite{pamil}
& $\underline{.986_{.003}}$ & $.032_{.013}$
& $.970_{.015}$ & $.043_{.018}$
& $.941_{.060}$ & $\underline{.026_{.032}}$
& $.830_{.038}$ & $.193_{.018}$
& $.796$ & $1.32$ \\
%
BayesMIL~\cite{cui_bayes-mil_2023}
& $.975_{.006}$ & $\mathbf{.023_{.006}}$
& $.973_{.021}$ & $\mathbf{.033_{.017}}$
& $.926_{.031}$ & $.031_{.016}$
& $.829_{.022}$ & $.183_{.028}$
& $1.32$ & $2.63$ \\
%
% Rows below are intentionally disabled and are excluded from the
% best/second-best ranking.
% MixMIL    
% & $.979_{.007}$ & $.430_{.001}$
% & $.963_{.014}$ & $.410_{.025}$
% & $.870_{.028}$ & $.180_{.010}$
% & $.855_{.010}$ & $.254_{.002}$
% & $1.57$ & $1.05$ \\
%
% AGP       
% & $.910_{.023}$ & $.078_{.013}$
% & $.976_{.014}$ & $.048_{.025}$
% & $.906_{.047}$ & $.026_{.013}$
% & $.830_{.010}$ & $.134_{.014}$
% & $1.21$ & $2.87$ \\
%
% SGPMIL's PANDA ACE (.028) is third in its column (after .021 and .026),
% so it carries no emphasis.
SGPMIL~\cite{lolos_sgpmil_2025}
& $\mathbf{.987_{.008}}$ & $\underline{.026_{.009}}$
& $.973_{.014}$ & $.047_{.027}$
& $\mathbf{.955_{.037}}$ & $.028_{.022}$
& $\mathbf{.870_{.026}}$ & $\mathbf{.142_{.032}}$
& $1.21$ & $2.44$ \\
% booktabs rule (not \hline) so weight and spacing match the other rules.
\midrule
%
Mean
& $.693_{.046}$ & $.241_{.022}$
& $\mathbf{.979_{.015}}$ & $.041_{.019}$
& $.924_{.028}$ & $.035_{.013}$
& $.738_{.006}$ & $.223_{.015}$
& $\mathbf{.130}$ & $\mathbf{.260}$ \\
%
\textbf{\ours+Mean}
& $.975_{.006}$ & $.028_{.006}$
& $\underline{.978_{.016}}$ & $\mathbf{.033_{.021}}$
& $\underline{.944_{.053}}$ & $\mathbf{.021_{.024}}$
& $.850_{.031}$ & $.189_{.026}$
& $\underline{.314}$ & $\underline{.628}$ \\
%
\bottomrule
\end{tabular}%
}
\caption{Slide-level performance comparison across datasets. Results are reported as AUC ($\kappa$ for PANDA) and ACE. Best results are in bold and second-best results are underlined. FLOPs are measured per forward pass for a bag of 1000 patch embeddings at inference. Using a mean operator in the initial projection layer before classification (i.e., our approach without the block) leads to substantial performance degradation on datasets with large bag sizes, such as CAMELYON16 and BRACS.}
\label{tab:bag-level-performance_uni}
\end{table*}


