\begin{table*}
\centering
\caption{
In-distribution experiment with \texttt{Qwen2.5-7B} using different choices for the covariance of $q_{\btheta}(\s)$.
We report the mean and standard deviation of test-set performance over 3 training seeds.
}
\begin{tabular}{@{}ccc|cccccc@{}}
\toprule
\multirow{2}{*}{\textbf{Metric}} & \multirow{2}{*}{$\boldsymbol{\Sigma}$}  & \multirow{2}{*}{\textbf{Params (M)}} & \multicolumn{6}{c}{\textbf{Datasets}} \\ 
  &  & & \textbf{WG-S} & \textbf{ARC-C} & \textbf{ARC-E} & \textbf{WG-M} & \textbf{OBQA} & \textbf{BoolQ} \\
\midrule
\multirow{2}{*}{\textbf{ACC ($\uparrow$)}}
& Full Rank & $3.773$ & $77.93_{\pm 0.3}$ & $89.30_{\pm 0.5}$ & $96.48_{\pm 0.2}$ & $81.88_{\pm 0.5}$ & $91.73_{\pm 0.6}$ & $88.74_{\pm 0.1}$ \\
& Diagonal & $3.769$ & $78.64_{\pm 0.4}$ & $90.16_{\pm 0.8}$ & $96.26_{\pm 0.1}$ & $81.42_{\pm 0.3}$ & $90.90_{\pm 0.5}$ & $88.48_{\pm 0.1}$ \\
\midrule
\multirow{2}{*}{\textbf{ECE ($\downarrow$)}}
& Full Rank & $3.773$ & $13.25_{\pm 0.6}$ & $6.69_{\pm 0.6}$ & $2.65_{\pm 0.1}$ & $7.11_{\pm 0.2}$ & $2.61_{\pm 0.2}$ & $1.57_{\pm 0.2}$ \\
& Diagonal & $3.769$ & $8.88_{\pm 0.5}$ & $5.03_{\pm 0.9}$ & $1.78_{\pm 0.2}$ & $3.64_{\pm 0.2}$ & $2.43_{\pm 0.7}$ & $1.96_{\pm 0.3}$
\\
\midrule
\multirow{2}{*}{\textbf{NLL ($\downarrow$)}}
& Full Rank & $3.773$ & $0.67_{\pm 0.0}$ & $0.41_{\pm 0.0}$ & $0.14_{\pm 0.0}$ & $0.42_{\pm 0.0}$ & $0.23_{\pm 0.0}$ & $0.23_{\pm 0.0}$ \\
& Diagonal & $3.769$ & $0.51_{\pm 0.0}$ & $0.31_{\pm 0.0}$ & $0.11_{\pm 0.0}$ & $0.40_{\pm 0.0}$ & $0.23_{\pm 0.0}$ & $0.24_{\pm 0.0}$ \\

\bottomrule
\end{tabular}
\label{tab:qwen7B_cov}
\end{table*}