% Results table: one row per (dataset, model, method). For each of the two
% alpha levels (0.25 and 0.30) it reports Miscov., APSS, NS and NAR; the
% arrows in the header mark the preferred direction of each metric.
% Bold entries are reproduced exactly as in the source data (they appear to
% mark the lowest APSS / NS within each dataset--model group).
%
% Requires booktabs (\toprule, \midrule, \cmidrule, \bottomrule) and multirow.
% \methodname is not defined here; the including document must provide it.
%
% Maintenance notes:
%  * Rows starting with `%' are kept for reference but are not typeset.
%  * Each \multirow row count equals the number of ACTIVE rows in its group;
%    adjust the count when (un)commenting rows.
%  * `--' marks a missing value.
\begin{tabular}{lllrrrrrrrr}
  \toprule
  & & & \multicolumn{4}{c}{$\alpha=0.25$} & \multicolumn{4}{c}{$\alpha=0.30$} \\
  % Tie each alpha header to its four metric columns.
  \cmidrule(lr){4-7} \cmidrule(lr){8-11}
  Dataset & Model & Method
    & Miscov.~$\downarrow$ & APSS~$\downarrow$ & NS~$\downarrow$ & NAR~$\uparrow$
    & Miscov.~$\downarrow$ & APSS~$\downarrow$ & NS~$\downarrow$ & NAR~$\uparrow$ \\
  \midrule
  % ---------------------------------------------------------------- DS1000
  \multirow[t]{2}{*}{DS1000}
    & GPT 4o Mini                     & \texttt{\methodname-HS}      & 0.25 & \textbf{3.06}  & \textbf{20.41} & 0.60 & 0.30 & \textbf{3.05} & \textbf{19.06} & 0.68 \\
  \cmidrule{2-11}
    & Gemma 2 27b                     & \texttt{\methodname-HS}      & 0.25 & \textbf{6.73}  & \textbf{12.73} & 0.47 & 0.29 & \textbf{6.26} & \textbf{12.02} & 0.53 \\
  \midrule
  % ------------------------------------------------------------------- GSM
  \multirow[t]{10}{*}{GSM}
    & \multirow[t]{3}{*}{GPT 4o Mini} & \texttt{CLM\ Sum}            & 0.15 & 1.98           & 2.91           & 0.71 & 0.24 & 1.11          & 1.17           & 1.00 \\
    &                                 & \texttt{\methodname-HS}      & 0.21 & 1.47           & 1.48           & 1.00 & 0.22 & 1.29          & 1.30           & 1.00 \\
    &                                 & \texttt{\methodname-L}       & 0.22 & \textbf{1.00}  & \textbf{1.00}  & 1.00 & 0.22 & \textbf{1.00} & \textbf{1.00}  & 1.00 \\
  \cmidrule{2-11}
    & \multirow[t]{3}{*}{Llama 3 8B}  & \texttt{CLM\ Max}            & 0.12 & 13.65          & 24.76          & 0.56 & 0.22 & 10.97         & 23.45          & 0.94 \\
  % &                                 & \texttt{CLM\ Sum}            & 0.11 & 13.92          & 24.16          & 0.50 & 0.23 & 11.16         & 23.03          & 0.95 \\
    &                                 & \texttt{\methodname-HS}      & 0.24 & \textbf{11.39} & \textbf{12.12} & 1.00 & 0.29 & \textbf{6.98} & \textbf{7.27}  & 1.00 \\
    &                                 & \texttt{\methodname-L}       & 0.22 & 12.78          & 13.68          & 1.00 & 0.26 & 7.88          & 8.27           & 1.00 \\
  \cmidrule{2-11}
    & \multirow[t]{4}{*}{Phi 2}       & \texttt{CLM\ Max}            & --   & --             & --             & --   & 0.05 & 16.60         & 22.91          & 0.19 \\
    &                                 & \texttt{CLM\ Sum}            & --   & --             & --             & --   & 0.06 & 16.51         & 21.26          & 0.21 \\
    &                                 & \texttt{\methodname-HS}      & 0.25 & \textbf{15.79} & \textbf{17.63} & 0.94 & 0.30 & \textbf{9.86} & \textbf{10.56} & 0.99 \\
    &                                 & \texttt{\methodname-L}       & 0.05 & 21.83          & 25.00          & 0.20 & 0.27 & 14.27         & 15.90          & 1.00 \\
  \midrule
  % ------------------------------------------------------------------ MBPP
  \multirow[t]{10}{*}{MBPP}
    & \multirow[t]{3}{*}{GPT 4o Mini} & \texttt{CLM\ Max}            & 0.08 & 1.04           & 1.76           & 0.38 & 0.15 & 1.02          & 1.38           & 0.65 \\
  % &                                 & \texttt{CLM\ Sum}            & 0.10 & 1.67           & 2.54           & 0.46 & 0.16 & 1.27          & 1.49           & 0.74 \\
    &                                 & \texttt{\methodname-HS}      & 0.19 & \textbf{1.00}  & 1.00           & 1.00 & 0.19 & \textbf{1.00} & 1.00           & 1.00 \\
    &                                 & \texttt{\methodname-L}       & 0.18 & 1.03           & \textbf{1.00}  & 1.00 & 0.18 & 1.03          & \textbf{1.00}  & 1.00 \\
  \cmidrule{2-11}
    & \multirow[t]{4}{*}{Llama 3 8B}  & \texttt{CLM\ First-K}        & --   & --             & --             & --   & 0.02 & 7.13          & 12.16          & 0.07 \\
  % &                                 & \texttt{CLM\ First-K\ (nr)}  & --   & --             & --             & --   & 0.04 & 12.12         & 12.12          & 0.16 \\
    &                                 & \texttt{CLM\ Sum}            & --   & --             & --             & --   & 0.02 & 8.45          & 13.40          & 0.06 \\
    &                                 & \texttt{\methodname-HS}      & 0.24 & 7.06           & 11.19          & 0.99 & 0.29 & \textbf{3.82} & \textbf{4.78}  & 1.00 \\
    &                                 & \texttt{\methodname-L}       & 0.18 & \textbf{6.78}  & \textbf{10.71} & 0.70 & 0.27 & 4.13          & 5.70           & 1.00 \\
  \cmidrule{2-11}
    & \multirow[t]{3}{*}{Phi 2}       & \texttt{CLM\ First-K\ (nr)}  & --   & --             & --             & --   & 0.02 & 19.57         & 19.57          & 0.07 \\
    &                                 & \texttt{\methodname-HS}      & 0.23 & \textbf{8.37}  & \textbf{16.97} & 0.95 & 0.28 & 4.39          & 7.28           & 0.98 \\
    &                                 & \texttt{\methodname-L}       & 0.06 & 10.96          & 22.56          & 0.21 & 0.26 & \textbf{4.25} & \textbf{6.46}  & 0.90 \\
  \midrule
  % ------------------------------------------------------------------ Math
  \multirow[t]{3}{*}{Math}
    & \multirow[t]{3}{*}{GPT 4o Mini} & \texttt{CLM\ First-K}        & 0.22 & 13.73          & 16.61          & 0.99 & 0.27 & 8.25          & 9.22           & 1.00 \\
  % &                                 & \texttt{CLM\ First-K\ (nr)}  & 0.22 & 14.81          & 14.81          & 0.99 & 0.27 & 8.52          & 8.52           & 1.00 \\
  % &                                 & \texttt{CLM\ Max}            & 0.22 & 14.14          & 23.53          & 0.99 & 0.27 & 11.02         & 18.62          & 1.00 \\
  % &                                 & \texttt{CLM\ Sum}            & 0.22 & 14.55          & 16.53          & 0.99 & 0.27 & 10.03         & 12.03          & 1.00 \\
    &                                 & \texttt{\methodname-HS}      & 0.24 & \textbf{9.17}  & \textbf{9.20}  & 0.98 & 0.29 & \textbf{6.74} & \textbf{6.75}  & 1.00 \\
    &                                 & \texttt{\methodname-L}       & 0.23 & 11.74          & 11.80          & 1.00 & 0.28 & 7.08          & 7.10           & 1.00 \\
  \midrule
  % -------------------------------------------------------------- TriviaQA
  \multirow[t]{8}{*}{TriviaQA}
    & GPT 4o Mini                     & \texttt{\methodname-HS}      & 0.24 & \textbf{1.40}  & \textbf{21.85} & 0.86 & 0.30 & \textbf{1.27} & \textbf{7.94}  & 0.94 \\
  \cmidrule{2-11}
    & \multirow[t]{6}{*}{Llama 3 8B}  & \texttt{CLM\ First-K}        & 0.24 & 5.75           & 5.75           & 1.00 & 0.28 & 1.06          & \textbf{1.07}  & 1.00 \\
    &                                 & \texttt{CLM\ First-K\ (nr)}  & 0.24 & 5.72           & 5.72           & 1.00 & 0.28 & 1.08          & 1.08           & 1.00 \\
    &                                 & \texttt{CLM\ Max}            & 0.24 & \textbf{1.42}  & 8.24           & 1.00 & 0.28 & \textbf{1.00} & 1.08           & 1.00 \\
    &                                 & \texttt{CLM\ Sum}            & 0.24 & 3.82           & \textbf{4.83}  & 1.00 & 0.28 & 1.06          & 1.09           & 1.00 \\
    &                                 & \texttt{\methodname-HS}      & 0.26 & 1.51           & 9.60           & 1.00 & 0.29 & 1.15          & 1.90           & 1.00 \\
    &                                 & \texttt{\methodname-L}       & 0.25 & 1.55           & 11.70          & 1.00 & 0.29 & 1.17          & 2.00           & 1.00 \\
  \cmidrule{2-11}
    & Phi 2                           & \texttt{\methodname-HS}      & 0.24 & \textbf{1.94}  & \textbf{20.70} & 0.59 & 0.29 & \textbf{2.02} & \textbf{19.96} & 0.65 \\
  \bottomrule
\end{tabular}

