% Results table: one row per (dataset, model, method) combination.
% Columns 4-7 hold the four metrics for alpha = 0.25, columns 8-11 the same
% four metrics for alpha = 0.30. Arrows in the header give the preferred
% direction of each metric.
% Requires booktabs (\toprule, \midrule, \cmidrule, \bottomrule) and multirow.
% \methodname is expected to be defined elsewhere in the document.
% A "-" cell has no reported value (presumably the method produced no result
% at that alpha -- TODO confirm against the experiment logs).
% NOTE(review): \textbf markings are copied verbatim from the original table;
% the selection rule (best per model group?) is not visible here -- confirm.
\begin{tabular}{lllrrrrrrrr}
  \toprule
  & & & \multicolumn{4}{c}{$\alpha=0.25$} & \multicolumn{4}{c}{$\alpha=0.30$} \\
  \cmidrule(lr){4-7} \cmidrule(lr){8-11}
  Dataset & Model & Method & Miscov.~$\downarrow$ & APSS~$\downarrow$ & NS~$\downarrow$ & NAR~$\uparrow$ & Miscov.~$\downarrow$ & APSS~$\downarrow$ & NS~$\downarrow$ & NAR~$\uparrow$ \\
  \midrule
  % ---- DS1000 (2 rows) ----
  \multirow[t]{2}{*}{DS1000}   & GPT 4o Mini                     & \texttt{\methodname-HS}     & 0.26   & 2.94           & 20.40          & \textbf{0.58} & 0.31   & 2.94           & 19.38          & \textbf{0.67} \\
  \cmidrule{2-11}
                               & Gemma 2 27b                     & \texttt{\methodname-HS}     & 0.18   & \textbf{8.00}  & \textbf{16.86} & \textbf{0.38} & 0.22   & \textbf{7.00}  & \textbf{14.92} & \textbf{0.44} \\
  \midrule
  % ---- GSM (10 rows: 3 + 3 + 4) ----
  \multirow[t]{10}{*}{GSM}     & \multirow[t]{3}{*}{GPT 4o Mini} & \texttt{CLM\ Sum}           & 0.15   & 1.98           & 2.91           & 0.71          & 0.24   & 1.11           & 1.17           & \textbf{1.00} \\
                               &                                 & \texttt{\methodname-HS}     & 0.23   & \textbf{1.45}  & \textbf{1.46}  & \textbf{1.00} & 0.23   & 1.34           & 1.35           & \textbf{1.00} \\
                               &                                 & \texttt{\methodname-L}      & 0.21   & 1.98           & 2.00           & \textbf{1.00} & 0.23   & \textbf{1.00}  & \textbf{1.00}  & \textbf{1.00} \\
  \cmidrule{2-11}
                               & \multirow[t]{3}{*}{Llama 3 8B}  & \texttt{CLM\ Max}           & 0.12   & \textbf{13.65} & 24.76          & 0.56          & 0.22   & 10.97          & 23.45          & 0.94          \\
                               &                                 & \texttt{\methodname-HS}     & 0.19   & 19.24          & 20.97          & \textbf{1.00} & 0.24   & 10.52          & 11.13          & \textbf{1.00} \\
                               &                                 & \texttt{\methodname-L}      & 0.19   & 18.33          & \textbf{19.98} & \textbf{1.00} & 0.25   & \textbf{9.89}  & 10.47          & \textbf{1.00} \\
  \cmidrule{2-11}
                               & \multirow[t]{4}{*}{Phi 2}       & \texttt{CLM\ Max}           & -      & -              & -              & -             & 0.05   & 16.60          & 22.91          & 0.19          \\
                               &                                 & \texttt{CLM\ Sum}           & -      & -              & -              & -             & 0.06   & 16.51          & 21.26          & 0.21          \\
                               &                                 & \texttt{\methodname-HS}     & 0.18   & 19.00          & 21.66          & \textbf{0.83} & 0.24   & \textbf{15.59} & \textbf{17.38} & \textbf{0.94} \\
                               &                                 & \texttt{\methodname-L}      & -      & -              & -              & -             & 0.14   & 19.49          & 22.00          & 0.50          \\
  \midrule
  % ---- MBPP (10 rows: 3 + 4 + 3) ----
  \multirow[t]{10}{*}{MBPP}    & \multirow[t]{3}{*}{GPT 4o Mini} & \texttt{CLM\ Max}           & 0.08   & \textbf{1.04}  & \textbf{1.76}  & 0.38          & 0.15   & 1.02           & 1.38           & 0.65          \\
                               &                                 & \texttt{\methodname-HS}     & 0.07   & 1.94           & 15.00          & \textbf{0.50} & 0.16   & \textbf{1.00}  & \textbf{1.00}  & \textbf{1.00} \\
                               &                                 & \texttt{\methodname-L}      & 0.21   & 1.20           & 1.97           & \textbf{1.00} & 0.21   & \textbf{1.00}  & \textbf{1.00}  & \textbf{1.00} \\
  \cmidrule{2-11}
                               & \multirow[t]{4}{*}{Llama 3 8B}  & \texttt{CLM\ First-K}       & -      & -              & -              & -             & 0.02   & \textbf{7.13}  & \textbf{12.16} & 0.07          \\
                               &                                 & \texttt{CLM\ Sum}           & -      & -              & -              & -             & 0.02   & 8.45           & 13.40          & 0.06          \\
                               &                                 & \texttt{\methodname-HS}     & 0.12   & \textbf{11.13} & 23.50          & \textbf{0.83} & 0.17   & 10.25          & 19.05          & \textbf{0.95} \\
                               &                                 & \texttt{\methodname-L}      & 0.004  & -              & -              & 0.01          & 0.24   & 7.92           & 13.00          & \textbf{1.00} \\
  \cmidrule{2-11}
                               & \multirow[t]{3}{*}{Phi 2}       & \texttt{CLM\ First-K\ (nr)} & -      & -              & -              & -             & 0.02   & 19.57          & 19.57          & 0.07          \\
                               &                                 & \texttt{\methodname-HS}     & 0.16   & 10.50          & \textbf{24.15} & \textbf{0.80} & 0.22   & \textbf{9.97}  & \textbf{21.32} & \textbf{0.92} \\
                               &                                 & \texttt{\methodname-L}      & 0.02   & \textbf{8.86}  & 24.95          & 0.10          & 0.004  & 11.32          & 25.00          & 0.01          \\
  \midrule
  % ---- Math (3 rows) ----
  \multirow[t]{3}{*}{Math}     & \multirow[t]{3}{*}{GPT 4o Mini} & \texttt{CLM\ First-K}       & 0.22   & 13.73          & 16.61          & 0.99          & 0.27   & 8.25           & 9.22           & \textbf{1.00} \\
                               &                                 & \texttt{\methodname-HS}     & 0.20   & \textbf{11.35} & \textbf{11.40} & 0.97          & 0.24   & 8.22           & 8.25           & 0.99          \\
                               &                                 & \texttt{\methodname-L}      & 0.24   & 12.92          & 13.00          & \textbf{1.00} & 0.28   & \textbf{7.46}  & \textbf{7.50}  & \textbf{1.00} \\
  \midrule
  % ---- TriviaQA (8 rows: 1 + 6 + 1) ----
  \multirow[t]{8}{*}{TriviaQA} & GPT 4o Mini                     & \texttt{\methodname-HS}     & 0.23   & \textbf{1.39}  & 22.80          & \textbf{0.83} & 0.28   & \textbf{1.36}  & 13.73          & 0.92          \\
  \cmidrule{2-11}
                               & \multirow[t]{6}{*}{Llama 3 8B}  & \texttt{CLM\ First-K}       & 0.24   & 5.75           & 5.75           & \textbf{1.00} & 0.28   & 1.06           & \textbf{1.07}  & \textbf{1.00} \\
                               &                                 & \texttt{CLM\ First-K\ (nr)} & 0.24   & 5.72           & 5.72           & \textbf{1.00} & 0.28   & 1.08           & 1.08           & \textbf{1.00} \\
                               &                                 & \texttt{CLM\ Max}           & 0.24   & \textbf{1.42}  & 8.24           & \textbf{1.00} & 0.28   & \textbf{1.00}  & 1.08           & \textbf{1.00} \\
                               &                                 & \texttt{CLM\ Sum}           & 0.24   & 3.82           & \textbf{4.83}  & \textbf{1.00} & 0.28   & 1.06           & 1.09           & \textbf{1.00} \\
                               &                                 & \texttt{\methodname-HS}     & 0.12   & 1.74           & 23.00          & 0.50          & 0.29   & 1.17           & 2.00           & \textbf{1.00} \\
                               &                                 & \texttt{\methodname-L}      & 0.0002 & \textbf{1.69}  & 20.00          & 0.001         & 0.0006 & 1.22           & 2.50           & 0.003         \\
  \cmidrule{2-11}
                               & Phi 2                           & \texttt{\methodname-HS}     & 0.24   & 1.97           & 20.69          & \textbf{0.59} & 0.28   & 2.03           & 19.96          & \textbf{0.65} \\
  \bottomrule
\end{tabular}