% The results have been computed with Emanuele's KL
% Name of the "MNIST & Co" benchmark family, set in upright typewriter type.
% \normalfont\ttfamily replaces the obsolete \tt switch (undefined in classes
% that drop the old font commands); \normalfont keeps the name upright even
% inside \textsc{...}, matching what \tt did. Intended for text mode only.
% \xspace restores the inter-word space after the macro in running text.
\newcommand*{\MNISTAndCo}{{\normalfont\ttfamily MNIST \& Co}\xspace}

% Overview of the metrics reported for \MNISTAndCo: one row per metric, giving
% its definition (second column) and notes on the variants that are also
% available (third column).
\begin{table*}
    \centering
    \scriptsize
    \begin{tabular}{p{2cm}p{6cm}p{6cm}}
        \toprule
            & \multicolumn{2}{c}{\textsc{\MNISTAndCo}} \\
        \cmidrule(lr){2-3}
            & \textsc{metric}
            & \textsc{comment} \\
        \midrule
            \textsc{\YAcc} & accuracy computed on the factorized $p(y \mid x)$ & F1 is also available
            \\
            \textsc{\CAcc} & accuracy computed on the factorized $p(c \mid x)$ & there is also the $p(w \mid x)$ which is not factorized, but maybe is not suitable for the main tables (F1 is also available)
            \\
            \textsc{\YECE} & ECE computed on the factorized $p(y \mid x)$ & there is the single $y$ counterpart
            \\
            \textsc{\CECE} & ECE computed on the factorized $p(c \mid x)$ & there is also the single concept counterpart, as well as the world ones
            \\
            \textsc{mean $H(W \mid x)$} & OVA $H(W \mid x)$ computed on each sample of the test set and then averaged & there is also the factorized counterpart
            \\
            % NOTE(review): this row repeats the label and metric text of the
            % row above; only the comment differs. Confirm whether the two rows
            % should be merged or one of them should describe another quantity.
            \textsc{mean $H(W \mid x)$} & OVA $H(W \mid x)$ computed on each sample of the test set and then averaged & there is also the world specific entropy and the factorized $p(c \mid x)$ counterpart (including the concept specific version)
            \\
            % NOTE(review): the comment below mentions "entropy" in a variance
            % row -- possibly copied from the row above; confirm the wording.
            \textsc{mean $\mathrm{Var}(W \mid x)$} & $\mathrm{Var}(W \mid x)$ computed on each sample of the test set and then averaged & there is also the world specific entropy and the factorized $p(c \mid x)$ counterpart (including the concept specific version)
            \\
            \textsc{mean $H(C \mid Y)$} & entropy computed on all the concept vector filtered per class ($y$) and then averaged & there is also the variance counterpart
            \\
        \bottomrule
    \end{tabular}
\end{table*}

% Overview of the metrics reported for \BOIA: one row per metric, giving its
% definition (second column) and the motivation or a note (third column).
\begin{table*}
    \centering
    \scriptsize
    \begin{tabular}{lll}
        \toprule
            & \multicolumn{2}{c}{\BOIA}
        \\
        \cmidrule(lr){2-3}
            & \textsc{metric}
            & \textsc{motivation}
        \\
        \midrule
        \textsc{\mFY} & F1 score per class and then averaged & accuracy is also computed like this for \BOIA
        \\
        \textsc{\mFC} & F1 score per concept and then averaged & accuracy is also computed like this for \BOIA
        \\
        \textsc{\mYECE} & ECE score computed per class and then averaged &
        \\
        \textsc{\mCECE} & ECE score computed per concept and then averaged &
        \\
        % Span all three columns so this note does not stretch the narrow
        % first column and push the metric/motivation columns to the right.
        \multicolumn{3}{l}{\textsc{the same metrics computed for \MNISTAndCo}}
        \\
        \bottomrule
    \end{tabular}
\end{table*}