% Table tab:table_counts: number of samples per task in SemTabNet,
% broken down by split (Train / Test / Val).
% The caption carries a footnote (\tablefootnote) explaining why the
% per-task totals differ from each other.
\begin{table}[t]
\caption{Counts of data in SemTabNet. Tasks are explained in \cref{sec:experimentalresults}.\tablefootnote{The counts differ slightly due to the manner in which the final data was harmonized. The SE Indirect 1D data consists of the 84,890 original cells annotated from 1,107 tables. The test/train split of tables for SE Indirect 1D was prepared by stratifying across all cell labels. This split was augmented (as described in the text) to prepare data for SE Indirect 2D. The test/train split and augmentation for SE Direct was done independently.}}
\label{tab:table_counts}
% \vskip -5em
\begin{center}
\begin{small}
\begin{sc}
    % One left-aligned label column followed by three right-aligned count columns.
    \begin{tabular}{lrrr}
    \hline
        Task & Train & Test & Val \\ 
        \hline
        % Disabled rows (UD2SD tasks), kept commented out in the source.
        % UD2SD & 187,040 & 21,424 & 9,845 \\ 
        % UD2SD - Text & 83,585 & 9,742 & 4,400 \\ 
        SE Direct & 103,455 & 11,682 & 5,445 \\ 
        % The SE Indirect 1D row sums to 84,890, the cell count quoted in the caption footnote.
        SE Indirect 1D & 72,580 & 8,489 & 3,821 \\ 
        SE Indirect 2D & 93,153 & 22,839 & 4,903 \\ 
        \hline
    \end{tabular}
\end{sc}
\end{small}
\end{center}
% \vskip -2em
\end{table}
