% Table: number of instances per dataset and split (Train / Validation / Test / Overall).
% Uses \toprule/\midrule/\bottomrule (booktabs) and \multirow (multirow).
% In every row, Overall = Train + Validation + Test; "--" marks a split with no instances.
\begin{table}[tbp]
\footnotesize
\centering
% Column 1: dataset name (one \multirow per group); column 2: split name;
% columns 3-6: counts, right-aligned so digits line up.
\begin{tabular}{clrrrr}
\toprule
\multicolumn{1}{l}{\textbf{Dataset}} & \textbf{Split} & \textbf{Train} & \textbf{Validation} & \textbf{Test} & \textbf{Overall} \\
\midrule
% The first argument of each \multirow must equal the number of rows in its group.
\multirow{4}{*}{GEOQUERY}   & Standard                  & 600    & --    & 280    & 880    \\
                            & Length                    & 440    & --    & 440    & 880    \\
                            & TMCD                      & 440    & --    & 440    & 880    \\
                            & Template                  & 441    & --    & 439    & 880    \\
\midrule
\multirow{4}{*}{SPIDER}     & Random                    & 3,282  & --    & 1,094  & 4,376  \\
                            & Length                    & 3,282  & --    & 1,094  & 4,376  \\
                            & TMCD                      & 3,282  & --    & 1,094  & 4,376  \\
                            & Template                  & 3,280  & --    & 1,096  & 4,376  \\
\midrule
% SCAN has eight splits, so the label spans eight rows.
\multirow{8}{*}{SCAN}       & Standard                  & 16,990 & --    & 3,920  & 20,910 \\
                            & Length                    & 16,990 & --    & 3,920  & 20,910 \\
                            & Add Primitive (JUMP)      & 14,670 & --    & 7,706  & 22,376 \\
                            & Add Primitive (TURN LEFT) & 21,890 & --    & 1,208  & 23,098 \\
                            & Template (AROUND RIGHT)   & 15,225 & --    & 4,476  & 19,701 \\
                            & MCD1                      & 8,365  & 1,045 & 1,045  & 10,455 \\
                            & MCD2                      & 8,365  & 1,045 & 1,045  & 10,455 \\
                            & MCD3                      & 8,365  & 1,045 & 1,045  & 10,455 \\
\midrule
\multirow{2}{*}{COGS}       & Standard                  & 24,155 & 3,000 & 3,000  & 30,155 \\
                            & Generalization            & --     & --    & 21,000 & 21,000 \\
\bottomrule
\end{tabular}
\caption{Number of instances for each dataset in each optimization split.}
\label{tab:num_instances}
\end{table}