% Results table: per-dataset f1-score (mean +- stdev) of GDT, sklearn,
% GeneticTree, DNDT and DL85, with the per-dataset rank of each method in
% parentheses and the best entry of each row marked with \bftab.
% Requires booktabs (\toprule/\midrule/\bottomrule), graphicx (\resizebox)
% and a \bftab macro defined elsewhere in the project.
\begin{table}[htb]
\centering
% The trailing % keeps the end-of-line from becoming a space inside the
% scaled box, which would otherwise be counted as part of the table width.
\resizebox{\columnwidth}{!}{%
%\begin{threeparttable}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\begin{tabular}{llllll}
\toprule
{} &                           GDT &                       sklearn &            GeneticTree &                   DNDT &                          DL85 \\
\midrule
% NOTE(review): the Wine and Solar Flare rows contain tied scores that are
% nevertheless printed with distinct ranks -- confirm the intended tie handling.
% NOTE(review): DNDT has no result (nan) for Zoo through Splice and is shown
% with rank 5 on those rows -- confirm this is the intended presentation.
Iris                 &  \bftab 1.000 $\pm$ 0.000 (1) &         0.973 $\pm$ 0.007 (4) &  0.954 $\pm$ 0.010 (5) &  0.994 $\pm$ 0.012 (3) &         0.997 $\pm$ 0.003 (2) \\
Balance Scale        &         0.891 $\pm$ 0.034 (3) &  \bftab 1.000 $\pm$ 0.000 (1) &  0.733 $\pm$ 0.012 (4) &  0.892 $\pm$ 0.023 (2) &         0.727 $\pm$ 0.004 (5) \\
Car                  &         0.959 $\pm$ 0.015 (2) &  \bftab 0.989 $\pm$ 0.005 (1) &  0.603 $\pm$ 0.034 (5) &  0.883 $\pm$ 0.031 (3) &         0.763 $\pm$ 0.021 (4) \\
Glass                &         0.760 $\pm$ 0.174 (4) &  \bftab 0.996 $\pm$ 0.006 (1) &  0.674 $\pm$ 0.024 (5) &  0.765 $\pm$ 0.180 (3) &         0.832 $\pm$ 0.015 (2) \\
Contraceptive        &  \bftab 0.684 $\pm$ 0.018 (1) &         0.669 $\pm$ 0.008 (3) &  0.619 $\pm$ 0.019 (5) &  0.646 $\pm$ 0.027 (4) &         0.674 $\pm$ 0.004 (2) \\
Solar Flare          &         0.500 $\pm$ 0.000 (3) &  \bftab 0.596 $\pm$ 0.052 (1) &  0.500 $\pm$ 0.000 (4) &  0.500 $\pm$ 0.000 (5) &         0.531 $\pm$ 0.027 (2) \\
Wine                 &  \bftab 1.000 $\pm$ 0.000 (1) &         1.000 $\pm$ 0.000 (2) &  0.962 $\pm$ 0.010 (5) &  0.974 $\pm$ 0.018 (4) &         0.984 $\pm$ 0.003 (3) \\
Zoo                  &         0.550 $\pm$ 0.150 (4) &  \bftab 1.000 $\pm$ 0.000 (1) &  0.872 $\pm$ 0.063 (3) &      nan $\pm$ nan (5) &         1.000 $\pm$ 0.000 (2) \\
Lymphography         &         0.549 $\pm$ 0.146 (4) &  \bftab 0.946 $\pm$ 0.149 (1) &  0.705 $\pm$ 0.091 (3) &      nan $\pm$ nan (5) &         0.897 $\pm$ 0.134 (2) \\
Segment              &         0.993 $\pm$ 0.002 (2) &  \bftab 0.998 $\pm$ 0.001 (1) &  0.876 $\pm$ 0.018 (4) &      nan $\pm$ nan (5) &         0.884 $\pm$ 0.002 (3) \\
Dermatology          &  \bftab 1.000 $\pm$ 0.001 (1) &         0.992 $\pm$ 0.002 (2) &  0.933 $\pm$ 0.044 (4) &      nan $\pm$ nan (5) &         0.972 $\pm$ 0.003 (3) \\
Landsat              &  \bftab 0.973 $\pm$ 0.004 (1) &         0.935 $\pm$ 0.002 (2) &  0.790 $\pm$ 0.023 (4) &      nan $\pm$ nan (5) &         0.871 $\pm$ 0.003 (3) \\
Annealing            &         0.892 $\pm$ 0.196 (3) &         0.948 $\pm$ 0.033 (2) &  0.697 $\pm$ 0.073 (4) &      nan $\pm$ nan (5) &  \bftab 0.979 $\pm$ 0.010 (1) \\
Splice               &         0.963 $\pm$ 0.005 (2) &  \bftab 0.967 $\pm$ 0.002 (1) &  0.763 $\pm$ 0.046 (4) &      nan $\pm$ nan (5) &         0.944 $\pm$ 0.002 (3) \\
\midrule
% Summary row: mean reciprocal rank of each method, with the rank of that mean.
Mean Reciprocal Rank &         0.589 $\pm$ 0.317 (2) &  \bftab 0.792 $\pm$ 0.287 (1) &  0.250 $\pm$ 0.049 (5) &  0.333 $\pm$ 0.077 (4) &         0.473 $\pm$ 0.236 (3) \\
\bottomrule
\end{tabular}%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
%\begin{tablenotes}
%\item[a] \footnotesize
%\item[b] \footnotesize
%\end{tablenotes}
%\end{threeparttable}
}
% The underscore must be escaped in text mode; a bare "_" in the caption
% aborts compilation with "Missing $ inserted".
% NOTE(review): the caption mentions "train and test" scores and a "dataset
% specification", but the table shows a single score per method and no
% dataset-specification columns -- confirm the wording against the data.
\caption{\textbf{multi\_valid Performance Comparison.} We report the train and test f1-score (mean $\pm$ stdev over 10 trials) and dataset specification. We also report the ranking of each approach for the corresponding dataset in brackets.}
\label{tab:eval-results_multi_valid}
\end{table}


