% Results table: one row per dataset, one column per method
% (GDT, sklearn, GeneticTree, DNDT, DL85).
% Each cell reads "mean $\pm$ stdev (rank)"; \bftab marks the rank-1 entry of a row.
% The final row aggregates the per-dataset ranks as the Mean Reciprocal Rank.
% NOTE(review): the DNDT cells for Zoo..Splice are "nan $\pm$ nan" -- presumably
% no result was obtained for those datasets; confirm and consider explaining it
% in the caption.
\begin{table}[htb]
\centering
% The trailing % keeps the end-of-line from becoming a space token inside the
% scaled box (it would otherwise be scaled with the tabular and offset it).
\resizebox{\columnwidth}{!}{%
%\begin{threeparttable}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\begin{tabular}{llllll}
\toprule
{} &                           GDT &                       sklearn &            GeneticTree &                          DNDT &                          DL85 \\
\midrule
Iris                 &  \bftab 0.998 $\pm$ 0.005 (1) &         0.997 $\pm$ 0.003 (2) &  0.962 $\pm$ 0.010 (5) &         0.994 $\pm$ 0.012 (4) &         0.997 $\pm$ 0.003 (3) \\
Balance Scale        &         0.868 $\pm$ 0.019 (2) &         0.785 $\pm$ 0.011 (3) &  0.722 $\pm$ 0.010 (5) &  \bftab 0.892 $\pm$ 0.023 (1) &         0.727 $\pm$ 0.004 (4) \\
Car                  &  \bftab 0.918 $\pm$ 0.016 (1) &         0.808 $\pm$ 0.004 (3) &  0.614 $\pm$ 0.003 (5) &         0.883 $\pm$ 0.031 (2) &         0.763 $\pm$ 0.021 (4) \\
Glass                &         0.735 $\pm$ 0.158 (4) &  \bftab 0.888 $\pm$ 0.018 (1) &  0.712 $\pm$ 0.046 (5) &         0.765 $\pm$ 0.180 (3) &         0.832 $\pm$ 0.015 (2) \\
Contraceptive        &  \bftab 0.728 $\pm$ 0.019 (1) &         0.674 $\pm$ 0.007 (2) &  0.611 $\pm$ 0.024 (5) &         0.646 $\pm$ 0.027 (4) &         0.674 $\pm$ 0.004 (3) \\
Solar Flare          &         0.500 $\pm$ 0.000 (3) &         0.512 $\pm$ 0.013 (2) &  0.500 $\pm$ 0.000 (4) &         0.500 $\pm$ 0.000 (5) &  \bftab 0.531 $\pm$ 0.027 (1) \\
Wine                 &         1.000 $\pm$ 0.001 (2) &  \bftab 1.000 $\pm$ 0.000 (1) &  0.967 $\pm$ 0.008 (5) &         0.974 $\pm$ 0.018 (4) &         0.984 $\pm$ 0.003 (3) \\
Zoo                  &         0.548 $\pm$ 0.143 (4) &         0.960 $\pm$ 0.017 (2) &  0.840 $\pm$ 0.037 (3) &             nan $\pm$ nan (5) &  \bftab 1.000 $\pm$ 0.000 (1) \\
Lymphography         &         0.546 $\pm$ 0.137 (4) &         0.890 $\pm$ 0.136 (2) &  0.685 $\pm$ 0.086 (3) &             nan $\pm$ nan (5) &  \bftab 0.897 $\pm$ 0.134 (1) \\
Segment              &  \bftab 0.967 $\pm$ 0.007 (1) &         0.901 $\pm$ 0.001 (2) &  0.861 $\pm$ 0.026 (4) &             nan $\pm$ nan (5) &         0.884 $\pm$ 0.002 (3) \\
Dermatology          &  \bftab 0.991 $\pm$ 0.006 (1) &         0.973 $\pm$ 0.004 (2) &  0.907 $\pm$ 0.065 (4) &             nan $\pm$ nan (5) &         0.972 $\pm$ 0.003 (3) \\
Landsat              &  \bftab 0.960 $\pm$ 0.006 (1) &         0.878 $\pm$ 0.007 (2) &  0.804 $\pm$ 0.023 (4) &             nan $\pm$ nan (5) &         0.871 $\pm$ 0.003 (3) \\
Annealing            &         0.878 $\pm$ 0.190 (3) &         0.948 $\pm$ 0.033 (2) &  0.670 $\pm$ 0.080 (4) &             nan $\pm$ nan (5) &  \bftab 0.979 $\pm$ 0.010 (1) \\
Splice               &         0.930 $\pm$ 0.012 (2) &         0.930 $\pm$ 0.002 (3) &  0.782 $\pm$ 0.047 (4) &             nan $\pm$ nan (5) &  \bftab 0.944 $\pm$ 0.002 (1) \\
\midrule
Mean Reciprocal Rank &  \bftab 0.637 $\pm$ 0.325 (1) &         0.536 $\pm$ 0.201 (3) &  0.246 $\pm$ 0.050 (5) &         0.417 $\pm$ 0.252 (4) &         0.571 $\pm$ 0.324 (2) \\
\bottomrule
\end{tabular}%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
%\begin{tablenotes}
%\item[a] \footnotesize
%\item[b] \footnotesize
%\end{tablenotes}
%\end{threeparttable}
}%
% The underscore is escaped: a bare `_' in text mode raises "Missing $ inserted".
% NOTE(review): the caption mentions "train and test" scores and a "dataset
% specification", but each cell holds a single score -- confirm the wording.
\caption{\textbf{multi\_valid Performance Comparison.} We report the train and test f1-score (mean $\pm$ stdev over 10 trials) and dataset specification. We also report the ranking of each approach for the corresponding dataset in brackets.}
\label{tab:eval-results_multi_valid}
\end{table}


