% Results table: one row per dataset (14 datasets) plus a "Mean Reciprocal
% Rank" summary row; one column per method (GDT, sklearn, GeneticTree, DNDT,
% DL85). Each cell has the form "mean $\pm$ stdev (rank)"; the rank-1 entry of
% every row is prefixed with \bftab.
% Uses \toprule/\midrule/\bottomrule (booktabs) and \resizebox (graphicx).
% \bftab is not defined in this file -- presumably a bold-font switch for table
% cells provided by the preamble; confirm.
\begin{table}[htb]
\centering
% The trailing `%' keeps the end of line from adding a stray space inside the
% scaled box in front of the tabular.
\resizebox{\columnwidth}{!}{%
%\begin{threeparttable}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\begin{tabular}{llllll}
\toprule
{} &                           GDT &                       sklearn &            GeneticTree &                          DNDT &                          DL85 \\
\midrule
Iris                 &  \bftab 0.944 $\pm$ 0.047 (1) &         0.930 $\pm$ 0.032 (3) &  0.890 $\pm$ 0.061 (5) &         0.933 $\pm$ 0.034 (2) &         0.913 $\pm$ 0.043 (4) \\
Balance Scale        &         0.737 $\pm$ 0.029 (3) &         0.773 $\pm$ 0.022 (2) &  0.713 $\pm$ 0.049 (4) &  \bftab 0.776 $\pm$ 0.024 (1) &         0.661 $\pm$ 0.045 (5) \\
Car                  &         0.852 $\pm$ 0.038 (2) &  \bftab 0.975 $\pm$ 0.003 (1) &  0.715 $\pm$ 0.044 (4) &         0.701 $\pm$ 0.042 (5) &         0.827 $\pm$ 0.024 (3) \\
Glass                &         0.678 $\pm$ 0.074 (2) &  \bftab 0.681 $\pm$ 0.076 (1) &  0.587 $\pm$ 0.102 (5) &         0.671 $\pm$ 0.082 (3) &         0.634 $\pm$ 0.069 (4) \\
Contraceptive        &         0.531 $\pm$ 0.026 (3) &         0.559 $\pm$ 0.025 (2) &  0.503 $\pm$ 0.048 (4) &         0.477 $\pm$ 0.048 (5) &  \bftab 0.568 $\pm$ 0.020 (1) \\
Solar Flare          &         0.793 $\pm$ 0.027 (3) &         0.795 $\pm$ 0.024 (2) &  0.793 $\pm$ 0.026 (4) &  \bftab 0.801 $\pm$ 0.028 (1) &         0.790 $\pm$ 0.026 (5) \\
Wine                 &  \bftab 0.923 $\pm$ 0.041 (1) &         0.914 $\pm$ 0.032 (2) &  0.891 $\pm$ 0.055 (3) &         0.847 $\pm$ 0.046 (5) &         0.856 $\pm$ 0.018 (4) \\
% NOTE(review): from Zoo through Splice the DNDT column holds "nan" and is
% ranked last (5). Presumably no DNDT result was obtained for these datasets;
% confirm, and consider a dash or a table note instead of the raw "nan".
Zoo                  &         0.946 $\pm$ 0.054 (2) &  \bftab 0.970 $\pm$ 0.050 (1) &  0.850 $\pm$ 0.100 (4) &             nan $\pm$ nan (5) &         0.929 $\pm$ 0.087 (3) \\
Lymphography         &         0.769 $\pm$ 0.050 (2) &         0.724 $\pm$ 0.075 (4) &  0.740 $\pm$ 0.071 (3) &             nan $\pm$ nan (5) &  \bftab 0.824 $\pm$ 0.102 (1) \\
Segment              &         0.943 $\pm$ 0.009 (2) &  \bftab 0.966 $\pm$ 0.005 (1) &  0.770 $\pm$ 0.049 (4) &             nan $\pm$ nan (5) &         0.810 $\pm$ 0.013 (3) \\
Dermatology          &         0.934 $\pm$ 0.032 (2) &  \bftab 0.965 $\pm$ 0.023 (1) &  0.894 $\pm$ 0.102 (4) &             nan $\pm$ nan (5) &         0.929 $\pm$ 0.026 (3) \\
Landsat              &         0.852 $\pm$ 0.008 (2) &  \bftab 0.856 $\pm$ 0.008 (1) &  0.674 $\pm$ 0.041 (4) &             nan $\pm$ nan (5) &         0.808 $\pm$ 0.006 (3) \\
Annealing            &         0.970 $\pm$ 0.014 (3) &         0.973 $\pm$ 0.011 (2) &  0.821 $\pm$ 0.091 (4) &             nan $\pm$ nan (5) &  \bftab 0.985 $\pm$ 0.007 (1) \\
Splice               &         0.883 $\pm$ 0.011 (3) &         0.918 $\pm$ 0.006 (2) &  0.667 $\pm$ 0.066 (4) &             nan $\pm$ nan (5) &  \bftab 0.923 $\pm$ 0.015 (1) \\
\midrule
Mean Reciprocal Rank &         0.512 $\pm$ 0.213 (2) &  \bftab 0.685 $\pm$ 0.282 (1) &  0.255 $\pm$ 0.036 (5) &         0.490 $\pm$ 0.337 (3) &         0.487 $\pm$ 0.328 (4) \\
\bottomrule
\end{tabular}%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
%\begin{tablenotes}
%\item[a] \footnotesize
%\item[b] \footnotesize
%\end{tablenotes}
%\end{threeparttable}
}
% The underscore in the caption title is escaped: a bare `_' in text mode
% raises "Missing $ inserted". The label below may keep its underscore.
% NOTE(review): the caption mentions train scores and a dataset specification,
% but each cell shows a single score and there are no dataset-specification
% columns -- confirm the wording against the intended content.
\caption{\textbf{multi\_test Performance Comparison.} We report the train and test f1-score (mean $\pm$ stdev over 10 trials) and dataset specification. We also report the ranking of each approach for the corresponding dataset in brackets.}
\label{tab:eval-results_multi_test}
\end{table}


