% Results table: one row per dataset, one column per method
% (GDT, sklearn, GeneticTree, DNDT, DL85). Each cell is written as
% "mean $\pm$ stdev (rank)"; \bftab marks the rank-1 entry of each row.
% The final row aggregates the per-dataset ranks as a Mean Reciprocal Rank.
% NOTE(review): \bftab is not defined in this file -- presumably a bold-in-table
% macro from the preamble; confirm it is in scope wherever this table is \input.
% NOTE(review): the DNDT column contains literal "nan $\pm$ nan" for Zoo through
% Splice -- looks like missing results from the generator; confirm whether these
% should be typeset as a dash or explained in the caption.
\begin{table}[htb]
\centering
% The trailing % after the opening brace keeps the line end from becoming a
% spurious space inside the scaled box (it would offset and mis-scale the table).
\resizebox{\columnwidth}{!}{%
%\begin{threeparttable}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\begin{tabular}{llllll}
\toprule
{} &                           GDT &                       sklearn &            GeneticTree &                          DNDT &                          DL85 \\
\midrule
Iris                 &         0.973 $\pm$ 0.022 (2) &         0.948 $\pm$ 0.025 (3) &  0.919 $\pm$ 0.042 (5) &  \bftab 0.986 $\pm$ 0.014 (1) &         0.935 $\pm$ 0.033 (4) \\
Balance Scale        &         0.809 $\pm$ 0.039 (2) &         0.727 $\pm$ 0.017 (3) &  0.699 $\pm$ 0.032 (4) &  \bftab 0.885 $\pm$ 0.029 (1) &         0.662 $\pm$ 0.026 (5) \\
Car                  &         0.945 $\pm$ 0.021 (2) &  \bftab 0.963 $\pm$ 0.010 (1) &  0.598 $\pm$ 0.034 (5) &         0.871 $\pm$ 0.032 (3) &         0.765 $\pm$ 0.028 (4) \\
Glass                &         0.721 $\pm$ 0.154 (2) &         0.697 $\pm$ 0.142 (3) &  0.606 $\pm$ 0.078 (5) &  \bftab 0.764 $\pm$ 0.177 (1) &         0.646 $\pm$ 0.111 (4) \\
Contraceptive        &  \bftab 0.669 $\pm$ 0.021 (1) &         0.655 $\pm$ 0.021 (3) &  0.622 $\pm$ 0.028 (5) &         0.653 $\pm$ 0.030 (4) &         0.663 $\pm$ 0.015 (2) \\
Solar Flare          &  \bftab 0.521 $\pm$ 0.062 (1) &         0.501 $\pm$ 0.003 (3) &  0.500 $\pm$ 0.000 (5) &         0.510 $\pm$ 0.030 (2) &         0.501 $\pm$ 0.002 (4) \\
Wine                 &  \bftab 0.960 $\pm$ 0.036 (1) &         0.934 $\pm$ 0.023 (3) &  0.927 $\pm$ 0.036 (4) &         0.951 $\pm$ 0.023 (2) &         0.890 $\pm$ 0.018 (5) \\
Zoo                  &         0.596 $\pm$ 0.193 (2) &  \bftab 0.600 $\pm$ 0.200 (1) &  0.569 $\pm$ 0.143 (4) &             nan $\pm$ nan (5) &         0.594 $\pm$ 0.189 (3) \\
Lymphography         &         0.516 $\pm$ 0.047 (2) &         0.508 $\pm$ 0.023 (4) &  0.511 $\pm$ 0.033 (3) &             nan $\pm$ nan (5) &  \bftab 0.516 $\pm$ 0.048 (1) \\
Segment              &  \bftab 0.990 $\pm$ 0.002 (1) &         0.980 $\pm$ 0.003 (2) &  0.874 $\pm$ 0.024 (4) &             nan $\pm$ nan (5) &         0.889 $\pm$ 0.008 (3) \\
Dermatology          &  \bftab 0.991 $\pm$ 0.006 (1) &         0.964 $\pm$ 0.026 (2) &  0.928 $\pm$ 0.054 (4) &             nan $\pm$ nan (5) &         0.942 $\pm$ 0.028 (3) \\
Landsat              &  \bftab 0.968 $\pm$ 0.004 (1) &         0.900 $\pm$ 0.006 (2) &  0.788 $\pm$ 0.022 (4) &             nan $\pm$ nan (5) &         0.866 $\pm$ 0.005 (3) \\
Annealing            &  \bftab 0.888 $\pm$ 0.194 (1) &         0.831 $\pm$ 0.169 (3) &  0.640 $\pm$ 0.101 (4) &             nan $\pm$ nan (5) &         0.869 $\pm$ 0.186 (2) \\
Splice               &  \bftab 0.960 $\pm$ 0.005 (1) &         0.936 $\pm$ 0.006 (3) &  0.759 $\pm$ 0.048 (4) &             nan $\pm$ nan (5) &         0.943 $\pm$ 0.012 (2) \\
\midrule
Mean Reciprocal Rank &  \bftab 0.786 $\pm$ 0.247 (1) &         0.458 $\pm$ 0.233 (3) &  0.238 $\pm$ 0.035 (5) &         0.655 $\pm$ 0.310 (2) &         0.374 $\pm$ 0.201 (4) \\
\bottomrule
\end{tabular}%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
%\begin{tablenotes}
%\item[a] \footnotesize
%\item[b] \footnotesize
%\end{tablenotes}
%\end{threeparttable}
}
% The underscore in the caption text is escaped: a bare "_" in text mode raises
% "Missing $ inserted". The \label key below may keep its underscore.
% NOTE(review): the caption mentions train scores and a dataset specification,
% but the table shows one score per method and no dataset columns -- confirm wording.
\caption{\textbf{multi\_test Performance Comparison.} We report the train and test f1-score (mean $\pm$ stdev over 10 trials) and dataset specification. We also report the ranking of each approach for the corresponding dataset in brackets.}
\label{tab:eval-results_multi_test}
\end{table}


