% Results table: one row per dataset, one column per method
% (GDT, sklearn, GeneticTree, DNDT, DL85).
% Cell format: mean $\pm$ stdev (rank); the rank-1 entry of each row is
% prefixed with \bftab.
% NOTE(review): \bftab is not defined in this snippet -- presumably a bold
% font switch declared in the preamble; confirm.
\begin{table}[htb]
\centering
% The trailing % keeps the end-of-line from becoming a space token inside the
% box, which would otherwise be scaled with the table and shift it off-centre.
\resizebox{\columnwidth}{!}{%
%\begin{threeparttable}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\begin{tabular}{llllll}
\toprule
{} &                           GDT &                sklearn &            GeneticTree &                          DNDT &                          DL85 \\
\midrule
Iris                 &         0.965 $\pm$ 0.022 (2) &  0.952 $\pm$ 0.028 (3) &  0.936 $\pm$ 0.028 (4) &  \bftab 0.986 $\pm$ 0.014 (1) &         0.935 $\pm$ 0.033 (5) \\
Balance Scale        &         0.776 $\pm$ 0.051 (2) &  0.714 $\pm$ 0.015 (3) &  0.690 $\pm$ 0.022 (4) &  \bftab 0.885 $\pm$ 0.029 (1) &         0.662 $\pm$ 0.026 (5) \\
Car                  &  \bftab 0.905 $\pm$ 0.015 (1) &  0.802 $\pm$ 0.009 (3) &  0.608 $\pm$ 0.011 (5) &         0.871 $\pm$ 0.032 (2) &         0.765 $\pm$ 0.028 (4) \\
Glass                &         0.737 $\pm$ 0.159 (2) &  0.692 $\pm$ 0.134 (3) &  0.612 $\pm$ 0.082 (5) &  \bftab 0.764 $\pm$ 0.177 (1) &         0.646 $\pm$ 0.111 (4) \\
Contraceptive        &  \bftab 0.696 $\pm$ 0.022 (1) &  0.651 $\pm$ 0.017 (4) &  0.612 $\pm$ 0.035 (5) &         0.653 $\pm$ 0.030 (3) &         0.663 $\pm$ 0.015 (2) \\
Solar Flare          &  \bftab 0.526 $\pm$ 0.079 (1) &  0.500 $\pm$ 0.001 (4) &  0.500 $\pm$ 0.000 (5) &         0.510 $\pm$ 0.030 (2) &         0.501 $\pm$ 0.002 (3) \\
Wine                 &         0.950 $\pm$ 0.029 (2) &  0.934 $\pm$ 0.023 (3) &  0.925 $\pm$ 0.030 (4) &  \bftab 0.951 $\pm$ 0.023 (1) &         0.890 $\pm$ 0.018 (5) \\
% NOTE(review): the DNDT cells below are literal "nan" and are ranked last (5);
% presumably no DNDT result exists for these datasets -- confirm, and consider
% a placeholder such as "--" with an explanatory note.
Zoo                  &  \bftab 0.597 $\pm$ 0.195 (1) &  0.593 $\pm$ 0.187 (3) &  0.558 $\pm$ 0.116 (4) &             nan $\pm$ nan (5) &         0.594 $\pm$ 0.189 (2) \\
Lymphography         &  \bftab 0.527 $\pm$ 0.082 (1) &  0.514 $\pm$ 0.043 (3) &  0.511 $\pm$ 0.033 (4) &             nan $\pm$ nan (5) &         0.516 $\pm$ 0.048 (2) \\
Segment              &  \bftab 0.964 $\pm$ 0.008 (1) &  0.900 $\pm$ 0.005 (2) &  0.859 $\pm$ 0.032 (4) &             nan $\pm$ nan (5) &         0.889 $\pm$ 0.008 (3) \\
Dermatology          &  \bftab 0.979 $\pm$ 0.012 (1) &  0.965 $\pm$ 0.015 (2) &  0.907 $\pm$ 0.075 (4) &             nan $\pm$ nan (5) &         0.942 $\pm$ 0.028 (3) \\
Landsat              &  \bftab 0.956 $\pm$ 0.003 (1) &  0.862 $\pm$ 0.006 (3) &  0.803 $\pm$ 0.022 (4) &             nan $\pm$ nan (5) &         0.866 $\pm$ 0.005 (2) \\
Annealing            &         0.866 $\pm$ 0.185 (2) &  0.831 $\pm$ 0.169 (3) &  0.634 $\pm$ 0.097 (4) &             nan $\pm$ nan (5) &  \bftab 0.869 $\pm$ 0.186 (1) \\
Splice               &         0.932 $\pm$ 0.010 (2) &  0.925 $\pm$ 0.008 (3) &  0.778 $\pm$ 0.050 (4) &             nan $\pm$ nan (5) &  \bftab 0.943 $\pm$ 0.012 (1) \\
\midrule
Mean Reciprocal Rank &  \bftab 0.786 $\pm$ 0.247 (1) &  0.345 $\pm$ 0.069 (4) &  0.236 $\pm$ 0.023 (5) &         0.762 $\pm$ 0.280 (2) &         0.436 $\pm$ 0.256 (3) \\
\bottomrule
\end{tabular}%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
%\begin{tablenotes}
%\item[a] \footnotesize
%\item[b] \footnotesize
%\end{tablenotes}
%\end{threeparttable}
}
% The underscore must be escaped in caption text: a bare "_" outside math mode
% raises "Missing $ inserted". The \label key below may keep its underscore.
% NOTE(review): the caption mentions "train and test" scores and a "dataset
% specification", but the table shows a single score per method and no dataset
% specification columns -- confirm the intended wording.
\caption{\textbf{multi\_test Performance Comparison.} We report the train and test f1-score (mean $\pm$ stdev over 10 trials) and dataset specification. We also report the ranking of each approach for the corresponding dataset in brackets.}
\label{tab:eval-results_multi_test}
\end{table}


