% Results table: one row per dataset, one column per method (GDT, sklearn,
% GeneticTree, DNDT, DL85). Each cell is "mean $\pm$ stdev (rank)", where the
% rank is the method's position on that dataset; \bftab marks the rank-1 cell.
\begin{table}[htb]
\centering
% The trailing % after the opening brace stops the line break from becoming a
% space inside the scaled box (which would shift and slightly shrink the table).
\resizebox{\columnwidth}{!}{%
%\begin{threeparttable}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\begin{tabular}{llllll}
\toprule
{} &                           GDT &                       sklearn &            GeneticTree &                          DNDT &                          DL85 \\
\midrule
Iris                 &         0.927 $\pm$ 0.036 (3) &  \bftab 0.937 $\pm$ 0.035 (1) &  0.914 $\pm$ 0.039 (4) &         0.933 $\pm$ 0.034 (2) &         0.913 $\pm$ 0.043 (5) \\
Balance Scale        &         0.722 $\pm$ 0.051 (3) &         0.736 $\pm$ 0.016 (2) &  0.700 $\pm$ 0.033 (4) &  \bftab 0.776 $\pm$ 0.024 (1) &         0.661 $\pm$ 0.045 (5) \\
Car                  &         0.781 $\pm$ 0.019 (3) &  \bftab 0.848 $\pm$ 0.011 (1) &  0.729 $\pm$ 0.016 (4) &         0.701 $\pm$ 0.042 (5) &         0.827 $\pm$ 0.024 (2) \\
Glass                &         0.512 $\pm$ 0.126 (5) &  \bftab 0.678 $\pm$ 0.074 (1) &  0.574 $\pm$ 0.062 (4) &         0.671 $\pm$ 0.082 (2) &         0.634 $\pm$ 0.069 (3) \\
Contraceptive        &         0.533 $\pm$ 0.021 (3) &         0.553 $\pm$ 0.022 (2) &  0.488 $\pm$ 0.056 (4) &         0.477 $\pm$ 0.048 (5) &  \bftab 0.568 $\pm$ 0.020 (1) \\
Solar Flare          &         0.793 $\pm$ 0.027 (3) &         0.794 $\pm$ 0.031 (2) &  0.793 $\pm$ 0.026 (4) &  \bftab 0.801 $\pm$ 0.028 (1) &         0.790 $\pm$ 0.026 (5) \\
Wine                 &         0.902 $\pm$ 0.035 (2) &  \bftab 0.914 $\pm$ 0.032 (1) &  0.889 $\pm$ 0.045 (3) &         0.847 $\pm$ 0.046 (5) &         0.856 $\pm$ 0.018 (4) \\
% NOTE(review): from Zoo onwards DNDT has no score ("nan") and is listed with
% rank 5 -- presumably DNDT could not be run on these datasets; confirm, and
% consider explaining the nan entries in the caption.
Zoo                  &         0.867 $\pm$ 0.082 (3) &         0.921 $\pm$ 0.090 (2) &  0.828 $\pm$ 0.105 (4) &             nan $\pm$ nan (5) &  \bftab 0.929 $\pm$ 0.087 (1) \\
Lymphography         &         0.720 $\pm$ 0.090 (4) &         0.746 $\pm$ 0.083 (2) &  0.732 $\pm$ 0.095 (3) &             nan $\pm$ nan (5) &  \bftab 0.824 $\pm$ 0.102 (1) \\
Segment              &  \bftab 0.832 $\pm$ 0.029 (1) &         0.795 $\pm$ 0.024 (3) &  0.731 $\pm$ 0.074 (4) &             nan $\pm$ nan (5) &         0.810 $\pm$ 0.013 (2) \\
Dermatology          &         0.920 $\pm$ 0.052 (3) &  \bftab 0.949 $\pm$ 0.023 (1) &  0.865 $\pm$ 0.115 (4) &             nan $\pm$ nan (5) &         0.929 $\pm$ 0.026 (2) \\
Landsat              &         0.807 $\pm$ 0.020 (3) &  \bftab 0.811 $\pm$ 0.009 (1) &  0.707 $\pm$ 0.040 (4) &             nan $\pm$ nan (5) &         0.808 $\pm$ 0.006 (2) \\
Annealing            &         0.931 $\pm$ 0.018 (3) &         0.973 $\pm$ 0.011 (2) &  0.803 $\pm$ 0.078 (4) &             nan $\pm$ nan (5) &  \bftab 0.985 $\pm$ 0.007 (1) \\
Splice               &         0.821 $\pm$ 0.022 (3) &         0.900 $\pm$ 0.008 (2) &  0.703 $\pm$ 0.084 (4) &             nan $\pm$ nan (5) &  \bftab 0.923 $\pm$ 0.015 (1) \\
\midrule
% Summary row: mean of 1/rank over the datasets, with the method ordering in
% parentheses.
% NOTE(review): DNDT's 0.514 equals 3.6/7, i.e. it averages only the seven
% datasets with a DNDT score; averaging over all 14 rows with the printed
% rank 5 for the nan rows would give 5.0/14 = 0.357. Confirm which is intended.
Mean Reciprocal Rank &         0.377 $\pm$ 0.183 (4) &  \bftab 0.702 $\pm$ 0.261 (1) &  0.262 $\pm$ 0.029 (5) &         0.514 $\pm$ 0.331 (3) &         0.585 $\pm$ 0.328 (2) \\
\bottomrule
\end{tabular}%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
%\begin{tablenotes}
%\item[a] \footnotesize
%\item[b] \footnotesize
%\end{tablenotes}
%\end{threeparttable}
}
% The underscore in the caption text is escaped: a bare _ is only valid in math
% mode and raises "Missing $ inserted" in text. The \label key below may keep
% its underscores.
% NOTE(review): the caption mentions train scores and a dataset specification,
% but the table shows a single score per method and no dataset details --
% confirm the wording against the intended content.
\caption{\textbf{multi\_test Performance Comparison.} We report the train and test f1-score (mean $\pm$ stdev over 10 trials) and dataset specification. We also report the ranking of each approach for the corresponding dataset in brackets.}
\label{tab:eval-results_multi_test}
\end{table}


