% Results table: one row per dataset, one column per method
% (GDT, sklearn, GeneticTree, DNDT, DL85). Each cell is
% "mean $\pm$ stdev (rank)"; \bftab marks the rank-1 entry of the row.
% The last row aggregates the per-dataset ranks as a mean reciprocal rank.
% \bftab is not defined in this file; it must be provided by the preamble.
% NOTE(review): the caption mentions "train and test" scores and a
% "dataset specification", but each cell holds a single score plus a rank --
% confirm the caption wording against the data that was exported.
% NOTE(review): the DNDT column reads "nan" from Zoo onwards -- presumably no
% result was obtained for these datasets; confirm and consider explaining it
% in the caption or a table note.
\begin{table}[htb]
\centering
% The trailing % keeps the line break from becoming a space token inside the
% scaled box (it would otherwise be scaled along with the tabular).
\resizebox{\columnwidth}{!}{%
%\begin{threeparttable}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\begin{tabular}{llllll}
\toprule
{} &                           GDT &                       sklearn &            GeneticTree &                   DNDT &                          DL85 \\
\midrule
Iris                 &  \bftab 1.000 $\pm$ 0.000 (1) &         0.964 $\pm$ 0.009 (3) &  0.939 $\pm$ 0.013 (5) &  0.950 $\pm$ 0.034 (4) &         0.996 $\pm$ 0.004 (2) \\
Balance Scale        &         0.842 $\pm$ 0.021 (2) &  \bftab 1.000 $\pm$ 0.000 (1) &  0.778 $\pm$ 0.017 (4) &  0.788 $\pm$ 0.043 (3) &         0.768 $\pm$ 0.007 (5) \\
Car                  &         0.879 $\pm$ 0.034 (2) &  \bftab 0.995 $\pm$ 0.001 (1) &  0.720 $\pm$ 0.049 (4) &  0.709 $\pm$ 0.044 (5) &         0.838 $\pm$ 0.007 (3) \\
Glass                &         0.741 $\pm$ 0.044 (3) &  \bftab 0.995 $\pm$ 0.006 (1) &  0.593 $\pm$ 0.038 (5) &  0.659 $\pm$ 0.113 (4) &         0.785 $\pm$ 0.011 (2) \\
Contraceptive        &         0.559 $\pm$ 0.015 (3) &         0.578 $\pm$ 0.008 (2) &  0.509 $\pm$ 0.032 (4) &  0.472 $\pm$ 0.038 (5) &  \bftab 0.585 $\pm$ 0.004 (1) \\
Solar Flare          &         0.784 $\pm$ 0.022 (3) &  \bftab 0.825 $\pm$ 0.007 (1) &  0.766 $\pm$ 0.006 (5) &  0.779 $\pm$ 0.026 (4) &         0.804 $\pm$ 0.006 (2) \\
Wine                 &  \bftab 1.000 $\pm$ 0.000 (1) &         1.000 $\pm$ 0.000 (2) &  0.947 $\pm$ 0.015 (4) &  0.896 $\pm$ 0.039 (5) &         0.976 $\pm$ 0.005 (3) \\
Zoo                  &         0.975 $\pm$ 0.049 (3) &  \bftab 1.000 $\pm$ 0.000 (1) &  0.880 $\pm$ 0.064 (4) &      nan $\pm$ nan (5) &         1.000 $\pm$ 0.000 (2) \\
Lymphography         &         0.862 $\pm$ 0.063 (3) &  \bftab 0.993 $\pm$ 0.012 (1) &  0.816 $\pm$ 0.044 (4) &      nan $\pm$ nan (5) &         0.969 $\pm$ 0.008 (2) \\
Segment              &         0.959 $\pm$ 0.004 (2) &  \bftab 0.997 $\pm$ 0.002 (1) &  0.763 $\pm$ 0.046 (4) &      nan $\pm$ nan (5) &         0.799 $\pm$ 0.004 (3) \\
Dermatology          &  \bftab 0.993 $\pm$ 0.009 (1) &         0.988 $\pm$ 0.003 (2) &  0.900 $\pm$ 0.064 (4) &      nan $\pm$ nan (5) &         0.960 $\pm$ 0.005 (3) \\
Landsat              &         0.867 $\pm$ 0.006 (2) &  \bftab 0.909 $\pm$ 0.002 (1) &  0.676 $\pm$ 0.044 (4) &      nan $\pm$ nan (5) &         0.816 $\pm$ 0.003 (3) \\
Annealing            &         0.977 $\pm$ 0.014 (3) &         0.987 $\pm$ 0.004 (2) &  0.842 $\pm$ 0.062 (4) &      nan $\pm$ nan (5) &  \bftab 0.996 $\pm$ 0.001 (1) \\
Splice               &         0.888 $\pm$ 0.012 (3) &  \bftab 0.957 $\pm$ 0.003 (1) &  0.670 $\pm$ 0.068 (4) &      nan $\pm$ nan (5) &         0.925 $\pm$ 0.003 (2) \\
\midrule
Mean Reciprocal Rank &         0.524 $\pm$ 0.259 (3) &  \bftab 0.845 $\pm$ 0.248 (1) &  0.239 $\pm$ 0.021 (5) &  0.240 $\pm$ 0.044 (4) &         0.526 $\pm$ 0.263 (2) \\
\bottomrule
\end{tabular}%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
%\begin{tablenotes}
%\item[a] \footnotesize
%\item[b] \footnotesize
%\end{tablenotes}
%\end{threeparttable}
}
% The underscore must be escaped in text mode; a bare `_' raises
% "Missing $ inserted". The \label key below may keep its underscore.
\caption{\textbf{multi\_valid Performance Comparison.} We report the train and test f1-score (mean $\pm$ stdev over 10 trials) and dataset specification. We also report the ranking of each approach for the corresponding dataset in brackets.}
\label{tab:eval-results_multi_valid}
\end{table}


