%------------------------------------------------------------------------------
% UAI 2023: Fred & Lounes
%------------------------------------------------------------------------------

\documentclass[accepted]{uai2023} % for initial submission
% \documentclass[accepted]{uai2023} % after acceptance, for a revised
                                    % version; also before submission to
                                    % see how the non-anonymous paper
                                    % would look like
%% There is a class option to choose the math font
% \documentclass[mathfont=ptmx]{uai2023} % ptmx math instead of Computer
                                         % Modern (has noticable issues)
% \documentclass[mathfont=newtx]{uai2023} % newtx fonts (improves upon
                                          % ptmx; less tested, no support)
% NOTE: Only keep *one* line above as appropriate, as it will be replaced
%       automatically for papers to be published. Do not make any other
%       change above this note for an accepted version.

%------------------------------------------------------------------------------
% Packages
%------------------------------------------------------------------------------

%% Choose your variant of English; be consistent
\usepackage[american]{babel}
% \usepackage[british]{babel}

%% Some suggested packages, as needed:
\usepackage{natbib} % has a nice set of citation styles and commands
    \bibliographystyle{plainnat}
    \renewcommand{\bibsection}{\subsubsection*{References}}
\usepackage{mathtools} % amsmath with fixes and additions
\usepackage{amsthm}
\usepackage{amsmath}
\usepackage{amsbsy}
\usepackage{amssymb}
\usepackage{amsfonts}
\usepackage{nicefrac}
\usepackage{bm}
\usepackage{bbm}
\usepackage{adjustbox}
\usepackage{multirow}
\usepackage{booktabs}
\usepackage{bbm, dsfont}
\usepackage{bbold}
\usepackage{booktabs} % commands to create good-looking tables
\usepackage{caption}
\usepackage{subcaption}
\usepackage[most]{tcolorbox}
% Algorithms
\usepackage[ruled,noend,vlined]{algorithm2e}
%Tikz
\usepackage{pgf,tikz}
\usetikzlibrary{shapes,arrows,automata,positioning,calc,matrix}
% Savetrees
%\usepackage[subtle,mathspacing=normal,wordspacing=normal]{savetrees}
% \usepackage{siunitx} % for proper typesetting of numbers and units

%% Provided macros
% \smaller: Because the class footnote size is essentially LaTeX's \small,
%           redefining \footnotesize, we provide the original \footnotesize
%           using this macro.
%           (Use only sparingly, e.g., in drawings, as it is quite small.)


%------------------------------------------------------------------------------
% Theorem Styles
%------------------------------------------------------------------------------

\newtheoremstyle{example}% name
  {9pt}%      Space above, empty = `usual value'
  {9pt}%      Space below
  {}%         Body font
  {}%         Indent amount (empty = no indent, \parindent = para indent)
  {\bfseries}% Thm head font
  {.}%        Punctuation after thm head
  { }%         Space after thm head: \newline = linebreak
  {}%         Thm head spec
\theoremstyle{example}
\newtheorem{example}{Example}
\newtheoremstyle{theorem}% name
  {9pt}%      Space above, empty = `usual value'
  {9pt}%      Space below
  {}%         Body font
  {}%         Indent amount (empty = no indent, \parindent = para indent)
  {\bfseries}% Thm head font
  {.}%        Punctuation after thm head
  { }% Space after thm head: \newline = linebreak
  {}%         Thm head spec
\theoremstyle{theorem}
\newtheorem{theorem}{Theorem}
\newtheorem{conjecture}{Conjecture}
\newtheorem{corollary}{Corollary}
\newtheorem{lemma}{Lemma}
\newtheorem{problem}{Problem}
\newtheorem{proposition}{Proposition}
\newtheorem{definition}{Definition}
\newtheorem{remark}{Remark}
\newtheorem{note}{Note}
\newtheorem{open}{Open question}

%------------------------------------------------------------------------------
% Commands
%------------------------------------------------------------------------------

%% Self-defined macros
\newcommand{\swap}[3][-]{#3#1#2} % just an example


\newcommand{\B}{\mathbb{B}}
\newcommand{\PP}{\mathbb{P}}
\newcommand{\R}{\mathbb{R}}
\newcommand{\Rp}{\mathbb{R}_+}
\newcommand{\Rpp}{\mathbb{R}_{++}}
\renewcommand{\S}{\mathbb{S}}
\newcommand{\Q}{\mathbb{Q}}
\newcommand{\Z}{\mathbb{Z}}
\newcommand{\Zp}{\mathbb{Z}_+}
\newcommand{\Zpp}{\mathbb{Z}_{++}}
\renewcommand{\emptyset}{\varnothing}
\newcommand{\Id}[1]{#1}

\DeclareMathOperator*{\argmax}{argmax}
\DeclareMathOperator*{\argmin}{argmin}
\DeclareMathOperator*{\Argmax}{Argmax}
\DeclareMathOperator*{\Argmin}{Argmin}

\newcommand{\Binom}[1]{\binom{[#1]}{2}}
\renewcommand{\vec}[1]{\bm{#1}}
\newcommand{\Var}[1]{\mathit{Var}(#1)}
\newcommand{\seq}[1]{\langle #1 \rangle}
\newcommand{\inner}[2]{\langle #1, #2 \rangle}
\newcommand{\norm}[1]{\left\|#1\right\|}
\newcommand{\bignorm}[1]{\bigl\|#1\bigr\|}
\newcommand{\norma}[1]{\|#1\|_{\mathrm{a}}}
\newcommand{\normas}[1]{\|#1\|_{\mathrm{a^*}}}
\newcommand{\normb}[1]{\|#1\|_{\mathrm{b}}}
\newcommand{\normbs}[1]{\|#1\|_{\mathrm{b^*}}}
\newcommand{\sgn}{\mathrm{sgn}}
\newcommand{\size}[1]{|#1|}
\newcommand{\vecphi}{\bm{\phi}}
\newcommand{\vecPhi}{\bm{\Phi}}
\newcommand{\vecbeta}{\bm{\beta}}
\newcommand{\vectheta}{\bm{\theta}}
\newcommand{\vecTheta}{\bm{\Theta}}

\newcommand{\longpage}{\enlargethispage{\baselineskip}}
\newcommand{\shortpage}{\enlargethispage{-\baselineskip}}


%------------------------------------------------------------------------------
% Front Page
%------------------------------------------------------------------------------

\title{Approximating Probabilistic Explanations via Supermodular Minimization (Supplementary Material)}

% The standard author block has changed for UAI 2023 to provide
% more space for long author lists and allow for complex affiliations
%
% All author information is authomatically removed by the class for the
% anonymous submission version of your paper, so you can already add your
% information below.
%
% Add authors
\author[1]{\href{mailto:<bounia@cril.fr>?Subject=Your UAI 2023 paper}{Louenas Bounia}{}}
\author[1]{\href{mailto:<koriche@cril.fr>?Subject=Your UAI 2023 paper}{Frederic Koriche}{}}
% Add affiliations after the authors
\affil[1]{%
    CRIL UMR CNRS 8188\\
    Université d'Artois, France
}
  
\begin{document}
\maketitle

%------------------------------------------------------------------------------
% Introduction
%------------------------------------------------------------------------------

\appendix
\section{Additional Experiments}\label{sec:additional}

In this section, we present all experimental results obtained for all benchmarks.
Recall that for each benchmark $b$, an explanation task consists a tuple $(\mathcal T,\vec x,I,k)$, where 
\begin{itemize}
  \item $\mathcal T$ is a decision tree learned, using the \textsc{Cart} algorithm;
  \item $\vec x$ is a data instance from the test set, which is binarized according to the features in $\mathcal T$;
  \item $I$ is a path-explanation for $\vec x$ and $\mathcal T$;
  \item $k$ is the size limit. 
\end{itemize}  
Let $h$ denote the hypothesis associated with $\mathcal T$.
As indicated in the main paper, 
the performance of explainers on a benchmark $b$ is measured by drawing uniformly at random $m$ instances $\vec x$ 
from the test set of $b$, and averaging the resulting error $\epsilon_{h,\vec x}(S)$ 
and size $\size{S}$ of the output $S \subseteq I$. In our experiments, 
$m = \min \{s,150\}$, where $s$ is the size of the test set of $b$.
The URL addresses of all benchmarks is given in Table~\ref{tab.benchmarks}. 

\paragraph{Results for $k = 7$.} In Table~\ref{tab:complete} are reported the 
results for all the 50 benchmarks considered in this study. The leftmost column gives the name of the dataset $b$,
and the next two columns report statistics about the decision tree accuracy $(\mathit{acc})$, and the number of
its internal nodes $(d)$. The fourth column gives the average size of the path-explanation $I$ for a random 
($d$-dimensional) test instance $\vec x$. The next two groups of three columns report the average errors 
($\epsilon_{h,\vec x}(S)$) and sizes ($\size{S}$) for the approximation algorithms \textsc{ga} and \textsc{gd},
and the SAT-based method. Finally, the average run-time of the SAT-method is provided in the last column. 
The benchmarks colored in blue indicate that, for some explanation tasks, the SAT-method has reached the 
timeout before completing binary search, which results in a degradation of precision (and conciseness).
For the benchmarks in magenta, the solver could not perform a single run of binary search before reaching the timeout.

\paragraph{Results for $k = 7 \pm 2$.} In Figure~\ref{fig.barplots} are merged 12 bar plots reporting the 
error results for \textsc{ga} and \textsc{gd}, when $k$ ranges from $5$ to $9$. Note that for most of these explanation 
tasks, the SAT solver could not complete binary search before reaching the timeout. We can observe that the 
performances of \textsc{ga} and \textsc{gd} are very similar. A notable exception is the dataset \emph{compas},
where \textsc{ga} is slightly better than \textsc{gd} when $k$ increases. 


\paragraph{Results for $I = [d]$ (and $k = 7$).} 
As emphasized by Izza et al. \citeyear{IzzaIM.2022}, path-explanations are not necessarily abductive, since  
decision trees can include irrelevant features. Nevertheless, the above results indicate that 
\textsc{ga} and \textsc{gd} are robust enough to reduce such input explanations.
Through further analysis, one may wonder whether these approximation algorithms are able to find 
probabilistic explanations when $I$ is no longer a path-explanation 
for $\vec x$ and $\mathcal T$, but includes all features occurring in $\vec x$ (i.e. $I = [d]$). 
The corresponding results are reported in Table~\ref{tab.allfeatures}.   
Unsurprisingly, the performance of the SAT-based approach degrades when $d$ increases.
We can also observe that the performance of \textsc{gd} is slightly worse than the performance of \textsc{ga}. 
Starting from $S_n = [d]$, \textsc{gd} must perform $d$ iterations of the main loop, 
which increases the chance of reaching a bad local optimum. On the other hand, \textsc{ga} only performs 
$\mathcal O(k \ln(1/\gamma))$ iterations of the main loop in order to select a solution that is 
close to the optimum found by the SAT approach.

\setcounter{table}{1}
\begin{table*}[t]
  \centering
  \begin{footnotesize}
    \begin{adjustbox}{width=1.1\linewidth,center}  
    \begin{tabular}{lrrrrrrrrrrrrr}
    \toprule
    \multicolumn{4}{c}{Benchmark} & & \multicolumn{3}{c}{$\epsilon_{h,\vec x}(S)$} & &\multicolumn{3}{c}{$|S|$} & & \multicolumn{1}{c}{Time (s)} \\
    \cmidrule{1-4}\cmidrule{6-8} \cmidrule{10-12} \cmidrule{14-14}
    name & $\mathit{acc}$ & $d$ & \size{$I$} && \textsc{ga} & \textsc{gd} & \textsc{Sat} && \textsc{ga} & \textsc{gd} & \textsc{Sat} && \textsc{Sat} \\
    \midrule   
    \emph{voting} &94.66 & 16 & 3.05 && 0.07 ($\pm$0.09)& 0.07 ($\pm$0.09)& 0.07 ($\pm$0.09) && 2.00& 2.00&2.00 && 0.37\\

    \emph{placement} &95.38&18&3.62 && 0.14 ($\pm$0.20)& 0.14 ($\pm$0.20)& 0.14 ($\pm$0.20) && 2.02&2.02&2.02 && 0.55\\

    \emph{anneal2} &98.52&14&4.03 && 0.19 ($\pm$0.11)& 0.19 ($\pm$0.11)& 0.19 ($\pm$0.11) && 2.10&2.10&2.10 && 0.21\\

    \emph{cars} &98.36 & 21 & 4.33 && 0.16 ($\pm$0.11)& 0.16 ($\pm$0.11)& 0.16 ($\pm$0.11) && 2.08 & 2.08&2.08 && 0.74\\

    \emph{hepatitis} &83.72 & 13 & 4.47 && 0.05 ($\pm$0.10)& 0.05 ($\pm$0.10)& 0.05 ($\pm$0.10) && 3.00& 3.00&3.00 && 0.41\\

    \emph{autos} &87.10&21&4.50 && 0.12 ($\pm$0.12)& 0.12 ($\pm$0.12)& 0.12 ($\pm$0.12) && 3.53&3.53&3.53 && 0.72\\

    \emph{backache} &88.89 & 18 & 4.83 && 0.24 ($\pm$0.11)& 0.24 ($\pm$0.11)& 0.24 ($\pm$0.11)  && 2.22& 2.22&2.22 && 0.66\\

    \emph{cleveland2} &75.82 & 35 &4.98 && 0.05 ($\pm$0.08)& 0.05 ($\pm$0.08)& 0.05 ($\pm$0.08) && 4.10& 4.10&4.10 && 4.42\\

    \emph{mushroom} &100 & 17 & 4.99 && 0.28 ($\pm$0.15)& 0.28 ($\pm$0.15)& 0.28 ($\pm$0.15) && 3.02&3.02&3.02 && 0.55\\
   
    \emph{meta-data} &87.42&44&5.09 && 0.08 ($\pm$0.11)& 0.08 ($\pm$0.11)& 0.08 ($\pm$0.11) && 3.10&3.10&3.10 && 12.14\\
    
    \emph{vehicle} &96.85 & 23 & 5.19 && 0.21 ($\pm$0.10)& 0.21 ($\pm$0.10)& 0.21 ($\pm$0.10) && 2.02& 2.02&2.02 && 1.23\\

    \emph{ionosphere} &95.28 & 19 & 5.22 && 0.54 ($\pm$0.40)& 0.54 ($\pm$0.40)& 0.54 ($\pm$0.40)&& 1.03& 1.03&1.03 && 0.39\\

    \emph{kr-vs-kp}  &99.79 & 32 & 5.29 && 0.21 ($\pm$0.15)& 0.21($\pm$0.15)& 0.21 ($\pm$0.15) && 1.07& 1.07&1.07 && 2.08\\
   
    \emph{balance} &85.64 &17&5.37 && 0.06 ($\pm$0.08)& 0.06 ($\pm$0.08)& 0.06 ($\pm$0.08) && 4.03&4.03&4.03 && 1.82\\
   
    \emph{glass} &78.46&31&5.38 && 0.26 ($\pm$0.11)& 0.26 ($\pm$0.11)& 0.26 ($\pm$0.11) && 2.14&2.14&2.14 && 2.36\\

    \emph{student perf.} &91.79&30&5.41 && 0.26 ($\pm$0.11)& 0.26 ($\pm$0.11)& 0.26 ($\pm$0.11) && 2.00&2.00&2.00 && 2.16\\

    \emph{biomed} &96.83 & 15 & 5.68 && 0.25 ($\pm$0.10)& 0.25 ($\pm$0.10)& 0.25 ($\pm$0.10) && 2.32& 2.32&2.32 && 0.45\\

    \emph{tae} &65.22 & 32 & 5.78 && 0.12 ($\pm$0.19)& 0.13 ($\pm$0.20)& 0.12 ($\pm$0.18) && 3.96 & 3.91&3.94 && 3.22\\
    
    \emph{primary tumor}&84.31&23&6.23 && 0.09 ($\pm$0.09)& 0.09 ($\pm$0.09)& 0.09 ($\pm$0.08) && 4.22&4.22&4.22 && 3.58\\

    \emph{liver disorders} &75.96&58&6.38 && 0.18 ($\pm$0.09)& 0.18 ($\pm$0.08)& 0.18 ($\pm$0.08) && 4.00&4.00&4.00 && 27.33\\

    \emph{schizophrenia} &80.39&33&6.39 && 0.37 ($\pm$0.24)& 0.37 ($\pm$0.24)& 0.37 ($\pm$0.24) && 1.27&1.27&1.27 && 4.79\\

    \emph{tic-tac-toe} &92.36 & 9 & 6.46 && 0.24 ($\pm$0.13)& 0.24 ($\pm$0.13)& 0.23 ($\pm$0.10) && 2.96 & 2.87&2.87 && 1.43\\

    \emph{australian} &84.06 & 70 & 6.48 && 0.24 ($\pm$0.13)& 0.24 ($\pm$0.14)& 0.24 ($\pm$0.13) && 3.56 & 3.55&3.55 && 63.49\\

    \emph{hungarian} &62.92&13&6.65 && 0.12 ($\pm$0.12)& 0.12 ($\pm$0.12)& 0.11 ($\pm$0.10) && 3.58&3.56&3.56 && 1.68\\

    \emph{horse colic} &75.68&40&6.73 && 0.14 ($\pm$0.07)& 0.13 ($\pm$0.07)& 0.13 ($\pm$0.07) && 4.03&4.06&4.06 && 11.56\\

    \textcolor{magenta}{\emph{madelon}} &66.41 & 500 & 7.33 && 0.06 ($\pm$0.09)& 0.06 ($\pm$0.09)&$-$ && 6.50&6.50&$-$ &&$-$\\

    \emph{haberman} &67.39 & 53 & 8.18 && 0.73 ($\pm$0.11)& 0.76 ($\pm$0.09)& 0.75 ($\pm$0.10) && 2.96 & 3.02&3.08&& 29.43\\
    
    \textcolor{blue}{\emph{indian liver}} &64.57&84&8.21 && 0.10 ($\pm$0.09)& 0.10 ($\pm$0.09)& 0.16 ($\pm$0.12)&& 5.08&4.89&6.12 && 176.28\\

    \textcolor{blue}{\emph{pima indians}} &75.32&97&8.30 && 0.15 ($\pm$0.14)& 0.15 ($\pm$0.14)& 0.16 ($\pm$0.12) && 5.85&5.84&6.58 && 484.6\\

    \textcolor{magenta}{\emph{dexter}} &86.11 & 20000 & 8.32 && 0.06 ($\pm$0.08)& 0.06 ($\pm$0.08)& $-$ && 5.95&5.96&$-$ && $-$\\
    
    \textcolor{blue}{\emph{loan eligibility}} &74.31&68&8.47 && 0.19 ($\pm$0.13)& 0.18 ($\pm$0.13)& 0.20 ($\pm$0.14) && 5.60&5.70&6.82&& 42.87\\

    \emph{patient treat.} &66.01&10&8.92 && 0.05 ($\pm$0.09)& 0.03 ($\pm$0.06)& 0.03 ($\pm$0.08) && 5.63&5.94&5.94 && 24.08\\

    \emph{wine} &69.58&11&9.03 && 0.09 ($\pm$0.10)& 0.09 ($\pm$0.09)& 0.09 ($\pm$0.12) && 5.59& 5.64&5.62 && 36.32\\

    \textcolor{magenta}{\emph{christine}} &50.8 & 1023 & 9.47 && 0.28 ($\pm$0.10)& 0.28 ($\pm$0.10) & $-$ && 7.00 & 6.99&$-$ && $-$\\

    \textcolor{magenta}{\emph{gina agnostic}} &85.31 & 970 & 9.69 && 0.20 ($\pm$0.15)& 0.20 ($\pm$0.15)& $-$ && 6.90&6.90&$-$ && $-$\\

    \textcolor{magenta}{\emph{email spam}} &93.88 & 3000 & 10.46 && 0.09 ($\pm$0.13)& 0.09 ($\pm$0.13) & $-$ && 5.22&5.22&$-$ && $-$\\
    
    \textcolor{magenta}{\emph{gina prior}} &85.59 & 784 & 10.53 && 0.27 ($\pm$0.16)& 0.27 ($\pm$0.16)&$-$ && 6.89&6.89&$-$ && $-$\\

    \textcolor{blue}{\emph{employee attr.}} &82.45&63&10.56 && 0.06 ($\pm$0.09)& 0.06 ($\pm$0.09)& 0.20 ($\pm$0.11) && 6.41&6.39&6.98 && 1017.24\\
                    
    \textcolor{blue}{\emph{contraceptive}} &51.36&90&10.84 && 0.06 ($\pm$0.08)& 0.06 ($\pm$0.08)& 0.39 ($\pm$0.17) && 4.27&4.26&5.95 && 1096.07\\

    \textcolor{blue}{\emph{compas}} &67.60&40&10.95 && 0.03 ($\pm$0.07)& 0.04 ($\pm$0.08)& 0.05 ($\pm$0.09) && 5.68&5.83&6.78 && 1082.32\\
    
    \textcolor{blue}{\emph{fetal health}} &91.85&93&11.33 && 0.12 ($\pm$0.06)& 0.12 ($\pm$0.06)& 0.23 ($\pm$0.11) && 5.59&5.59&6.00 && 930.61\\

    \textcolor{magenta}{\emph{dorothea}} &91.88&100000&12.90 && 0.25 ($\pm$0.10)& 0.25 ($\pm$0.10)& $-$ && 6.70&6.70&$-$ && $-$\\

    \textcolor{magenta}{\emph{bank market.}} &89.49&882&13.11 && 0.29 ($\pm$0.08)& 0.29 ($\pm$0.07)& $-$ && 6.99&6.99&$-$ && $-$\\

    \textcolor{magenta}{\emph{mnist49}} &95.99&784&15.57 && 0.37 ($\pm$0.14)& 0.37 ($\pm$0.14)& $-$ && 6.97&6.89&$-$ && $-$\\

    \textcolor{magenta}{\emph{spambase}} &92.11&236&16.09 && 0.24 ($\pm$0.11)& 0.23 ($\pm$0.09)& $-$ && 6.87&6.87&$-$ && $-$\\

    \textcolor{magenta}{\emph{adult}} &81.16 & 2433 & 16.43 && 0.33 ($\pm$0.12)& 0.33 ($\pm$0.12)& $-$ && 6.87 & 6.87&$-$ && $-$\\
    
    \textcolor{magenta}{\emph{mnist38}} &96.42&784&17.89 && 0.37 ($\pm$0.13)& 0.38 ($\pm$0.14)& $-$&& 6.93&6.93&$-$ && $-$\\

    \textcolor{magenta}{\emph{cnae}} &92.59&856&19.07 && 0.32 ($\pm$0.25)& 0.32 ($\pm$0.25)& $-$ && 5.97&5.97&$-$ && $-$\\

    \textcolor{magenta}{\emph{gisette}} &94.10&5000&21.42 && 0.32 ($\pm$0.11)& 0.32 ($\pm$0.11)& $-$ && 6.88&6.88&$-$ && $-$\\

    \textcolor{magenta}{\emph{farm ads}} &80.78&$54877$&23.15 && 0.13 ($\pm$0.17)& 0.13 ($\pm$0.17)& $-$&& 6.31&6.31&$-$ && $-$\\
        
    \bottomrule
    \end{tabular}
    \end{adjustbox}
  \end{footnotesize}
  \caption{Experimental results on 50 benchmarks for decision tree explanations, using $k = 7$.}
  \label{tab:complete}
\end{table*}


\begin{table*}[t]
    \centering
    \begin{scriptsize}
    \begin{tabular}{rrrrrrrrrrrrrrr}
      \toprule
      \multicolumn{3}{c}{Benchmark}&& \multicolumn{3}{c}{$\epsilon_{h, x}(S)$}&&\multicolumn{3}{c}{$|\text{S}|$} &&\multicolumn{3}{c}{Time $(s)$} \\
      \cmidrule{1-3}\cmidrule{5-7} \cmidrule{9-11} \cmidrule{13-15}
      name & $acc$ & $d$ && GA & GD & SAT && GA & GD & SAT && GA & GD & SAT \\
      \midrule
        shuttle &94.87&9 && 0.0019 ($\pm$0.0229)& 0.0017 ($\pm$0.0203)& 0.0017 ($\pm$0.0203) && 2.15&2.75&4.26 && 0.0002&0.0004&1.02\\

        tic-tac-toe &95.58&9 && 0.0008 ($\pm$0.0102)& 0.0092 ($\pm$0.0326)& 0.0008 ($\pm$0.0101) && 4.68&4.97&5.85 && 0.0006&0.0008&0.79\\

        patient treat. &66.77&10 && 0.0154 ($\pm$0.0555)& 0.0157 ($\pm$0.0664)& 0.0152 ($\pm$0.0574) && 5.67&6.37&6.52 && 0.0023&0.0034&35.30\\

        wine &70.0&11 && 0.0150 ($\pm$0.0406)& 0.0308 ($\pm$0.0487)& 0.0153 ($\pm$0.0383) && 5.98&6.66&6.90 && 0.0025&0.0037&25.83\\

        hepatitis &81.74&13 && 0.0038 ($\pm$0.0377)& 0.0087 ($\pm$0.0318)& 0.0034 ($\pm$0.0187) && 2.86&4.07&3.85 && 0.0002&0.0002&0.63\\

        hungarian &80.90&13 && 0.0075 ($\pm$0.0503)& 0.0116 ($\pm$0.0271)& 0.0075 ($\pm$0.0442) && 5.46&5.80&6.90 && 0.0009&0.0013&1.53\\

        anneal2 &99.63&14 && 0.0248 ($\pm$0.0498)& 0.0332 ($\pm$0.0450)& 0.0245 ($\pm$0.0490) && 3.66&3.98&5.00 && 0.0002&0.0003&0.32\\

        biomed &93.65&15 && 0.0000 ($\pm$0.0000)& 0.0000 ($\pm$0.0000)& 0.0009 ($\pm$0.0000) && 4.52&4.59&4.52 && 0.0004&0.0005&0.47\\

        voting &93.89&16 && 0.0026 ($\pm$0.0188)& 0.0048 ($\pm$0.0269)& 0.0026 ($\pm$0.0164) && 3.01&3.78&5.02 && 0.0003&0.0006&0.54\\

        balance &81.38&17 && 0.0032 ($\pm$0.0118)& 0.0121 ($\pm$0.0183)& 0.0020 ($\pm$0.0084) && 5.45&5.77&5.85 && 0.0014&0.0025&27.22\\

        mushroom &100.0&17 && 0.0009 ($\pm$0.0066)& 0.0052 ($\pm$0.0222)& 0.0005 ($\pm$0.0015) && 4.55&4.87&5.45 && 0.0004&0.0007&2.59\\

        backache &85.19&18 && 0.0100 ($\pm$0.0357)& 0.0535 ($\pm$0.0512)& 0.0080 ($\pm$0.0237) && 3.43&4.43&4.92 && 0.0003&0.0006&1.16\\

        placement &92.31&18 && 0.0000 ($\pm$0.0000)& 0.0010 ($\pm$0.0291)& 0.0000 ($\pm$0.0000) && 3.66&4.15&5.10 && 0.0002&0.0002&0.32\\ 

        ionosphere &96.23&19 && 0.0121 ($\pm$0.0490)& 0.0301 ($\pm$0.0493)& 0.0075 ($\pm$0.0355) && 4.36&5.00&5.85 && 0.0005&0.0001&1.51\\

        autos &85.48&21 && 0.0499 ($\pm$0.0741)& 0.0838 ($\pm$0.0650)& 0.0045 ($\pm$0.0219) && 4.48&4.90&6.12 && 0.0005&0.0009&5.71\\

        cars &91.80&21 && 0.0329 ($\pm$0.0864)& 0.0701 ($\pm$0.1120)& 0.0238 ($\pm$0.0550) && 3.47&3.71&5.05 && 0.0006&0.0013&4.70\\

        primary tumour &81.37&23 && 0.0206 ($\pm$0.0493)& 0.0464 ($\pm$0.0459)& 0.0074 ($\pm$0.0221) && 5.37&5.74&6.08 && 0.0013&0.0030&47.23\\

        vehicle &96.06&23 && 0.0304 ($\pm$0.0458)& 0.0619 ($\pm$0.0608)& 0.0143 ($\pm$0.0344) && 4.49&4.77&4.90 && 0.0008&0.0014&14.31\\

        breast cancer &92.98&30 && 0.0091 ($\pm$0.0293)& 0.0244 ($\pm$0.0439)& 0.0066 ($\pm$0.0237) && 4.43&4.94&5.52 && 0.0005&0.0009&4.84\\

        student perf &90.77&30 && 0.0077 ($\pm$0.0316)& 0.0219 ($\pm$0.0394)& 0.0005 ($\pm$0.0010) && 4.23&5.00&5.75 && 0.0007&0.0016&10.50\\

        glass &87.69&31 && 0.1168 ($\pm$0.0791)& 0.1410 ($\pm$0.0906)& 0.0772 ($\pm$0.0758) && 4.75&4.85&5.50 && 0.0010&0.0019&56.90\\

        kr-vs-kp  &99.79&32 && 0.0096 ($\pm$0.0299)& 0.0300 ($\pm$0.0573)& 0.0095 ($\pm$0.0285) && 3.07&3.52&4.40 && 0.0015&0.0047&34.30\\

        tae &69.57&32 && 0.0339 ($\pm$0.0634)& 0.0385 ($\pm$0.0950)& 0.0236 ($\pm$0.0492) && 5.20&5.37&5.82 && 0.0011&0.0022&72.75\\

        schizophrenia &90.20&33 && 0.0022 ($\pm$0.0142)& 0.0024 ($\pm$0.0089)& 0.0019 ($\pm$0.0070) && 4.29&4.48&6.80 && 0.0014&0.0037&46.06\\

        cleveland2 &65.93&35 && 0.1217 ($\pm$0.0797)& 0.1594 ($\pm$0.0923)& 0.0626 ($\pm$0.0750) && 4.87&4.93&5.04 && 0.0017&0.0048&301.59\\

        haberman &67.39 &53 && 0.7467 ($\pm$0.1123)& 0.7941 ($\pm$0.1074)& 0.7430 ($\pm$0.1252) && 2.96 & 3.02&3.08 && 0.0034& 0.0041& 31.50\\

        \textcolor{blue}{compas} &66.41&40 && 0.0569 ($\pm$0.0697)& 0.0694 ($\pm$0.0783)& 0.1586 ($\pm$0.0879) && 5.65&6.55&7.00 && 0.0298&0.0931&1486.50\\

        horse colic &79.28&40 && 0.0503 ($\pm$0.0699)& 0.0342 ($\pm$0.0543)& 0.0133 ($\pm$0.0176) && 6.43&6.70&7.00 && 0.0028&0.0059&671.60\\

        meta-data &88.68&44 && 0.0223 ($\pm$0.0821)& 0.0290 ($\pm$0.0572)& 0.0199 ($\pm$0.0771) && 3.62&5.54&5.96 && 0.0017&0.0089&171.91\\

        \textcolor{blue}{employee attr.} &81.88&63 && 0.0708 ($\pm$0.0610)& 0.0960 ($\pm$0.0723)& 0.2212 ($\pm$0.1525) && 6.25&6.45&7.00 && 0.0958&0.1032&1340.60\\

        \textcolor{blue}{loan eligibility} &70.14&68&& 0.0629 ($\pm$0.0616)& 0.0870 ($\pm$0.0668)& 0.0956 ($\pm$0.0500) && 6.10&6.00&6.50 && 0.0090&0.0378&856.10\\

        \textcolor{blue}{australian} &79.23&70 && 0.0000 ($\pm$0.0000)& 0.0311 ($\pm$0.0592)& 0.0137 ($\pm$0.0286) && 4.70&6.40&6.10 && 0.0041&0.0308&573.94\\

        \textcolor{blue}{liver disorders} &71.43&84 && 0.0939 ($\pm$0.1087)& 0.1101 ($\pm$0.0891)& 0.1278 ($\pm$0.0878) && 6.03&6.90&7.00 && 0.0150&0.0744&897.81\\

        \textcolor{blue}{contraceptive} &51.36&90 && 0.0600 ($\pm$0.0800)& 0.0600 ($\pm$0.0800)& 0.3910 ($\pm$0.1700) && 4.27&4.26&5.95 && 0.0452 & 0.0892 & 1096.07\\

        \textcolor{blue}{fetal health} &91.85&93 && 0.1200 ($\pm$0.0600)& 0.1200 ($\pm$0.0600)& 0.2310 ($\pm$0.1100) && 5.59&5.59&6.25 && 0.0568 & 0.0723 & 930.61\\

        \textcolor{blue}{pimas indians} &72.56&97 && 0.1181 ($\pm$0.0834)& 0.1897 ($\pm$0.1072)& 0.1812 ($\pm$0.0622) && 6.75&7.00&6.95 && 0.0183&0.1675&709.57\\

        \textcolor{magenta}{spambase} &92.03&236 && 0.1268 ($\pm$0.0645)& 0.1845 ($\pm$0.0813)& $-$ && 6.89&6.99&$-$ && 0.0974&0.1828&$-$\\

        \textcolor{magenta}{madelon} &71.03&500 && 0.1257 ($\pm$0.1198)& 0.1971 ($\pm$0.0930)& $-$ && 6.85&6.98&$-$ && 0.0709&0.2611&$-$\\  

        \textcolor{magenta}{gina-prior} &87.13&784 && 0.2073 ($\pm$0.0837)& 0.2496 ($\pm$0.0874)& $-$ && 6.97&6.99&$-$ && 0.1087&1.3443&$-$\\

        \textcolor{magenta}{mnist38} &95.82&784 && 0.1561 ($\pm$0.0743)& 0.2675 ($\pm$0.0698)& $-$ && 6.95&7.00&$-$ && 0.1082&1.4738&$-$\\

        \textcolor{magenta}{mnist49} &95.02&784 && 0.1857 ($\pm$0.0731)& 0.2867 ($\pm$0.0970)& $-$ && 6.97&6.98&$-$ && 0.2019&1.3611&$-$\\

        \textcolor{magenta}{bank market.} &89.49&882 && 0.3245 ($\pm$0.1201)& 0.3890 ($\pm$0.1267)& $-$ && 6.99&6.99&$-$ && 0.2631& 1.4288& $-$\\

        \textcolor{magenta}{gina-agnostic} &83.86&970 && 0.1593 ($\pm$0.0792)& 0.2102 ($\pm$0.1084)& $-$ && 6.96&7.00&$-$ && 0.1306&1.7953&$-$\\

        \textcolor{magenta}{christine} &50.37&1023 && 0.2710 ($\pm$0.0678)& 0.3207 ($\pm$0.0816)& $-$ && 7.00&7.00&$-$ && 0.6179&1.9402&$-$\\

        \textcolor{magenta}{adult} &81.16& 2433 && 0.3882 ($\pm$0.1521)& 0.3925 ($\pm$0.1877)& $-$ && 6.87 & 6.87&$-$ && 0.1461& 0.9339& $-$\\

        \textcolor{magenta}{email spam} &94.07&3000 && 0.1090 ($\pm$0.1494)& 0.1761 ($\pm$0.2169)& $-$ && 4.90&6.78&$-$ && 0.0704&1.0079&$-$\\

        \textcolor{magenta}{gisette} &93.81&5000 && 0.1309 ($\pm$0.0706)& 0.2006 ($\pm$0.1056)& $-$ && 6.87&6.94&$-$ && 0.0746&2.8047&$-$\\
        
        \textcolor{magenta}{dexter} &83.89&20000 && 0.0321 ($\pm$0.0532)& 0.0614 ($\pm$0.0525)& $-$ && 5.74&6.63&$-$ && 0.1250&0.2330&$-$\\

        \textcolor{magenta}{farm ads} &80.78& 54877 && 0.1300 ($\pm$0.1700)& 0.1300 ($\pm$0.1700)& $-$&& 6.31&6.31&$-$ && 0.2710& 0.9892 &$-$\\

        \textcolor{magenta}{dorothea} &93.04&$10^5$ && 0.2383 ($\pm$0.0743)& 0.2514 ($\pm$0.0758)& $-$ && 6.87&6.97&$-$ && 0.2027&1.2040&$-$\\
        
      \bottomrule
    \end{tabular}
    \end{scriptsize}
    \caption{Experimental results on 50 benchmarks, using $I = [d]$ and $k = 7$.}
    \label{tab.allfeatures}
  \end{table*}


\setcounter{figure}{3}
\begin{figure*}
	\centering
  \begin{subfigure}[h]{.48\linewidth}
    \includegraphics[width=\linewidth]{fig/adult.jpg}
    \caption{\emph{adult}} 
  \end{subfigure}
  \hfill
  \begin{subfigure}[h]{.48\linewidth}
    \includegraphics[width=\linewidth]{fig/cnae.jpg}
    \caption{\emph{cnae}} 
  \end{subfigure}
  \begin{subfigure}[h]{.48\linewidth}
    \includegraphics[width=\linewidth]{fig/compas.jpg}
    \caption{\emph{compas}} 
  \end{subfigure}
  \hfill
  \begin{subfigure}[h]{.48\linewidth}
    \includegraphics[width=\linewidth]{fig/dexter.jpg}
    \caption{\emph{dexter}} 
  \end{subfigure}
  \begin{subfigure}[h]{.48\linewidth}
    \includegraphics[width=\linewidth]{fig/emails.jpg}
    \caption{\emph{email spam}} 
  \end{subfigure}
  \hfill
  \begin{subfigure}[h]{.48\linewidth}
    \includegraphics[width=\linewidth]{fig/employee.jpg}
    \caption{\emph{employee attr.}} 
  \end{subfigure}
  \caption{Bar plots for the errors of \textsc{ga} (yellow) and \textsc{gd} (blue), using $k = 7 \pm 2$.}
	\label{fig.barplots}
\end{figure*}

\begin{figure*}\ContinuedFloat
	\centering
  \begin{subfigure}[h]{.48\linewidth}
    \includegraphics[width=\linewidth]{fig/farm.jpg}
    \caption{\emph{farm ads}} 
  \end{subfigure}
  \hfill
  \begin{subfigure}[h]{.48\linewidth}
    \includegraphics[width=\linewidth]{fig/gina-agnostic.jpg}
    \caption{\emph{gina agnostic}} 
  \end{subfigure}
  \begin{subfigure}[h]{.48\linewidth}
    \includegraphics[width=\linewidth]{fig/gina-prior.jpg}
    \caption{\emph{gina prior}} 
  \end{subfigure}
  \hfill
  \begin{subfigure}[h]{.48\linewidth}
    \includegraphics[width=\linewidth]{fig/gisette.jpg}
    \caption{\emph{gisette}}
  \end{subfigure}     
    \begin{subfigure}[h]{.48\linewidth}
      \includegraphics[width=\linewidth]{fig/mnist38.jpg}
      \caption{\emph{mnist38}} 
    \end{subfigure}
    \hfill
    \begin{subfigure}[h]{.48\linewidth}
      \includegraphics[width=\linewidth]{fig/mnist49.jpg}
      \caption{\emph{mnist49}}   
  \end{subfigure}
  \caption{Bar plots for the errors of \textsc{ga} (yellow) and \textsc{gd} (blue), using $k = 7 \pm 2$ (\emph{cont.}).}
	\label{fig.barplots}
\end{figure*}

\begin{table*}[t]
    \centering
    \begin{scriptsize}
    \begin{tabular}{lll}
      \toprule
      Benchmark & Source & Link \\    
      \midrule
      \emph{adult} & UCI & \url{https://archive.ics.uci.edu/ml/datasets/adult} \\

      \emph{anneal2} & UCI & \url{https://archive.ics.uci.edu/ml/datasets/Annealing} \\ 

      \emph{australian} & OpenML & \url{https://www.openml.org/search?type=data&status=active&id=40981} \\

      \emph{autos} & UCI & \url{https://archive.ics.uci.edu/ml/machine-learning-databases/autos/} \\

      \emph{backache} & Kaggle & \url{www.kaggle.com/datasets/sammy123/lower-back-pain-symptoms-dataset} \\

      \emph{balance} & UCI & \url{https://archive.ics.uci.edu/ml/datasets/balance+scale} \\

      \emph{bank market.} & UCI & \url{https://archive.ics.uci.edu/ml/datasets/bank+marketing} \\

      \emph{biomed} & OpenML & \url{https://www.openml.org/search?type=data&status=active&id=481}\\

      \emph{cars} & OpenML & \url{www.openml.org/search?type=data&status=active&id=967} \\

      \emph{christine} & OpenML & \url{https://www.openml.org/search?type=data&status=active&id=41142}\\

      \emph{cleveland2} & Kaggle & \url{https://www.kaggle.com/datasets/cherngs/heart-disease-cleveland-uci} \\

      \emph{cnae} & UCI & \url{https://archive.ics.uci.edu/ml/datasets/cnae-9} \\

      \emph{compas} & OpemML & \url{www.openml.org/search?type=data&sort=runs&id=42193&status=active} \\

      \emph{contraceptive} & UCI & \url{https://archive.ics.uci.edu/ml/datasets/Contraceptive+Method+Choice} \\

      \emph{dexter} & UCI & \url{https://archive.ics.uci.edu/ml/datasets/dexter} \\

      \emph{dorothea} & OpenML & \url{www.openml.org/search?type=data&status=active&id=4137} \\

      \emph{email spam} & Kaggle & \url{https://www.kaggle.com/datasets/veleon/ham-and-spam-dataset}\\

      \emph{employee attr.} & Kaggle & \url{https://www.kaggle.com/datasets/HRAnalyticRepository/employee-attrition-data} \\

      \emph{farm-ads} & UCI & \url{https://archive.ics.uci.edu/ml/datasets/Farm+Ads} \\

      \emph{fetal health} & Kaggle & \url{www.kaggle.com/datasets/andrewmvd/fetal-health-classification} \\

      \emph{gina agnostic} & OpenML & \url{www.openml.org/search?type=data&sort=runs&id=1038&status=active} \\

      \emph{gina prior} & OpenML & \url{https://www.openml.org/search?type=data&status=active&id=1042} \\

      \emph{gisette} & UCI & \url{https://archive.ics.uci.edu/ml/datasets/Gisette} \\

      \emph{glass} & UCI & \url{https://archive.ics.uci.edu/ml/datasets/glass+identification} \\
 
      \emph{haberman} & UCI & \url{https://archive.ics.uci.edu/ml/datasets/haberman's+survival} \\

      \emph{hepatisis} & UCI & \url{https://archive.ics.uci.edu/ml/datasets/hepatitis} \\

      \emph{horse colic} & Kaggle & \url{www.kaggle.com/datasets/uciml/horse-colic?select=horse.csv} \\

      \emph{hungarian} & OpenML & \url{www.openml.org/search?type=data&status=active&id=858} \\

      \emph{indian liver} & Kaggle & \url{www.kaggle.com/datasets/uciml/indian-liver-patient-records} \\

      \emph{ionosphere} & UCI & \url{https://archive.ics.uci.edu/ml/datasets/ionosphere}\\

      \emph{kr-vs-kp} & UCI & \url{https://archive.ics.uci.edu/ml/datasets/Chess+(King-Rook+vs.+King-Pawn)} \\

      \emph{liver disorders} & UCI & \url{https://archive.ics.uci.edu/ml/datasets/Liver+Disorders} \\

      \emph{loan eligibility} & Kaggle & \url{www.kaggle.com/datasets/devzohaib/eligibility-prediction-for-loan} \\

      \emph{madelon} & UCI & \url{https://archive.ics.uci.edu/ml/datasets/madelon} \\

      \emph{meta-data} & UCI & \url{https://archive.ics.uci.edu/ml/datasets/Meta-data} \\

      \emph{mnist38} & Kaggle & \url{https://www.kaggle.com/datasets/oddrationale/mnist-in-csv} \\

      \emph{mnist49} & Kaggle & \url{https://www.kaggle.com/datasets/oddrationale/mnist-in-csv} \\

      \emph{mushroom} & UCI & \url{https://archive.ics.uci.edu/ml/datasets/mushroom} \\

      \emph{patient treat.} & Kaggle & \url{www.kaggle.com/datasets/manishkc06/patient-treatment-classification} \\

      \emph{pima indians} & Kaggle & \url{www.kaggle.com/datasets/uciml/pima-indians-diabetes-database} \\

      \emph{placement} & Kaggle & \url{https://www.kaggle.com/datasets/ahsan81/job-placement-dataset} \\

      \emph{primary tumor} & UCI & \url{https://archive.ics.uci.edu/ml/datasets/primary+tumor} \\

      \emph{schizophrenia} & UCI & \url{http://archive.ics.uci.edu/ml/datasets/mhealth+dataset} \\

      \emph{shuttle} & UCI & \url{https://archive.ics.uci.edu/ml/datasets/Shuttle+Landing+Control}\\  

      \emph{spambase} & UCI & \url{https://archive.ics.uci.edu/ml/datasets/spambase} \\

      \emph{student perf.} & OpenML & \url{www.openml.org/search?type=data&sort=runs&id=42351&status=active} \\

      \emph{tae} & UCI & \url{archive.ics.uci.edu/ml/datasets/teaching+assistant+evaluation} \\

      \emph{tic-tac-toe} & UCI & \url{https://archive.ics.uci.edu/ml/datasets/Tic-Tac-Toe+Endgame} \\

      \emph{vehicle} & Kaggle & \url{www.kaggle.com/datasets/nehalbirla/vehicle-dataset-from-cardekho} \\

      \emph{voting} & Kaggle & \url{www.kaggle.com/datasets/devvret/congressional-voting-records} \\

      \emph{wine} & Kaggle & \url{www.kaggle.com/datasets/uciml/red-wine-quality-cortez-et-al-2009} \\

      \bottomrule
    \end{tabular}
    \end{scriptsize}
    \caption{List of benchmarks used in the experiments. Notably, \emph{anneal2} is a binarized version of \emph{annealing}, where the goal is to separate the label 2 from all other labels;
    \emph{mnist49} (resp. \emph{mnist38}) is a subset of \emph{mnist} restricted to the instances labeled as 4 and 9 (resp. 3 and 8).}
    \label{tab.benchmarks}
  \end{table*}

%------------------------------------------------------------------------------
% References
%------------------------------------------------------------------------------

\bibliography{bounia_332-supp}
\end{document}
