\documentclass{midl} % Include author names
%\documentclass[anon]{midl} % Anonymized submission

% The following packages will be automatically loaded:
% jmlr, amsmath, amssymb, natbib, graphicx, url, algorithm2e
% ifoddpage, relsize and probably more
% make sure they are installed with your latex distribution

\usepackage{mwe} % to get dummy images

% Header for extended abstracts
\jmlrproceedings{MIDL}{Medical Imaging with Deep Learning}
\jmlrpages{}
\jmlryear{2021}

% to be uncommented for submissions under review
\jmlrworkshop{Short Paper -- MIDL 2021 submission}
\jmlrvolume{-- Under Review}
\editors{Under Review for MIDL 2021}

\title[ICAM-reg: Interpretable Classification and Regression]{ICAM-reg: Interpretable Classification and Regression with Feature Attribution for Mapping Neurological Phenotypes in Individual Scans}

 % Use \Name{Author Name} to specify the name.
 % If the surname contains spaces, enclose the surname
 % in braces, e.g. \Name{John {Smith Jones}} similarly
 % if the name has a "von" part, e.g \Name{Jane {de Winter}}.
 % If the first letter in the forenames is a diacritic
 % enclose the diacritic in braces, e.g. \Name{{\'E}louise Smith}

 % Two authors with the same address
 % \midlauthor{\Name{Author Name1} \Email{abc@sample.edu}\and
 %  \Name{Author Name2} \Email{xyz@sample.edu}\\
 %  \addr Address}

 % Three or more authors with the same address:
 % \midlauthor{\Name{Author Name1} \Email{an1@sample.edu}\\
 %  \Name{Author Name2} \Email{an2@sample.edu}\\
 %  \Name{Author Name3} \Email{an3@sample.edu}\\
 %  \addr Address}


% Authors with different addresses:
% \midlauthor{\Name{Author Name1} \Email{abc@sample.edu}\\
% \addr Address 1
% \AND
% \Name{Author Name2} \Email{xyz@sample.edu}\\
% \addr Address 2
% }

%\footnotetext[1]{Contributed equally}

% More complicated cases, e.g. with dual affiliations and joint authorship
\midlauthor{\Name{Cher Bass \nametag{$^{1}$}} \Email{cher.bass@kcl.ac.uk}\\
\addr $^{1}$ King's College London \\
\Name{Mariana {da Silva} \nametag{$^{1}$}} \\
\Name{Carole Sudre \nametag{$^{1}$}} \\
\Name{Logan Z. J. Williams \nametag{$^{1}$}} \\
\Name{Petru-Daniel Tudosiu \nametag{$^{1}$}} \\
\Name{Fidel {Alfaro-Almagro} \nametag{$^{1}$}} \\
\Name{Sean P. Fitzgibbon \nametag{$^{2}$}} \\
\addr $^{2}$ University of Oxford \\
\Name{Matthew F. Glasser \nametag{$^{3}$}} \\
\addr $^{3}$ Washington University in St Louis \\
\Name{Stephen M. Smith \nametag{$^{2}$}} \\
\Name{Emma C. Robinson \nametag{$^{1}$}} \Email{emma.robinson@kcl.ac.uk}\\ 
}
\begin{document}

\maketitle

\begin{abstract}
Feature attribution (FA), or the assignment of class relevance to different locations in an image, is important for many classification and regression problems but is particularly crucial within the neuroscience domain, where accurate mechanistic models of behaviours, or disease, require knowledge of all features discriminative of a trait. At the same time, predicting class relevance from brain images is challenging as phenotypes are typically heterogeneous, and changes occur against a background of significant natural variation. Here, we present an extension of the ICAM framework for creating prediction-specific FA maps through image-to-image translation.
\end{abstract}

\begin{keywords}
Interpretable, Classification, Regression, Deep Generative Networks.
\end{keywords}

\section{Introduction}
Brain images represent a significant resource in the development of mechanistic models of behaviour and neurological/psychiatric disease as, in principle, they capture measurable neuroanatomical traits that are heritable, present in unaffected siblings and detectable prior to disease onset. For many complex disorders, however, these features of disease are subtle, variable and obscured by a backdrop of significant natural variation in brain shape and appearance; this makes them extremely difficult to detect.

To detect features of disease in brain imaging, recent studies have started to apply deep learning methods that examine the features or weights of CNNs, called feature attribution (FA) methods. These include gradient-based methods that analyse the gradients with respect to a given input image, such as guided backpropagation \citep{springenberg2014striving}, and perturbation methods such as occlusion. However, these methods are low resolution, do not detect heterogeneous structures (i.e.\ features that do not appear in all subjects), and often require averaging across multiple subjects to achieve good detection \citep{bohle2019layer}. An alternative method, VA-GAN \citep{baumgartner2018visual}, which uses a generative model, was still unable to detect all salient features.

To address these challenges, in \citet{bass2020icam} we developed ICAM, which disentangles class-relevant disease \emph{attributes} (attr) from class-irrelevant shape \emph{content}. In this way, the method was able to generate much more accurate maps of cortical atrophy due to Alzheimer's disease. Here, we extend the approach with a regression module, enabling the network to perform regression as well as classification.

\begin{figure}[!bt]
 \centering
\makebox[\linewidth]{%to center the image
	\includegraphics[width=0.6\textwidth]{figures/network_camera_ready.png}}
\caption{Overview of method. An example of how ICAM performs classification/regression with attribute map generation for two given input images $x$ and $y$.}
\label{fig:network_translation}
\end{figure}

\section{Methods}

The goal of the $\mathrm{ICAM}_{\mathrm{reg}}$ framework \citep{bass2020icam, bass2021icam} is to perform classification (or regression) with simultaneous feature attribution, by training a VAE-GAN to swap the classes of input images $x$ and $y$, changing only the features of each image that are specific to the target phenotype. The design of the network is outlined in Fig.~\ref{fig:network_translation}.

\begin{figure*}[!bt]
  \centering
\makebox[\linewidth]{%to center the image
	\includegraphics[width=1.0\textwidth]{figures/biobank_interpolation_outlier.png}}
\caption{Highlights of UK Biobank results: outlier explanation, and interpolation between groups. Green arrows, cortex; blue arrows, ventricles. }
\label{fig:biobank_results}
\end{figure*}


\section{Results}

Here, we show our results on the UK Biobank for age prediction (see \citet{bass2021icam} for full experiments on 2 other datasets). In our regression experiments, we found that brain age prediction by $\mathrm{ICAM}_{\mathrm{reg}}$ ($2.20\pm1.86$ MAE) performs competitively relative to other deep learning methods trained on age prediction using the UK Biobank (reported test MAE scores of $2.14 \pm 0.05$; \citealp{peng2021accurate}).
In addition, we highlight our qualitative results with $\mathrm{ICAM}_{\mathrm{reg}}$ in Fig.~\ref{fig:biobank_results}, showing an example of outlier explanation and interpolation between 2 subjects. In Fig.~\ref{fig:biobank_results}A, age-matched subjects, one of whom is predicted as an outlier (subject 2, predicted=56, true=47 years), are used to demonstrate outlier detection. Evidence for the outlier prediction of subject 2 is presented through translating between the 2 subjects, indicating the presence of larger ventricles, hippocampal atrophy and cortical shrinking in subject 2. In Fig.~\ref{fig:biobank_results}B, we demonstrate that the latent space is interpretable by linearly interpolating between the encoded attribute vectors (i.e.\ of 2 subjects with different ages), and showing clear interpolation between them, where both the predicted ages and the FA maps are smoothly translated.

\bibliography{mybibliography}


\end{document}
