\section{\textsc{Nito}}\label{sec:impl}


\begin{figure*}[t]
    \centering
    \begin{subfigure}{0.3\textwidth}
        \centering 
        \includegraphics[scale=0.4]{images/grid/tumour.png}
        \caption{An MRI slice with a tumor}
        \label{fig:tumour}
    \end{subfigure}
    \hfill
       \begin{subfigure}{0.3\textwidth}
        \centering 
        \includegraphics[scale=0.4]{images/grid/full_grid_black.png}
        \caption{The grid in black}
        \label{fig:grid_black}
    \end{subfigure}
    \hfill
    \begin{subfigure}{0.3\textwidth}
        \centering 
        \includegraphics[scale=0.4]{images/grid/full_grid_colour.png}
        \caption{A grid in real colors}
        \label{fig:grid_colour}
    \end{subfigure}
    \caption{A MRI slice with tumor (upper right quadrant of brain) with two grid overlays: with nodes in black~\Cref{fig:grid_black}, and in the original
    color of the image~\Cref{fig:grid_colour}. Note that the grid does not respect physical features of the brain. In practice, having the grid in the original
    colors of the image does not provide sufficient contrast to change the classification, whereas having the grid in black (or other high-contrast color)
    does.}
     \label{fig:grid_types}
\end{figure*}

\begin{figure*}[t]
    \centering
    \begin{subfigure}[b]{0.3\textwidth}
        \centering 
        \includegraphics[scale=0.4]{images/grid_calculate/grid_3_1_1.png}
        \caption{Insufficiently dense grid for class $0$}
        \label{fig:grid_311}
    \end{subfigure}
    \hfill
       \begin{subfigure}[b]{0.3\textwidth}
        \centering 
        \includegraphics[scale=0.4]{images/grid_calculate/grid_3_2_1.png}
        \caption{A denser grid, but still insufficient}
        \label{fig:grid_321}
    \end{subfigure}
    \hfill
    \begin{subfigure}[b]{0.3\textwidth}
        \centering 
        \includegraphics[scale=0.4]{images/grid_calculate/grid_3_3_0.png}
        \caption{A sufficient grid for class $0$}
        \label{fig:grid_330}
    \end{subfigure}
    \caption{The grid is refined by search (here shown over an entire slice for clarity). The grids in \Cref{fig:grid_311} and \Cref{fig:grid_321} are insufficiently dense to change the class of the image from $1$ to $0$. The final grid, sufficient to change the class, is in \Cref{fig:grid_330}.}
    \label{fig:grid_search}
\end{figure*}

\begin{figure*}[t]
    \centering
    \begin{subfigure}[b]{0.15\textwidth}
        \centering 
        \includegraphics[scale=0.3]{images/overlay/overlay_raw.png}
        \caption{class $0$}
        \label{fig:overlay_raw}
    \end{subfigure}
    \hfill
       \begin{subfigure}[b]{0.15\textwidth}
        \centering 
        \includegraphics[scale=0.3]{images/overlay/grid_2_3.png}
        \caption{absence grid}
        \label{fig:overlay_grid}
    \end{subfigure}
    \hfill
    \begin{subfigure}[b]{0.15\textwidth}
        \centering 
        \includegraphics[scale=0.3]{images/overlay/overlay1.png}
        \caption{excluded tumor}
        \label{fig:overlay1}
    \end{subfigure}
    \hfill
    \begin{subfigure}[b]{0.15\textwidth}
        \centering 
        \includegraphics[scale=0.3]{images/overlay/overlay2.png}
        \caption{excluded tumor}
        \label{fig:overlay2}
    \end{subfigure}
    \hfill
    \begin{subfigure}[b]{0.15\textwidth}
        \centering 
        \includegraphics[scale=0.3]{images/overlay/overlay3.png}
        \caption{excluded tumor}
        \label{fig:overlay3}
    \end{subfigure}
    \caption{The grid prevents an explanation of a tumor from fitting into the image. As a causal explanation is approximately minimal and is recognized as class $1$ by the model, this means that, modulo the dataset, no tumor can be present in the image. We cannot lose parts of the explanation to make it fit, as a smaller collection of pixels will no longer be recognized as tumor by the model.}
    \label{fig:overlay}
\end{figure*}


\begin{algorithm}[t]
  \caption{$\nito(x, \mathcal{N}, U, \delta, r, Pr)$}
  \label{algo:eoa}
  \begin{flushleft}
    \textbf{INPUT:}\,\, input image $x$, model $\mathcal{N}$, set of images $U$, density $\delta$, radius $r$, \emph{Pr} (a probability distribution over $U$)\\
    \textbf{OUTPUT:}\,\, a gridded image $x'$, a tuple ($\alpha$, $\beta$)
  \end{flushleft}
  \begin{algorithmic}[1]
    \setcounter{ALC@unique}{0}
    \STATE $\varphi \leftarrow \mathcal{N}(x)$
    \STATE $\K \leftarrow \text{neighborhood of} \, x \in U$
    \IF{$\K = \varnothing$}
        \RETURN $x, 1, 0$
    \ENDIF
    \STATE $\mathcal{E} \leftarrow \text{causal explanations of} \, \K$
    \STATE $e_{\mathcal{E}} \leftarrow \text{find smallest explanation} \in \mathcal{E}$
    \STATE\label{line:grid} $\text{grid} \leftarrow \text{calculate\_grid}(e_{\mathcal{E}}, \delta, r)$
    \IF{$\text{grid} = \varnothing$}
        \RETURN $x, 1, 0$
    \ENDIF
    \STATE $\beta \leftarrow 0.0$
    \FOR{$s \in \K$}
        \STATE $o \leftarrow \mathcal{N}(s)$
        \STATE $o' \leftarrow \mathcal{N}(grid(s))$
        \STATE $o \neq o' \, ? \,  : \beta = \beta + Pr(s)$
    \ENDFOR
    \RETURN $\text{grid}(x), (1, \beta)$
  \end{algorithmic}
\end{algorithm}

\Cref{algo:eoa} is the main \nito algorithm. The set $\U$ is the full dataset, containing scans from different slices of the organ under examination. 
For a given input $x$ (a single image), we define $\K$ as all scans \emph{similar} to $x$. The similarity can be defined parametrically; for this implementation,
we define it as images of the same slice, for example the same part of the brain for MRIs of brains. The probability distribution over $\K$ is a parameter
and is assumed uniform by default.
As the dataset grows with each new examined patient, the set $\U$ grows as well, with more similar scans to the current input.
In the future, the concept of similarity can be extended to include external parameters affecting the scans, such as biological sex, age, etc.
We note that if $\K$ is empty, we cannot say anything useful about the current input image $x$. 
In what follows, we assume class $0$ to mean ``no tumor'', and class $1$ to mean ``tumor''.


The algorithm first calculates an approximation of a smallest explanation \emph{for a tumor} in $\K$ 
by executing \rex (see \Cref{app:rex} for an overview of \rex).
Note that an explanation of an object is typically smaller than the object itself, representing just a part of it~\citep{CKKS24}: if an explanation of a tumor cannot be made to fit between the grid then the tumor itself certainly cannot. Note that we assume a reasonably regular shape of explanations: it 
is possible in theory to have tumors that fit neatly between the nodes of the grid, thus avoiding detection, while being overall quite large, however in practice
tumor shapes are reasonably close to convex.

\paragraph*{Size and color of the grid}\label{subsec:grid}

The procedure on line 8 of \Cref{algo:eoa}, $\mbox{calculate\_grid}(x, e_{\mathcal{E}}, \delta, r)$, receives the input image $x$, a smallest explanation 
$e_{\mathcal{E}}$ of a tumor in the set 
$\K$, and optionally the density $\delta$ and radius $r$, and constructs a grid with each node being of radius $r$ and the distance 
$\delta$ between the nodes over the image $x$.
If $\delta$ and $r$ are not given, the procedure calculates them using a binary search, constructing the \emph{least dense} grid
that satisfies \Cref{def:PEoA}. We assume convexity of explanations, hence the calculation of $\delta$ is based on the size of a minimal bounding box
for $e_{\mathcal{E}}$. The radius $r$ of each node is determined as the smallest that satisfies PAG2 of \Cref{def:PEoA} and is, again, determined using
a binary search.

We also allow the option of receiving $\delta$ and $r$ from the user, in case a user with domain knowledge is able to
provide hints to the algorithm. An example is shown in~\Cref{fig:grid_search}.
The grid pixel values should be the same as in $x$, but in practice this often does not provide enough contrast, due to the quality and color scheme
of the image. We therefore also allow the option of having out-of-distribution neutral values, and we compare these approaches
in~\Cref{sec:eval}.

\begin{figure*}[t]
    \centering
    \begin{subfigure}{0.2\textwidth}
        \centering 
        \includegraphics[scale=0.3]{images/example/TCGA_CS_5397_20010315_14.png}
        \caption{Healthy slice}
        \label{fig:alpha}
    \end{subfigure}
    \hfill
    \begin{subfigure}{0.2\textwidth}
        \centering 
        \includegraphics[scale=0.3]{images/example/TCGA_CS_5397_20010315_14_14_superimposed.png}
        \caption{Approximate location}
        \label{fig:alpha:a}
    \end{subfigure}
    \hfill
    \begin{subfigure}{0.2\textwidth}
        \centering 
        \includegraphics[scale=0.3]{images/example/TCGA_CS_5397_20010315_14_clip_hull.png}
        \caption{Initially calculated grid}
        \label{fig:alpha:b}
    \end{subfigure}
    \hfill
    \begin{subfigure}{0.2\textwidth}
        \centering
        \includegraphics[scale=0.3]{images/example/TCGA_DU_7298_19910324_14_mutant_no_4.png}
        \caption{$\neg$ flip 1}
        \label{fig:alpha:c}
    \end{subfigure}
    %%% NEXT LINE
   \begin{subfigure}{0.2\textwidth}
        \centering 
        \includegraphics[scale=0.3]{images/example/TCGA_CS_6665_20010817_14_mutant_no_19.png}
        \caption{Flip 1}
        \label{fig:alpha:d}
    \end{subfigure}
    \hfill
    \begin{subfigure}{0.2\textwidth}
        \centering 
        \includegraphics[scale=0.3]{images/example/TCGA_DU_A5TU_19980312_14_mutant_no_37.png}
        \caption{$\neg$ flip 2}
        \label{fig:alpha:e}
    \end{subfigure}
    \hfill
    \begin{subfigure}{0.2\textwidth}
        \centering 
        \includegraphics[scale=0.3]{images/example/TCGA_FG_5964_20010511_14_mutant_no_15.png}
        \caption{Flip 2}
        \label{fig:alpha:f}
    \end{subfigure}
    \hfill
    \begin{subfigure}{0.2\textwidth}
        \centering
        \includegraphics[scale=0.3]{images/example/TCGA_HT_7882_19970125_14_mutant_no_12.png}
        \caption{Flip 3}
        \label{fig:alpha:g}
    \end{subfigure}
    \caption{A example of a grid, approximate location of the explanation superimposed on the healthy brain (\Cref{fig:alpha:a}) and $\mathcal{K}$. $\K$ consists of~\Cref{fig:alpha,fig:alpha:c,fig:alpha:d,fig:alpha:e,fig:alpha:f,fig:alpha:g}. In this example, only~\Cref{fig:alpha} is in the set $(\vec{X} = \vec{x})\varphi \subseteq \mathcal{K}$, so $\alpha = 1.0$. Of the five slices where we apply the intervention (d - h), 3 change classification, so $\beta = \frac{3}{5}$ or $0.6$.}
    \label{fig:example}
\end{figure*}



\paragraph*{Calculating \texorpdfstring{$\alpha$}{alpha} and \texorpdfstring{$\beta$}{beta}}\label{app:alpha}
The probability that an image in $\K$ has both $\vec{X} = \vec{x} \land \varphi$ is given by $\alpha$. For simplicity, let us say that $\varphi$ means ``tumor''. $\vec{X} = \vec{x}$ then will be a set of pixels and their values. Even if we ignore the spatial dimension of of pixels, the chances of $\vec{X} = \vec{x}$ being the same in a different image for which $\varphi$ holds is very slim. Explanations are rarely identical between images. If we take into account the spatial dimension as well, then $\alpha$ is likely to be near $0$ on any dataset. If we are interested in $\vec{G} = \vec{g}$, our absence grid, then we can approximately control the value of $\alpha$ if either $\K$ does not contain any healthy slices (in which case $\alpha = 1$), or we use a neutral, constant, masking value for the grid. In either case, $\alpha$ does not reveal as much information about our grid as we would like. 

We present a simple visual example of a \betagood calculation (\Cref{fig:example}), with the absence grid only partially applied for clarity. Causal explanations, by virtue of their minimality, tend not to be robust. Hence, the explanation of the smallest tumor is itself a \emph{partial} explanation. Future work will examine the usefulness of explanation \emph{vs.} partial explanation of tumor on grid calculation from the point of view of the clinician.

\paragraph*{Quantitative evaluation of partial explanations}

The $\alpha$ value is the fraction of images in $\K$ classified as ``no tumor'' and for which $\vec{X} = \vec{x}$, represented as probability. 
In our experiments, there was only one healthy image per slice (the explanandum), 
thus $\alpha = 1$. We discuss general computation of $\alpha$ in~\Cref{app:alpha}. 
$\beta$ measures the effect of setting $\vec{G}$ to $\vec{g}$ in $\K$. For example, let $|\K| = 5$, 
where $\vec{G} = \vec{g}$ is an absence grid for $3$ out of all $5$ images. 
Assuming a uniform distribution over these images, we have $\beta = 0.6$, as $3$ images change their classification under $\vec{G} \leftarrow \vec{g}$. 

The definition of $\beta$ assumes equal weight for all elements in $\K$. However, given that $\cN$ is an AI model, we can weight the calculation by
the model's confidence in the classification. We consider two options for this weighting: $\beta_a$ denotes the parameter weighted by the confidence
over all classifications in $\K$ when $\vec{G} \leftarrow \vec{g}$, and $\beta_p$ considers only the confidence of images where changing
$\vec{G}$ to $\vec{g}$ does not change the classification (otherwise $1$).

\begin{figure*}[t]
    \centering
    \begin{subfigure}{0.3\textwidth}
        \centering 
        \includegraphics[scale=0.4]{images/interactive/fake.png}
        \caption{A class $0$ brain}
        \label{fig:inter1}
    \end{subfigure}
    \hfill
       \begin{subfigure}{0.3\textwidth}
        \centering 
        \includegraphics[scale=0.4]{images/interactive/fake1.png}
        \caption{A suspicious area}
        \label{fig:inter2}
    \end{subfigure}
    \hfill
    \begin{subfigure}{0.3\textwidth}
        \centering 
        \includegraphics[scale=0.4]{images/interactive/fake2.png}
        \caption{A local grid application}
        \label{fig:inter3}
    \end{subfigure}
    \caption{Suppose a clinician finds an area of a brain suspicious (\Cref{fig:inter2}). With the pre-calculated grid at the appropriate slice, the clinician can superimpose the grid over the area of interest. Here, the suspicious area sits is able to fit inside the grid, so it falls below the model's information requirements. This explains why the model gave class $0$, but does not necessarily indicate health in the patient.}
     \label{fig:interactive}
\end{figure*}

\paragraph*{Dialog with a clinician}
Given a stable, unchanging, dataset, the grid is entirely computable off-line. Changes to the dataset mean that the grid needs to be recomputed for the appropriate slices only. This is unlikely to occur during deployment.
As a result, \nito supports a dialog with a clinician in real time. 
\Cref{fig:interactive} illustrates the following scenario. An input MRI slice is classified as class $0$ by the model (\Cref{fig:inter1}) 
but with relatively low confidence. A clinician might choose this slice for closer examination. There is an area, highlighted in red (\Cref{fig:inter2}),
of slightly increased density. The clinician can take the grid for the appropriate slice and superimpose it over the suspicious area. The suspicious area fits reasonably neatly inside the grid (\Cref{fig:inter3}). As the grid was calculated from the smallest explanation in the dataset at that slice, this indicates that, from the model's perspective, there is no evidence of a tumor present. Of course, a clinician may disagree, in which case there is an argument for retraining or refining the model by adding this image to the training data.