\section{Proofs}\label{app:proofs}

\subsection{Lemma~\ref{lemma:disjointrelevant}}\label{proof:disjointrelevant}
\paragraph{\Cref{lemma:disjointrelevant} (Disjoint Relevant).}
  Let $\scm{H}$ be a $\mat{T}$-abstraction of $\scm{L}$,
  where $\scm{H}$ and $\scm{L}$
  are two linear SCMs
  respectively on variables $\set{Y}$ and $\set{X}$.
  Then,
  for any pair of distinct abstract variables $Y_1, Y_2\in\set{Y}$,
  it holds that $\Pi_R(Y_1)\cap\Pi_R(Y_2) = \emptyset$,
  where $\Pi_R(Y_1) \neq \emptyset$ and $\Pi_R(Y_2) \neq \emptyset$.
\begin{proof}
  Firstly,
  we show that
  given an abstract intervention ${j = (Y_1 \gets k)}$
  on $Y_1$,
  any concrete intervention $i$
  such that $\omega(i) = j$
  must fix all relevant variables~$\rel{Y_1}$.
  Otherwise,
  if we assume the existence
  of a non-intervened variable $X_s\in\rel{Y_1}$,
  the function $\scm{L}^i_{\rel{Y_1}}$
  would be non-constant.
  Therefore,
  since
  $\tau_{Y_1}$ depends on $X_s$
  by definition of relevant variable,
  interventional consistency would not hold,
  as in
  \begin{align}
    \tau_{Y_1} \circ \scm{L}^i_{\Pi_R(Y_1)}     
    \neq
    \scm{H}^j_{Y_1} \circ \gamma
    = k.
  \end{align}
  Therefore,
  for any abstract intervention~$j=(Y_1 \gets k)$,
  the corresponding concrete interventions
  must have form
  \begin{align}
    i = (\Pi_R(Y_1) \gets \vec{v}),
  \end{align}
  for any vector $\vec{v}$ such that $\tau_{Y_1}(\vec{v}) = k$,
  without intervening on further relevant variables.

  We first
  prove \Cref{lemma:disjointrelevant}
  whenever $Y_1 \centernot\anc Y_2$.
  To this end,
  we assume by contradiction the existence
  of a non-empty subset $\set{V} = \Pi_R(Y_1) \cap \Pi_R(Y_2)$
  of shared variables.
  Since $Y_1$ has no causal effect on $Y_2$,
  given a high-level intervention
  ${j=(Y_1 \gets k)}$,
  it must hold that
  \begin{align}
      \scm{H}^j_{Y_2} = \scm{H}_{Y_2}.
  \end{align}
  However, by intervening on $Y_1$,
  any concretization must also fix $\set{V}$.
  Therefore, we prove the property by contradiction, as
  \begin{align}
    \scm{H}^j_{Y_2} \circ \gamma &=
    \tau_{Y_2} \circ \scm{L}^i_{\Pi_R(Y_2)} \\
    & \neq \tau_{Y_2} \circ \scm{L}_{\Pi_R(Y_2)} \\
    &= \scm{H}_{Y_2} \circ \gamma\\
    &\implies 
    \scm{H}^j_{Y_2} \neq \scm{H}_{Y_2},
  \end{align}
  given the surjectivity of $\gamma$
  and the lack of cancelling paths.

  Finally, we can tackle the last scenario,
  where $Y_1 \anc Y_2$,
  by showing that $\Pi_R(Y) \cap \Pi_R(\an{Y}) = \emptyset$,
  where $\an{Y}$ is the set of ancestors of $Y$.
  Given the model acyclicity,
  for any abstract intervention~$j=(Y\gets k)$,
  it must hold
  \begin{align}
      \scm{H}^j_{\an{Y}} = \scm{H}_{\an{Y}}.
  \end{align}
  However,
  if the relevant variables of $Y$
  were to overlap
  with the relevant variables of its ancestors,
  we could show that
  \begin{align}
    \scm{H}^j_{\an{Y}} \circ \gamma
    &= \tau_{\an{Y}} \circ \scm{L}^i_{\Pi_R(\an{Y})} \\
    &\neq \tau_{\an{Y}} \circ \scm{L}_{\Pi_R(\an{Y})} \\
    &= \scm{H}_{\an{Y}} \circ \gamma\\
    &\implies 
    \scm{H}^j_{\an{Y}} \neq \scm{H}_{\an{Y}}.
  \end{align}
  Therefore,
  since interventional consistency does not hold,
  $\scm{H}$ is not a $\mat{T}$-abstraction of $\scm{L}$,
  which contradicts the hypothesis
  and concludes the proof.
\end{proof}

\subsection{Corollary~\ref{cor:constructive}}\label{proof:constructive}
\paragraph{\Cref{cor:constructive} (Constructive Abstraction).}
    Let $\scm{H}$
    be a strong $\tau$-abstraction
    of $\scm{L}$ where
    $\scm{H}$ and $\scm{L}$ are linear SCMs
    and
    $\tau$ is a linear transformation.
    Then,
    $\scm{H}$ is a constructive $\tau$-abstraction
    of $\scm{L}$.
\begin{proof}
    By definition of linear transformation,
    the set of low-level variables
    on which an abstract variable~$Y\in\set{Y}$
    depends through the linear abstraction function~$\tau$
    coincides with its
    set of relevant variables~$\rel{Y}\subseteq\set{X}$.
    Therefore,
    by showing
    that the relevant sets are disjoint
    whenever the SCMs $\scm{H}$ and $\scm{L}$
    are linear,
    a $\mat{T}$-abstraction on linear SCMs
    is also a constructive abstraction.
    By definition of $\mat{T}$-abstraction,
    this is equivalent
    to stating that
    a linear $\tau$-abstraction
    on linear SCMs
    is a constructive abstraction
    under our assumption
    on the absence of cancelling paths.
\end{proof}

\subsection{Lemma~\ref{lemma:sufcon}}\label{proof:sufcon}
\paragraph{\Cref{lemma:sufcon} (Sufficient Directed Paths)}
  Let $\scm{H}$ be a $\mat{T}$-abstraction of $\scm{L}$,
  where $\scm{H}$ and $\scm{L}$
  are two linear SCMs
  respectively on variables $\set{Y}$ and $\set{X}$ with graphs $\mathcal{G}_\scm{H}$ and $\mathcal{G}_\scm{L}$.
  Then, 
  for any pair
  of relevant variables $X_1,X_2\in\Pi_R(\set{Y})$,
  such that
  $X_1\in\Pi_R(Y_1)$
  and
  $X_2\in\Pi_R(Y_2)$
  with $Y_1 \neq Y_2 \in \set{Y}$,
  it holds
  \begin{align}
    X_1 \taudirect X_2 \ \ \mathrm{in} \ \mathcal{G}_\scm{L}
    \implies
    Y_1 \to Y_2 \ \ \mathrm{in} \ \mathcal{G}_\scm{H}.
  \end{align}
\begin{proof}
  Let $Y_1, Y_2$ be two distinct abstract variables
  and
  let $i,i'$
  be two concrete interventions
  that fix every \emph{relevant} variable
  except for those in the relevant set $\Pi_R(Y_2)$,
  and
  whose assignments differ only in $X_1\in\Pi_R(Y_1)$.
  Formally,
  \begin{align}
  i &= (\set{V} \gets \vec{v},\,\Pi_R(Y_1) \gets \vec{c})\\
  i' &= (\set{V} \gets \vec{v},\,\Pi_R(Y_1) \gets \vec{c}'),
  \end{align}
  where
  \begin{align}
      \set{V}
      &=
      \bigcup_{Y \in \set{Y} \setminus \{Y_1, Y_2\}} \Pi_R(Y).
  \end{align}
  Given $X_1 \taudirect X_2$,
  there exists at least one directed path
  composed only of non-relevant variables,
  that are therefore non-intervened.
  Consequently,
  due to the \emph{faithfulness} assumption,
  the concrete model does not have cancelling paths
  and, therefore,
  an intervention on a variable
  always has an effect on its descendants.
  In particular,
  since $i,i'$ constrain $X_1$
  to two different values,
  it holds that
  \begin{align}
      \scm{L}^i_{X_2} &\neq \scm{L}^{i'}_{X_2}\\
      \tau_{Y_2}\circ\scm{L}^i &\neq \tau_{Y_2}\circ\scm{L}^{i'}\\
      \scm{H}^j_{Y_2} \circ \gamma &\neq \scm{H}^{j'}_{Y_2} \circ \gamma,
  \end{align}
  where, given the intervention map,
  the concrete interventions
  correspond
  to the following
  abstract interventions
  \begin{align}
  j &=
  ( \set{Y} \setminus \{Y_1, Y_2\} \gets \tau(\vec{v}), Y_1 \gets \tau_{Y_1}(\vec{c}))\\
  j' &=
  ( \set{Y} \setminus \{Y_1, Y_2\} \gets \tau(\vec{v}), Y_1 \gets \tau_{Y_1}(\vec{c}')).
  \end{align}
  Therefore,
  due to
  the surjectivity of $\gamma$,
  it also holds
  \begin{align}
      \scm{H}^j_{Y_2} \neq \scm{H}^{j'}_{Y_2}.
  \end{align}
  Consequently,
  since $j$ and $j'$
  differ only in $Y_1$
  and fix everything but $Y_2$,
  $Y_1$ has a direct effect on $Y_2$,
  i.e., $Y_1 \to Y_2$.
\end{proof}

\subsection{Corollary~\ref{lemma:corollarysufcon}}\label{proof:corollarysufcon}
\paragraph{\Cref{lemma:corollarysufcon} (Sufficient Directed Paths)}
  Let $\scm{H}$ be a $\mat{T}$-abstraction of $\scm{L}$,
  where $\scm{H}$ and $\scm{L}$
  are two linear SCMs
  respectively on variables $\set{Y}$ and $\set{X}$ with graphs $\mathcal{G}_\scm{H}$ and $\mathcal{G}_\scm{L}$.
  Then, 
  for any pair
  of relevant variables $X_1,X_2\in\Pi_R(\set{Y})$,
  such that
  $X_1\in\Pi_R(Y_1)$
  and
  $X_2\in\Pi_R(Y_2)$
  with $Y_1 \neq Y_2 \in \set{Y}$,
  it holds that
  \begin{align}
    X_1 \anc X_2 \ \ \mathrm{in} \ \mathcal{G}_\scm{L}
    \implies
    Y_1 \anc Y_2 \ \ \mathrm{in} \ \mathcal{G}_\scm{H}.
  \end{align}
\begin{proof}
   Given \Cref{lemma:sufcon},
   whenever there exists a $\mat{T}$-direct
   path between relevant variables $X_1\in\rel{Y_1}$
   and $X_2\in\rel{Y_2}$
   there must exist an abstract
   edge $Y_1 \to Y_2$.
   However, if the path is not $\mat{T}$-direct,
   then there must exist
   some relevant variable $X_3\in\rel{Y_3}$
   for another abstract variable $Y_3$ along the path.
   We firstly
   consider the case where $Y_3 \neq Y_1$ and $Y_3 \neq Y_2$.
   Consequently,
   there must exist an edge $Y_1 \to Y_3$ and,
   by applying the same argument on the path $X_3 \anc X_2$,
   the corollary holds for $Y_1 \anc Y_2$.
   Due to the acyclicity of the abstract graph,
   the case where $Y_3 = Y_1$ or $Y_3 = Y_2$
   can arise only at the beginning (resp.\ the end) of the path.
   In this case,
   we could consider the successive variable
   until we get one different from $Y_1, Y_2$, if any.
   If there is none, then there exists a $\mat{T}$-direct path between the relevant variables of $Y_1, Y_2$ and we fall back to the scenario of \Cref{lemma:sufcon},
   which directly entails $Y_1 \anc Y_2$.
\end{proof}

\subsection{Example~\ref{ex:faithfulness}}\label{proof:faithfulness}
\paragraph{\Cref{ex:faithfulness} (Unfaithful Concrete Model)}
\begin{proof}
To prove $\mat{T}$-abstraction
of the example, we anticipate
the parametrical characterization
of linear abstraction
which we introduce in \Cref{subsec:weightconc}.
In particular,
given the adjacencies
of the model,
\begin{align}
    \mat{W} &= \begin{bmatrix}
      0 & 1 & -1 & 0 & 1\\
      0 & 0 & 0 & 1 & 0\\
      0 & 0 & 0 & 1 & 0\\
      0 & 0 & 0 & 0 & 1\\
      0 & 0 & 0 & 0 & 0
    \end{bmatrix}\\
    \mat{M} &= \begin{bmatrix}
      0 & 0 & 1\\
      0 & 0 & 1\\
      0 & 0 & 0
    \end{bmatrix}
\end{align}
the necessary form for
the exogenous abstraction function,
which we will introduce in \Cref{lemma:exoabs},
is
\begin{align}
    \mat{S} = \begin{bmatrix}
      1 & 0& 0\\
      0 & 1& 0\\
      0 & 1& 0\\
      0 & 1& 0\\
      0 & 0& 1
    \end{bmatrix}.
\end{align}
Consequently,
we can prove abstraction by showing that
for any $Y_i, Y_j$
it holds that
\begin{align}
    \mat{W}_{ij}\vec{s}_j = m_{ij} \vec{t}_i.
\end{align}
For this example,
of particular interest is the case $Y_1 \to Y_2$,
where it holds that
\begin{align}
    \mat{W}_{1,2}\vec{s}_2 &= m_{1,2} \vec{t}_1\\
    \begin{bmatrix}
       1 & -1 & 0 
    \end{bmatrix}    
    \begin{bmatrix}
       1\\
       1\\
       1\\
    \end{bmatrix}    
    &=
    0 \cdot \begin{bmatrix}1\end{bmatrix}\\
    0 &= 0,
\end{align}
and thus $\scm{H}$ $\mat{T}$-abstracts $\scm{L}$.
\end{proof}

\subsection{Theorem~\ref{theo:connectivity}}\label{proof:connectivity}
\paragraph{\Cref{theo:connectivity} (Abstract Connectivity)}
  Let $\scm{H}$ be a $\mat{T}$-abstraction of $\scm{L}$,
  where $\scm{H}$ and $\scm{L}$
  are two linear SCMs
  respectively on variables $\set{Y}$ and $\set{X}$ with graphs $\mathcal{G}_\scm{H}$ and $\mathcal{G}_\scm{L}$.
  Then,
  there exists an edge ${Y_1 \to Y_2}$ in $\mathcal{G}_\scm{H}$
  if and only if
  for each $X_1\in\Pi_R(Y_1)$
  there exists $X_2\in\Pi_R(Y_2)$
  such that $X_1 \taudirect X_2$ in $\mathcal{G}_\scm{L}$.
\begin{proof}
  The sufficient condition follows immediately from \Cref{lemma:sufcon}, where we already proved that any $\mat{T}$-direct path between relevant variables entails an abstract edge.
  
  To prove the necessary condition,
  we consider instead two abstract interventions $j,j'$
  which differ only in $Y_1$
  and fix everything but $Y_2$.
  Formally,
  \begin{align}
     j  &= (Y_1 \gets k, \set{V} \gets \vec{v})\\
     j' &= (Y_1 \gets k', \set{V} \gets \vec{v}),
  \end{align}
  where $\set{V} = \set{Y} \setminus \{Y_1, Y_2\}$.
  Consequently,
  since $Y_1$ has a direct linear effect on $Y_2$,
  it holds that 
  \begin{align}\label{eq:proofnecessary}
      \scm{H}^j_{Y_2} &\neq \scm{H}^{j'}_{Y_2}\\
      \scm{H}^j_{Y_2} \circ \gamma &\neq \scm{H}^{j'}_{Y_2} \circ \gamma\\
     \tau_{Y_2} \circ \scm{L}^i &\neq \tau_{Y_2} \circ \scm{L}^{i'},
  \end{align}
  for any intervention $i, i'$ such that $\omega(i)=j$ and $\omega(i')=j'$.

  Let now $X_1 \in \Pi_R(Y_1)$
  be a relevant concrete variable
  for $Y_1$, and $t_{11}$ be the non-zero coefficient
  from $X_1$ to $Y_1$
  in the linear abstraction transformation~$\mat{T}$.
  We can then build two concrete interventions $i,i'$
  by setting all relevant variables of $Y_1$
  to zero, except for $X_1$.
  Formally,
  the interventions have the following form
  \begin{align}
      i &= (X_1 \gets \frac{k}{t_{11}},\, \Pi_R(Y_1) \setminus \{X_1\} \gets \vec{0},\, \ldots)\\
      i' &= (X_1 \gets \frac{k'}{t_{11}},\, \Pi_R(Y_1) \setminus \{X_1\} \gets \vec{0},\, \ldots).
  \end{align}
  If we suppose that
  there does not exist a variable $X_2\in\Pi_R(Y_2)$
  such that $X_1 \taudirect X_2$,
  all directed paths $X_1 \anc X_2$, if any,
  are mediated by a relevant variable
  of some abstract variable $Y\in \set{Y}\setminus \{Y_2\}$.
  Consequently, given our construction of $j,j'$
  and consequently $i,i'$,
  any path is mediated by an intervened variable
  and, therefore, it holds
  \begin{align}
     \tau_{Y_2} \circ \scm{L}^i = \tau_{Y_2} \circ \scm{L}^{i'},
  \end{align}
  which however breaks interventional consistency
  and implies that $\scm{H}$ is not
  a $\mat{T}$-abstraction of $\scm{L}$,
  proving the necessary condition by contradiction.
\end{proof}

\subsection{Corollary~\ref{cor:necessary}}\label{proof:necessary}
\paragraph{\Cref{cor:necessary} (Connectivity Violation)}
  Let $\scm{H}$ and $\scm{L}$
  be two linear SCMs
  respectively on variables $\set{Y}$ and $\set{X}$ with graphs $\mathcal{G}_\scm{H}$ and $\mathcal{G}_\scm{L}$. Consider a linear transformation~$\mat{T}$ between them leading to the sets of relevant variables $\Pi_R(\set{Y})$.
  If there exist three variables
  $X_1\in\Pi_R(Y_1)$,
  $X_2\in\Pi_R(Y_2)$, and
  $X_3\in\Pi_R(Y_1)$,
  such that
  both conditions hold
\begin{itemize}
    \item%
      $X_1 \taudirect X_2$
      in $\mathcal{G}_\scm{L}$, and
    \item%
      for any $X_4 \in \Pi_R(Y_2)$,
      $X_3 \centernot\taudirect X_4$
      in $\mathcal{G}_\scm{L}$,
\end{itemize}
    then $\scm{H}$ is not a $\mat{T}$-abstraction of $\scm{L}$.
\begin{proof}
Follows directly from \Cref{lemma:sufcon} which applied to the first item implies that $Y_1 \to Y_2$, and from \Cref{theo:connectivity}, which applied to the second item implies that $Y_1 \not \to Y_2$, hence providing a contradiction to the assumption that $\scm{H}$ is a $\mat{T}$-abstraction of $\scm{L}$.
\end{proof}

\subsection{Corollary~\ref{cor:exogabs}}\label{proof:exogabs}
\paragraph{\Cref{cor:exogabs} (Exogenous Abstraction)}
  Let $\scm{H}=(\set{Y},\set{U},\set{g},\dist{P}_{\set{U}})$ be a {$\mat{T}$-abstraction} of 
  $\scm{L}=(\set{X},\set{E},\set{f},\dist{P}_{\set{E}})$,
  where $\scm{H}$ and $\scm{L}$
  are two linear SCMs.
  Then, the exogenous abstraction function
  $\gamma\colon\dom{\set{E}}\to\dom{\set{U}}$,
  has form
  \begin{align}
      \gamma(\vec{e}) = \mat{S}^\tr \vec{e},
  \end{align}
  where $\mat{S} = \mat{F} \mat{T}\mat{G}^\inv$
  and $\mat{F}, \mat{G}$
  are
  the linear
  transformations
  of
  respectively
  the reduced forms of $\scm{L}$ and $\scm{H}$, i.e., $\scm{L}(\vec{e}) = \mat{F}^\tr \vec{e}$ and $\scm{H}(\vec{u}) = \mat{G}^\tr \vec{u}$.
\begin{proof}
    Since $\scm{H}$ $\mat{T}$-abstracts $\scm{L}$,
    it must hold $\tau\circ\scm{L}=\scm{H}\circ\gamma$.
    Consequently, due to the invertibility
    of the reduced form $\scm{H}$
    of linear SCMs, it holds that
    \begin{align}
        \gamma = \scm{H}^\inv\circ\tau\circ\scm{L}.
    \end{align}
    Since $\scm{L}$, $\tau$, and $\scm{H}^\inv$
    are linear transformations,
    their composition coincides
    with a linear transformation
    $\mat{S}=\mat{F}\mat{T}\mat{G}^\inv$.
\end{proof}

\subsection{Lemma~\ref{lemma:blockordering}}\label{proof:blockordering}
\paragraph{\Cref{lemma:blockordering} (Block Composition)}
  Let $\scm{H}$ be a $\mat{T}$-abstraction of $\scm{L}$,
  where $\scm{H}$ and $\scm{L}$
  are two linear SCMs
  respectively on variables $\set{Y}$ and $\set{X}$.
  Then,
  for any abstract variable $Y\in\set{Y}$,
  it holds
  $X\in\Pi(Y)$ if and only if
  \begin{itemize}
      \item $X\in\Pi_R(Y)$, or
      \item  $X \not \in \Pi_R(\set{Y})$, i.e., $X$ is irrelevant, and there exists $X'\in\Pi_R(Y)$ s.t. $X \taudirect X'$.
  \end{itemize}
\begin{proof}
  Let $Y$ be an abstract variable
  and ${j = (\pa{Y} \gets \vec{k})}$
  be a hard intervention
  fixing all of its endogenous parents.
  Consequently,
  the value of the abstract variable,
  $\scm{H}^j_Y(\vec{u})$ depends only
  on its exogenous term $U_Y$.
  Further,
  given the definition of concrete block,
  the formulation
  \begin{align}
  \scm{H}^j_Y(\gamma(\vec{e})) &=
  \scm{H}^j_Y(\mat{S}^\tr \vec{e}),
  \end{align}
  depends only on the exogenous
  terms $\vec{e}_{\Pi(Y)}$.
  Therefore, given the interventional consistency property
  \begin{align}
  \scm{H}^j_Y(\gamma(\vec{e})) &= \tau_Y(\scm{L}^i_{\Pi_R(Y)}(\vec{e})),
  \end{align}
  and the lack of cancelling paths,
  $\scm{L}^i_{\Pi_R(Y)}$
  also depends only on the exogenous terms $\vec{e}_{\Pi(Y)}$,
  for any concrete intervention
  \begin{align}
    i = (\Pi_R(\pa{Y}) \gets \vec{c}),
  \end{align}
  where $\tau_{\pa{Y}}(\vec{c}) = \vec{k}$.
  Notably,
  given the intervention $i$,
  the structural mechanisms of $\Pi_R(Y)$
  depend only on the exogenous noise
  of the relevant variables
  and on those variables
  whose direct path
  is non-mediated by another relevant variable.
  Given \Cref{lemma:sufcon},
  any of such relevant variables
  must be in the relevant set of a parent,
  and thus be constrained by the intervention $i$.
  Consequently,
  $\scm{L}^i_{\Pi_R(Y)}$
  depends only on its relevant variables
  and the \emph{irrelevant} variables
  with a $\mat{T}$-direct path
  towards the former.
\end{proof}

\subsection{Lemma~\ref{lemma:disjointconstitutive}}\label{proof:disjointconstitutive}
\paragraph{\Cref{lemma:disjointconstitutive} (Disjoint Block)}
  Let $\scm{H}$ be a $\mat{T}$-abstraction of $\scm{L}$,
  where $\scm{H}$ and $\scm{L}$
  are two linear SCMs
  respectively on variables $\set{Y}$ and $\set{X}$.
  If there exist two distinct endogenous variables $Y_1, Y_2$
  such that $\Pi(Y_1) \cap \Pi(Y_2) \neq \emptyset$, then 
  the abstract model is not causally sufficient.
\begin{proof}
  By definition of concrete block~(\Cref{def:block}),
  each abstract exogenous term $U_Y$
  is a function $\gamma$
  of the noise terms of the block $\Pi(Y)$.
  Therefore,
  given two variables $Y_1, Y_2\in\set{Y}$,
  we can write
  \begin{align}
  U_1 &= \gamma_{1} ( E_{\Pi(Y_1)})\\
  U_2 &= \gamma_{2} ( E_{\Pi(Y_2)}).
  \end{align}
  Therefore, 
  whenever the blocks share
  a subset of variables ${\set{S}} = \Pi(Y_1) \cap \Pi(Y_2)$,
  both $U_1$ and $U_2$
  are a function of the exogenous terms
  \begin{align}
    \set{V} =
    \{ E_X \in \set{E}
    \mid X \in \set{S}\}.
  \end{align}
  Consequently,
  the exogenous terms $U_1, U_2$
  are not independent and
  the variables $Y_1, Y_2$
  are then confounded.
\end{proof}

\subsection{Theorem~\ref{theorem:absord}}\label{proof:absord}
\paragraph{\Cref{theorem:absord} (Block Ordering)}
  Let $\scm{H}$ be a $\mat{T}$-abstraction of $\scm{L}$,
  where $\scm{H}$ and $\scm{L}$
  are two linear SCMs
  respectively on variables $\set{Y}$ and $\set{X}$ with graphs $\mathcal{G}_\scm{H}$ and $\mathcal{G}_\scm{L}$.
  Then,
  for any valid topological ordering $\prec_{\scm{H}}$ of $\mathcal{G}_\scm{H}$
  there exists a valid ordering $\prec_{\scm{L}}$ of $\mathcal{G}_\scm{L}$
  such that
  for any $Y_1, Y_2, Y \in \set{Y}$:
  \begin{itemize}
      \item%
      $Y_1 \prec_{\scm{H}} Y_2 \iff
      \Pi(Y_1) \prec_{\scm{L}} \Pi(Y_2)$, and
      \item%
      $\Pi(Y) \prec_{\scm{L}} \big( \set{X} \setminus \Pi (\set{Y}) \big). %
        $
  \end{itemize}
\begin{proof}

Firstly, we recall
that in a valid topological order,
a variable precedes another
whenever
there is a directed path
from the former to the latter~\citep{bondy_graph_2008}, i.e.,
\begin{align}
    X_1 \anc X_2 &\implies X_1 \prec X_2.
\end{align}
Since we always compare abstract variables
with abstract variables
and concrete variables with concrete variables,
in the following
we ease the notation
by avoiding the subscript on the precedence operator~$\prec$.

We show the existence
of a valid topological ordering
on the concrete model by construction.
Given the topological ordering on the abstract model,
we assign to each abstract node~$Y\in\set{Y}$
an integer $\rho_{\set{Y}}(Y) \in \{1, \ldots, |\set{Y}|\}$
such that
\begin{align}
    Y_1 \prec Y_2 \iff \rho_{\set{Y}}(Y_1) < \rho_{\set{Y}}(Y_2).
\end{align}
Then, we can take any valid topological
ordering within any concrete block $\Pi(Y)$
and assign in the same way $\rho_{\Pi(Y)}(X)$
for any
$Y\in\set{Y}$
and
$X\in\Pi(Y)$.
We do the same
for the set~$\set{Q}$
of concrete variables
outside of any block,
which we formally define as follows
\begin{align}
    \set{Q} = \set{X} \setminus \bigcup_{Y\in\set{Y}} \Pi(Y).
\end{align}
We then assign
the ``position''
of each
concrete variable $X\in\set{X}$
through a further integer
defined as follows,
\begin{align}
    \rho_{\set{X}}(X) = \begin{cases}
        \sum_{Y' \prec Y} |\Pi(Y')| + \rho_{\Pi(Y)}(X)
        & \exists Y .\, X \in \Pi(Y)\\
        \sum_{Y \in\set{Y}} |\Pi(Y)| + \rho_{\set{Q}}(X)
        & X \in \set{Q}.
    \end{cases}
\end{align}
Notably, since the blocks do not overlap (\Cref{lemma:disjointconstitutive}),
the assignment is unique.
We finally define the concrete topological ordering
for any $X_1, X_2 \in\set{X}$ as
\begin{align}
  X_1 \prec X_2 \iff \rho_{\set{X}}(X_1) < \rho_{\set{X}}(X_2).  
\end{align}

Given this ordering, it holds by construction that
\begin{align}
  \forall Y_1, Y_2 \in \set{Y}.\, 
  Y_1 \prec_{\scm{H}} Y_2 \iff
  \Pi(Y_1) \prec_{\scm{L}} \Pi(Y_2)\\
  \forall Y \in \set{Y}.\,
    \Pi(Y) \prec_{\scm{L}} \{X\in\set{X} \mid X \notin \bigcup_{Y\in\set{Y}} \Pi(Y)\}.
\end{align}
Therefore,
to finally prove the Theorem we have to show
that the ordering we defined is valid for the concrete graph.
Formally,
we have to show that, for any $X_1, X_2\in\set{X}$,
\begin{align}
    X_1 \to X_2 &\implies X_1 \prec X_2\\
                &\implies \rho_{\set{X}}(X_1) < \rho_{\set{X}}(X_2).
\end{align}
\textit{Case $\{X_1, X_2\} \subset\Pi(Y) \lor \{X_1, X_2\}\subset\set{Q}$.}
Whenever $X_1 \to X_2$ and $X_1, X_2$ are in the same block $\Pi(Y)$
for some $Y\in\set{Y}$ or are both in $\set{Q}$,
then $\rho_{\set{X}}(X_1) < \rho_{\set{X}}(X_2)$
by definition.\\
\textit{Case $X_1\in\Pi(Y_1), X_2\in\set{Q}$.}
Also holds by definition.\\
\textit{Case $X_1\in\set{Q}, X_2\in\Pi(Y)$.}
By definition of block,
this case never occurs,
since otherwise $X_1$ would be in $\Pi(Y)$ (\Cref{lemma:blockordering}).\\
\textit{Case $X_1\in\Pi(Y_1), X_2\in\Pi(Y_2)$.}
Further,
whenever $X_1 \to X_2$ such that $X_1\in\Pi(Y_1)$
for some $Y_1$ and $X_2\in\Pi(Y_2)$ for some $Y_2$,
then $X_1$ is relevant, otherwise it would have also been
in the block $\Pi(Y_2)$, whereas blocks are necessarily disjoint (\Cref{lemma:disjointconstitutive}).
Therefore, given the sufficient condition
on the existence of an abstract edge (\Cref{lemma:sufcon}),
it must hold
\begin{align}
Y_1 &\to Y_2 \\
\implies Y_1 &\prec Y_2 \\
\implies \Pi(Y_1) &\prec \Pi(Y_2) \\
\implies X_1 &\prec X_2.
\end{align}
\end{proof}

\subsection{Lemma~\ref{lemma:ignvar}}\label{proof:ignvar}
\paragraph{\Cref{lemma:ignvar} (Submodel Abstraction)}
  Let $\scm{H}$ and $\scm{L}$
  be two linear SCMs
  respectively on variables $\set{Y}$ and $\set{X}$.
  Then,
  $\scm{H}$ is a $\mat{T}$-abstraction of $\scm{L}$
  if and only if
  $\scm{H}$ is a $\mat{T}$-abstraction of $\scm{L}^\prime$,
  where $\scm{L}^\prime$ is a submodel of $\scm{L}$
  defined on the subset of variables
  $\set{X}^\prime = \Pi(\set{Y})$, i.e., all of the variables in the concrete blocks.
\begin{proof}
    The Lemma directly follows from \Cref{theorem:absord},
    where the variables not in any block
    always follow the remaining variables
    in the topological ordering. Therefore, by removing them,
    for any intervention $i$
    the interventional consistency
    $\tau \circ \scm{L}'^i  = \tau \circ \scm{L}^i$
    still holds
    since they do not influence any relevant variable, hence the abstraction function~$\tau$, nor any block, hence the exogenous abstraction function~$\gamma$.
    Similarly, we could add as many variables
    and mechanisms not influencing the blocks
    and interventional consistency would still hold. 
\end{proof}

\subsection{Lemma~\ref{lemma:exoabs}}\label{proof:exoabs}
\paragraph{\Cref{lemma:exoabs} (Exogenous Abstraction)}
  Let $\scm{H}=(\set{Y}, \set{U}, \mat{M},  \dist{P}_{\set{U}})$
  and $\scm{L}=(\set{X},  \set{E}, \mat{W}, \dist{P}_{\set{E}})$
  be two linear SCMs
  such that $\scm{H}$
  is a $\mat{T}$-abstraction
  of $\scm{L}$, such that $\mat{W}$ follows permutation $\pi_{\scm{H}}$.
  Then, the exogenous abstraction function $\gamma\colon\dom{\set{E}}\to\dom{\set{U}}$
  is unique and
  has form ${\gamma(\vec{e}) = \mat{S}^\tr \vec{e}}$
  for a linear transformation ${\mat{S}\in\real^{d \times b}}$
  defined as the upper-diagonal block matrix
  \begin{align}
    \mat{S} = \begin{bmatrix}
      \vec{s}_1 & \mat{0} & \cdots & \mat{0} \\
      \mat{0} & \vec{s}_2 & \cdots & \mat{0} \\
      \vdots & \vdots & \ddots & \vdots \\
      \mat{0} & \mat{0} & \cdots & \vec{s}_b
    \end{bmatrix},
  \end{align}
  where
  $\vec{s}_k = \mat{F}_{kk} \vec{t}_k = {(\mat{I} - \mat{W}_{kk})}^\inv\vec{t}_k$
  for any $Y_k\in\set{Y}$.%
\begin{proof}
  Given the definition of $\mat{T}$-abstraction,
  we can rephrase observational consistency as
  \begin{align}
    \tau \circ \scm{L} &= \scm{H} \circ \gamma\\
    \mat{FT} &= \mat{SG}
  \end{align}
  where $\mat{F}$ and $\mat{G}$
  are respectively the reduced
  forms of the concrete and the abstract SCM\@.
  Consequently,
  by exploiting the block-definition of $\mat{T}$,
  we can reformulate the left side of the equation as
  \begin{align}
    \begin{bmatrix}
      \mat{F}_{11} & \mat{F}_{12} & \cdots & \mat{F}_{1b} \\
      \mat{0} & \mat{F}_{22} & \cdots & \mat{F}_{2b} \\
      \vdots & \vdots & \ddots & \vdots \\
      \mat{0} & \mat{0} & \cdots & \mat{F}_{bb}
    \end{bmatrix}
    \begin{bmatrix}
      \vec{t}_1 & \vec{0} & \cdots & \vec{0} \\
      \vec{0} & \vec{t}_2 & \cdots & \vec{0} \\
      \vdots & \vdots & \ddots & \vdots \\
      \vec{0} & \vec{0} & \cdots & \vec{t}_b
    \end{bmatrix}\\
    =\begin{bmatrix}
      \mat{F}_{11}\vec{t}_1 & \mat{F}_{12}\vec{t}_2 & \cdots & \mat{F}_{1b}\vec{t}_b \\
      \mat{0} & \mat{F}_{22}\vec{t}_2 & \cdots & \mat{F}_{2b}\vec{t}_b \\
      \vdots & \vdots & \ddots & \vdots \\
      \mat{0} & \mat{0} & \cdots & \mat{F}_{bb}\vec{t}_b
    \end{bmatrix}
  \end{align}
  Given that
  block variables are not shared (\Cref{lemma:disjointconstitutive})
  and follow the same topological order of $\mat{T}$,
  the exogenous transformation must also have form
  \begin{align}
    \mat{S} = \begin{bmatrix}
      \vec{s}_1 & \mat{0} & \cdots & \mat{0} \\
      \mat{0} & \vec{s}_2 & \cdots & \mat{0} \\
      \vdots & \vdots & \ddots & \vdots \\
      \mat{0} & \mat{0} & \cdots & \vec{s}_b
    \end{bmatrix}.
  \end{align}
  We can therefore reformulate the right
  side $\mat{SG}$
  of the observational consistency
  equation as
  \begin{align}
      \begin{bmatrix}
      \vec{s}_1 & \mat{0} & \cdots & \mat{0} \\
      \mat{0} & \vec{s}_2 & \cdots & \mat{0} \\
      \vdots & \vdots & \ddots & \vdots \\
      \mat{0} & \mat{0} & \cdots & \vec{s}_b
    \end{bmatrix}
    \begin{bmatrix}
      1 & g_{12} & \cdots & g_{1b} \\
      0 & 1 & \cdots & g_{2b} \\
      \vdots & \vdots & \ddots & \vdots \\
      0 & 0 & \cdots & 1
    \end{bmatrix}\\
    =\begin{bmatrix}
      \vec{s}_1 & g_{12}\vec{s}_1 & \cdots & g_{1b}\vec{s}_1 \\
      \mat{0} & \vec{s}_2 & \cdots & g_{2b}\vec{s}_2 \\
      \vdots & \vdots & \ddots & \vdots \\
      \mat{0} & \mat{0} & \cdots & \vec{s}_b
    \end{bmatrix}.
  \end{align}
  Consequently, for any $Y_i\in\set{Y}$,
  it holds $\vec{s}_i = \mat{F}_{ii}\vec{t}_i$.
\end{proof}

\subsection{Theorem~\ref{theo:concretization}}\label{proof:concretization}
\paragraph{\Cref{theo:concretization} (Block Abstraction)}
  Let $\scm{H}=(\set{Y}, \set{U}, \mat{M}, \dist{P}_{\set{U}})$
  and $\scm{L}=(\set{X}, \set{E}, \mat{W}, \dist{P}_{\set{E}})$
  be two linear SCMs with graphs $\mathcal{G}_{\scm{H}}$ and $\mathcal{G}_{\scm{L}}$ respectively.
  Then $\scm{H}$ is a linear $\mat{T}$-abstraction of $\scm{L}$
  if and only if
  for any valid topological ordering $\prec_{\scm{H}}$ of $\mathcal{G}_{\scm{H}}$
  there exists a valid ordering $\prec_{\scm{L}}$ of $\mathcal{G}_{\scm{L}}$
  such that,
  for any $Y_i,Y_j\in\set{Y}$ it holds
  \begin{align}\label{eq:weightconsistency}
    Y_i \prec_{\scm{H}} Y_j &\iff \Pi(Y_i) \prec_{\scm{L}} \Pi(Y_j), \ \mathrm{and}\\
    \mat{W}_{ij}\vec{s}_j &= m_{ij} \vec{t}_i,
  \end{align}
  where $\mat{W}_{ij}$ is the block of $\mat{W}$ containing the weights of the edges from the variables in $\Pi(Y_i)$ to the variables in $\Pi(Y_j)$, and $m_{ij}$ is the $i$-th element on the $j$-th column of $\mat{M}$.
\begin{proof}
Firstly, we introduce
the following decomposition
of the reduced forms
of the concrete and the abstract model,
which we separately prove in \Cref{proof:decomposition}.
\begin{align}
\mat{F}_{ij} &= \begin{cases}
  {(\mat{I} - \mat{W}_{ii})}^\inv & \text{if } i=j\\
  \mat{F}_{ii} (\mat{W}_{ij} + \mat{R}_{ij}) \mat{F}_{jj} & \text{if } i<j\\
  \mat{0} & \text{otherwise},\\
\end{cases}\\
\mat{R}_{ij} &= \sum_{i < k < j} \mat{W}_{ik} \mat{F}_{kk} (\mat{W}_{kj} + \mat{R}_{kj})\\
g_{ij} &= \begin{cases}
  1 & \text{if } i=j\\
  m_{ij} + \rho_{ij} & \text{if } i<j\\
  0 & \text{otherwise},\\
\end{cases}\\
\rho_{ij} &= \sum_{i < k < j} m_{ik} (m_{kj} + \rho_{kj})
\end{align}
\textit{Necessary Condition.}
We show that $\mat{T}$-abstraction
implies both conditions.
For the existence of a valid concrete ordering,
we invite the reader to consult the proof
of \Cref{theorem:absord}.
Therefore, we focus on proving that $\mat{T}$-abstraction
entails $\mat{W}_{ij} \vec{s}_j = m_{ij} \vec{t}_i$
for any $Y_i, Y_j \in \set{Y}$.
Given the observational
consistency condition $\mat{FT}=\mat{SG}$
from the proof of \Cref{lemma:exoabs},
for each $i<j$, it must hold that
\begin{align}
\mat{F}_{ij} \vec{t}_j
&= \vec{s}_{i} g_{ij}\\
\mat{F}_{ii} (\mat{W}_{ij} + \mat{R}_{ij}) \mat{F}_{jj} \vec{t}_j
&= \mat{F}_{ii} \vec{t}_i (m_{ij} + \rho_{ij})\\
(\mat{W}_{ij} + \mat{R}_{ij}) \vec{s}_j
&= \vec{t}_i (m_{ij} + \rho_{ij})\\
\mat{W}_{ij} \vec{s}_j
&= m_{ij} \vec{t}_i,
\end{align}
where the first step comes from
the previously introduced decomposition,
proved in \Cref{proof:decomposition}.
To prove the last step
we firstly notice that
\begin{align}
\mat{R}_{ij} \vec{s}_j = \rho_{ij}\vec{t}_i 
\iff
\mat{W}_{ij} \vec{s}_j = m_{ij} \vec{t}_i.
\end{align}
We then prove the statement for each row
by induction on the columns.
We take $j=i+1$ as base case,
where it holds
\begin{align}
    \mat{R}_{ij}\vec{s}_j &= \rho_{ij} \vec{t}_{i}\\
    \mat{0}\vec{s}_j &= 0 \cdot \vec{t}_{i}\\
    \vec{0} &= \vec{0}\\
    \implies
    \mat{W}_{ij} \vec{s}_j &= m_{ij} \vec{t}_i.
\end{align}
Consequently,
we can show that
\begin{align}
    &\mat{R}_{ij} \vec{s}_j =
    \sum_{i < k < j}
    \mat{W}_{ik} \mat{F}_{kk} (\mat{W}_{kj} + \mat{R}_{kj})
    \vec{s}_j\\
    &=\sum_{i < k < j}
    \mat{W}_{ik} \mat{F}_{kk} \mat{W}_{kj}
    \vec{s}_j +
    \mat{W}_{ik} \mat{F}_{kk} \mat{R}_{kj}
    \vec{s}_j\\
    &=\sum_{i < k < j}
    \mat{W}_{ik} \mat{F}_{kk} \mat{W}_{kj}
    \vec{s}_j +
    \mat{W}_{ik} \mat{F}_{kk} \rho_{kj}
    \vec{t}_k\\
    &=\sum_{i < k < j}
    \mat{W}_{ik} \mat{F}_{kk} m_{kj}
    \vec{t}_k +
    \mat{W}_{ik} \mat{F}_{kk} \rho_{kj}
    \vec{t}_k\\
    &=\sum_{i < k < j}
    \mat{W}_{ik} \mat{F}_{kk}
    \vec{t}_k
    m_{kj} +
    \mat{W}_{ik} \mat{F}_{kk}
    \vec{t}_k
    \rho_{kj}\\
    &=\sum_{i < k < j}
    m_{ik}\vec{t}_i m_{kj} +
    m_{ik}\vec{t}_i \rho_{kj}\\
    &=\sum_{i < k < j}
    m_{ik} (m_{kj} + \rho_{kj}) \vec{t}_i\\
    &= \rho_{ij} \vec{t}_i.
\end{align}
\textit{Sufficient Condition.}
We now show that the conditions imply
interventional consistency of the abstraction.
That is, we want to prove that
\begin{align}
    \tau_Y \circ \scm{L}^\iota_{\Pi(Y)}
    &= \scm{H}^{\omega(\iota)}_Y \circ \gamma,
\end{align}
for any concrete intervention $\iota$
on the relevant sets
defined by the linear abstraction transformation $\mat{T}$.
Firstly, we notice that the equation
is immediately true for any abstract variable $Y\in\set{Y}$
whenever the intervention targets its relevant set.
Therefore,
we focus on the case
where the abstract intervention $\omega(\iota)$
does not affect $Y$.
Consequently,
given that we assume that the
topological ordering of the blocks
coincides with that of the abstract variables,
we can decompose the concrete model as
\begin{align}
    \scm{L}^\iota_{\Pi(Y_j)}(\vec{e})
    &=
    \sum_{Y_i\in\pa{Y_j}}
    \left(
    {\left[
    \scm{L}^\iota_{\Pi(Y_i)}(\vec{e})
    \right]}^\tr
    \mat{W}_{ij} + \vec{e}^\tr_{\Pi(Y_j)}
    \right) \mat{F}_{jj},
\end{align}
where we
(i.) compute the linear contribution of the parents,
(ii.) sum the exogenous noise of the block,
and (iii.) apply the submodel composed of the internal connections in the block.
Similarly, we can decompose the abstract model as
\begin{align}
    \scm{H}_{Y_j}^{\omega(\iota)}(\vec{u})
    &=
    \sum_{Y_i\in\pa{Y_j}}
    \scm{H}_{Y_i}^{\omega(\iota)}(\vec{u})
    \cdot
    m_{ij}
    + u_j.
\end{align}
Abstraction holds whenever
interventional consistency is satisfied
by at least an exogenous transformation $\gamma$.
To continue the proof, we then define it as the linear transformation
from \Cref{lemma:exoabs}, where $\vec{s}_j = \mat{F}_{jj}\vec{t}_j$ for any $Y_j\in\set{Y}$.
Therefore,
we can reformulate interventional consistency as
\begin{align}
\begin{split}
    \left(
    \sum_{Y_i\in\pa{Y_j}}
    {\left[
    \scm{L}^\iota_{\Pi(Y_i)}(\vec{e})
    \right]}^\tr
    \mat{W}_{ij} + \vec{e}^\tr_{\Pi(Y_j)}
    \right) \mat{F}_{jj} \vec{t}_j
    \\= 
    \sum_{Y_i\in\pa{Y_j}}
    \scm{H}_{Y_i}^{\omega(\iota)}(\mat{S}^\tr \vec{e})
    \cdot
    m_{ij}
    + \vec{e}_{\Pi(Y_j)}^\tr \vec{s}_j,
\end{split}
\end{align}
which further simplifies to
\begin{align}
\begin{split}
    &\sum_{Y_i\in\pa{Y_j}}
    {\left[
    \scm{L}^\iota_{\Pi(Y_i)}(\vec{e})
    \right]}^\tr
    \mat{W}_{ij} \mat{F}_{jj} \vec{t}_j
    \\= 
    &\sum_{Y_i\in\pa{Y_j}}
    \scm{H}_{Y_i}^{\omega(\iota)}(\mat{S}^\tr \vec{e})
    \cdot
    m_{ij}
\end{split}
\end{align}
given our choice of the exogenous transformation $\mat{S}$.
We prove this last equation by induction
on the topological ordering
of the abstract graph.
In fact, as a base case,
for any root of the graph
the equation holds
given that the parent set is the empty set.
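For the inductive step,
we assume that interventional consistency holds
for every parent $Y_i\in\pa{Y_j}$, i.e.,
$\scm{H}_{Y_i}^{\omega(\iota)}(\mat{S}^\tr \vec{e})
= {\left[\scm{L}^\iota_{\Pi(Y_i)}(\vec{e})\right]}^\tr \vec{t}_i$,
which justifies the first equality below.
Consequently,
we can finally show
that 
$\mat{W}_{ij}\vec{s}_j = m_{ij} \vec{t}_i$
implies abstraction
as follows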
\begin{align}
    &\sum_{Y_i\in\pa{Y_j}}
    \scm{H}_{Y_i}^{\omega(\iota)}(\mat{S}^\tr \vec{e})
    \cdot
    m_{ij}\\
    =
    &\sum_{Y_i\in\pa{Y_j}}
    {\left[
    \scm{L}^\iota_{\Pi(Y_i)}(\vec{e})
    \right]}^\tr \vec{t}_i
    \cdot
    m_{ij}\\
    =
    &\sum_{Y_i\in\pa{Y_j}}
    {\left[
    \scm{L}^\iota_{\Pi(Y_i)}(\vec{e})
    \right]}^\tr
    \mat{W}_{ij}
    \vec{s}_{j}\\
    =
    &\sum_{Y_i\in\pa{Y_j}}
    {\left[
    \scm{L}^\iota_{\Pi(Y_i)}(\vec{e})
    \right]}^\tr
    \mat{W}_{ij}
    \mat{F}_{jj}
    \vec{t}_{j}.
\end{align}
\end{proof}

\subsection{Model Reduction Decomposition}\label{proof:decomposition}
In the following,
we prove the decomposition
of the model reduction matrix~$\mat{F}$
from the proof in \Cref{proof:concretization}.
To simplify the notation, we define the matrix $\mat{A}=(\mat{I}-\mat{W})$.

\begin{proof}
Back-substituting
to solve $\mat{AF}=\mat{I}$
leads to
\begin{align}
  {\mat{F}}_{ij} = \begin{cases}
    \mat{A}_{ii}^\inv & i =j\\
    - \sum_{i<k\leq j} \mat{F}_{ii} \mat{A}_{ik} {\mat{F}}_{kj} & i <j\\
    0 & i > j
  \end{cases}.
\end{align}
Therefore, we want to prove that whenever $i<j$,
it holds
\begin{align}
  - \sum_{i<k\leq j} \mat{F}_{ii} \mat{A}_{ik} {\mat{F}}_{kj}
  =
  \mat{F}_{ii}(\mat{W}_{ij} + \mat{R}_{ij})\mat{F}_{jj},
\end{align}
where
\begin{align}
  \mat{R}_{ij} =
  \sum_{i < k < j} \mat{W}_{ik} \mat{F}_{kk} (\mat{W}_{kj} + \mat{R}_{kj}).
\end{align}

Overall,
we simplify the thesis
as follows
\begin{align}
  \mat{F}_{ii}(\mat{W}_{ij} + \mat{R}_{ij})\mat{F}_{jj}
  &=
  - \sum_{i<k\leq j} \mat{F}_{ii} \mat{A}_{ik} {\mat{F}}_{kj}
  \\
  \mat{F}_{ii}(\mat{W}_{ij} + \mat{R}_{ij})\mat{F}_{jj}
  &=
  \sum_{i<k\leq j} \mat{F}_{ii} \mat{W}_{ik} {\mat{F}}_{kj}
  \\
  \mat{F}_{ii}\mat{R}_{ij}\mat{F}_{jj}
  &=
  \sum_{i<k<j} \mat{F}_{ii} \mat{W}_{ik} {\mat{F}}_{kj}
  \\
  \mat{R}_{ij}\mat{F}_{jj}
  &=
  \sum_{i<k<j} \mat{W}_{ik} {\mat{F}}_{kj}.
\end{align}

We finally prove our thesis
by induction
on the decreasing row component~$i$,
starting
from $i=j-1$.
In the base case,
both sides of the equation
reduce to zero
and thus the statement holds.
We then prove the inductive case
by showing that if the statement
holds for every $k$ such that $i<k<j$, then it also
holds for $i$.
Formally,
\begin{align}
  &\sum_{i<k<j} \mat{W}_{ik} {\mat{F}}_{kj}\\
  &=
  \sum_{i<k<j} \mat{W}_{ik} \mat{F}_{kk} (\mat{W}_{kj} + \mat{R}_{kj}) \mat{F}_{jj}\\
  &=\mat{R}_{ij} \mat{F}_{jj}.
\end{align}
\end{proof}



