

\section{Appendix}
\subsection{Proofs of Theorems~\ref{thm:feasible},~\ref{thm:quad} and~\ref{thm:id}}\label{sec:proofs}


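$\mathbf{\Sigma_Z}$, the covariance matrix of $Z$, is positive semi-definite by construction; we assume it is positive definite (no component of $Z$ is an exact linear combination of the others) and hence invertible. From Eq.~\ref{eq:zy_constraint}, it follows: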

\begin{equation}\label{eq:gamma_alpha}
   {\gamma= \Sigma_{Z}^{-1} \left(\Sigma_{Zy} - \alpha\Sigma_{Zx}\right)}
\end{equation} 
Substituting this result into Eq.~\ref{eq:tau_constraint} gives:
\begin{equation}\label{eq:tau_constraint_2}
        \alpha^2\left( \Sigma_{xZ}\Sigma_{Z}^{-2} \Sigma_{Zx}\right) - 2\alpha \left(\Sigma_{xZ}\Sigma_{Z}^{-2} \Sigma_{Zy} \right)+ \Sigma_{yZ}\Sigma_{Z}^{-2} \Sigma_{Zy}  \leq \tau
\end{equation} 
and replacing $\gamma$ from Eq.~\ref{eq:gamma_alpha} in Eq.~\ref{eq:xy_constraint}:
\begin{equation}\label{eq:xy_constraint_2}
    \alpha \left(
    \Sigma_{xZ}\Sigma_{Z}^{-1}\Sigma_{Zx} -  \sigma^2_{x}
    \right)-\left(
    \Sigma_{xZ}\Sigma_{Z}^{-1}\Sigma_{Zy}-\sigma_{xy} + \rho \eta_x\eta_y
    \right)=0
\end{equation}
and now replacing $\gamma$ in Eq.~\ref{eq:yvar_constraint}:
%     &&\alpha^2\left(
%     \widehat{\Sigma}_{xx}-  \Sigma_{xZ}\Sigma_{Z}^{-1}\Sigma_{Zx}\right) +
%     \alpha\left(
%     \Sigma_{xZ}\Sigma_{Z}^{-1}\Sigma_{Zx} -
%     \Sigma_{yZ}\Sigma_{Z}^{-1}\Sigma_{Zx} +
%     2\eta_x\eta_y\rho \right)+
%     \left(C^2_y + \Sigma_{yZ}\Sigma_{Z}^{-1}\Sigma_{Zy}- \widehat{\Sigma}_{yy}
% \right)=0\nonumber\\
\begin{align}\label{eq:yvar_constraint_2}
&\alpha^2\left(
    \sigma^2_{x}-  \Sigma_{xZ}\Sigma_{Z}^{-1}\Sigma_{Zx}\right) +2
    \alpha
    \eta_x\eta_y\rho \nonumber\\
    &\qquad \qquad +
    \left(\eta_y^2 + \Sigma_{yZ}\Sigma_{Z}^{-1}\Sigma_{Zy}- \sigma_{y}^2
\right)=0
\end{align}
Defining $a,b,c,d,e$ and $f$ as:

\begin{align*}
        a &:= \mathbf{\Sigma}_{\mathbf{xZ}}\mathbf{\Sigma}_{\mathbf{Z}}^{-2}\mathbf{\Sigma}_{\mathbf{Zx}} \quad &d := 
        \mathbf{\Sigma}_{\mathbf{xZ}}\mathbf{\Sigma}_{\mathbf{Z}}^{-1}\mathbf{\Sigma}_{\mathbf{Zx}}
         \\
        b &:= \mathbf{\Sigma}_{\mathbf{xZ}}\mathbf{\Sigma}_{\mathbf{Z}}^{-2}\mathbf{\Sigma}_{\mathbf{Zy}} \quad &e := \mathbf{\Sigma}_{\mathbf{xZ}}\mathbf{\Sigma}_{\mathbf{Z}}^{-1}\mathbf{\Sigma}_{\mathbf{Zy}} \\
        c &:= \mathbf{\Sigma}_{\mathbf{yZ}}\mathbf{\Sigma}_{\mathbf{Z}}^{-2}\mathbf{\Sigma}_{\mathbf{Zy}} \quad &f := \mathbf{\Sigma}_{\mathbf{yZ}}\mathbf{\Sigma}_{\mathbf{Z}}^{-1}\mathbf{\Sigma}_{\mathbf{Zy}}
    \end{align*}

\subsubsection{Proof of Lemma~\ref{lem:lemma1}}$\, \mathbf{\Sigma_Z}$ is a covariance matrix, so it and its inverse are both positive definite. Therefore the quadratic forms $a,c,d$ and $f$ are non-negative, whereas the cross terms $b$ and $e$ may take either sign.
Additionally, $Z$ is a set of instruments for $x$, therefore $\Sigma_{xZ} \neq 0$. Consequently, $a>0$ and $d>0$, while $c \geq 0$ and $f \geq 0$.
\\From $X = \bm{Z}\bm{\beta} + \epsilon_x \eta_x $, it follows  $\beta=\Sigma_Z^{-1}\Sigma_{Zx}$. Additionally, 
\begin{eqnarray*}\label{eq:xvar_constraint}
\sigma_x^2&=&\beta^T\Sigma_Z\beta + \eta_x^2 
\end{eqnarray*}
and replacing $\beta$:
\begin{eqnarray}
  \sigma_x^2=\mathbf{\Sigma}_{\mathbf{xZ}}\mathbf{\Sigma}_{\mathbf{Z}}^{-1}\mathbf{\Sigma}_{\mathbf{Zx}}+\eta_x^2=d + \eta_x^2\nonumber
\end{eqnarray}
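Hence, $d=\sigma_x^2-\eta_x^2 > 0$, and $d-\sigma_x^2=-\eta_x^2 < 0$. Similarly, since $\Sigma_{Zy}=\Sigma_Z(\gamma+\alpha\beta)$ by Eq.~\ref{eq:gamma_alpha}, it can be shown that $f=(\gamma+\alpha\beta)^T\mathbf{\Sigma}_{\mathbf{Z}}(\gamma+\alpha\beta) \geq 0$.
\hfill$\square$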

Defining $a,b,c,d,e$ and $f$ as above, we can summarise Eqs.~\ref{eq:tau_constraint_2}, \ref{eq:xy_constraint_2} and~\ref{eq:yvar_constraint_2} as: 
 \begin{eqnarray}
    && a \alpha^2 -2\alpha b +c\leq \tau    \label{eq:quadratic1}\\
    &&(\sigma_x^2-d)\alpha +\rho\eta_x\eta_y +
    e -\sigma_{xy}
    =0\label{eq:quadratic2}\\
    && 
    (\sigma_x^2-d)\alpha^2 + 2\alpha\rho \eta_x\eta_y  +(\eta_y^2 +f-\sigma_y^2)=0\label{eq:quadratic3} 
    \end{eqnarray}
 
%  For unnormalised data: 
%  \begin{eqnarray}
%     && A \alpha^2 -2\alpha B +D\leq \tau    \label{eq:quadratic_un1}\\
%     &&(\sigma^2_{x}- F)\alpha +
%     E -{\sigma}_{xy}+\rho \eta_x\eta_y
%      =0 \label{eq:quadratic_un22}\\
%     && 
%     (\sigma^2_{x}-F)\alpha^2 +\alpha (2\rho \eta_x\eta_y)  +(C^2_y +G-\sigma^2_{y})=0\label{eq:quadratic_un3} 
%     \end{eqnarray}
\subsubsection{Proof of Theorem~\ref{thm:feasible}}
Eq.~\ref{eq:quadratic1} gives us the \emph{feasible area} of \(\alpha\) as a function of \(\tau\):
\begin{eqnarray*}
  %&& A \alpha^2 -2\alpha B +D\leq \tau 
  %&& a \alpha^2 -2\alpha b +c\leq \tau   \quad \rightarrow \quad 
  0 \leq \left(\alpha-\frac{b}{a}\right)^2\leq\frac{a(\tau-c)+b^2}{a^2} \end{eqnarray*}
and $a > 0$, therefore, 
\begin{eqnarray}\label{eq:feasible_alpha_tau1}
   \tau &\geq& c-\frac{b^2}{a} 
   \end{eqnarray}
\begin{equation}
  \frac{b}{a}-\sqrt{\frac{a(\tau-c)+b^2}{a^2}} 
  \leq \alpha \leq
  \frac{b}{a}+\sqrt{\frac{a(\tau-c)+b^2}{a^2}} 
\end{equation}
\hfill$\square$

\subsubsection{Proof of Theorem~\ref{thm:quad}} Eq.~\ref{eq:quadratic2} formalises the functional form of the relationship between \(\alpha\), \(\rho\) and $\eta_y$, a hyperbola (see Fig.~\ref{fig:const_2}). 
\begin{figure}
  \centering
 \includegraphics[width=\linewidth]{figures/2nd_constraint.png}
  \caption{$\alpha$ as a function of $\rho$ and $\eta_y$. See Eq.~\ref{eq:quadratic2}.}
  \label{fig:const_2}
\end{figure}
Rearranging Eq.~\ref{eq:quadratic2}: 
\begin{eqnarray}\label{eq:eta_y_alpha}
  \eta_y=\frac{1}{\eta_x\rho}\left[(d-\sigma_x^2)\alpha-(e-{\sigma}_{xy})\right]
\end{eqnarray}
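Since $\eta_x, \eta_y>0$ and $d-\sigma_x^2<0$ (see Lemma~\ref{lem:lemma1}), the sign of $\rho$ determines on which side of $\frac{e-\sigma_{xy}}{d-\sigma_x^2}$ the solution $\alpha$ lies; therefore,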
\begin{equation}\label{eq:eta_y_constraint}
\Bigg\{\begin{matrix}
\alpha < \frac{e-{\sigma}_{xy}}{d-\sigma_x^2}&\quad & \rho >0\\
\\
\alpha > \frac{e-{\sigma}_{xy}}{d-\sigma_x^2}& \quad & \rho <0
\end{matrix}    
\end{equation}


Replacing \(\eta_y\) from Eq.~\ref{eq:eta_y_alpha} in Eq.~\ref{eq:quadratic3}: 
\begin{eqnarray}\label{eq:quadratic_alpha_1}
  &&\alpha^2 \left[(d-\sigma_x^2)(1+ \frac{d-\sigma_x^2}{\eta_x^2\rho^2})
  \right] 
   -2\alpha (e-\sigma_{xy})(1+\frac{d-\sigma_x^2}{\eta_x^2\rho^2})\nonumber\\
   &&\qquad
   + \left[ \frac{(e-\sigma_{xy})^2}{\eta_x^2\rho^2} +f-\sigma_y^2\right]=0\quad\\
   &&\nonumber
\end{eqnarray}
Defining: 
\begin{eqnarray*}
        g &:= (d - \sigma^2_{\mathbf{x}})(1 + \frac{d - \sigma^2_{\mathbf{x}}}{\eta^2_x\rho^2}) \\
        h &:= -(e - \sigma_{\mathbf{xy}})(1 + \frac{d - \sigma^2_{\mathbf{x}}}{\eta^2_x\rho^2}) \\
        i &:= \frac{(e - \sigma_{\mathbf{xy}})^2}{\eta^2_x\rho^2} + f - \sigma^2_{\mathbf{y}}
\end{eqnarray*}
\\Eq.~\ref{eq:quadratic_alpha_1} can be rewritten as a general quadratic equation \(g\alpha^2 +2h\alpha+ i=0\), and given 
\begin{equation}\label{eq:delta_pos}
    h^2 - gi \geq 0
\end{equation}
the real solutions $(\alpha \in \mathbb{R})$ can be expressed as $\alpha = \frac{-h \pm \sqrt{h^2 - gi}}{g}$. Denoting:
\begin{equation*}
    \delta(\rho):=\frac{\sqrt{\left[(e-\sigma_{xy})^2-(d-\sigma^2_x)(f-\sigma^2_y)\right](1+\frac{d-\sigma^2_x}{ \eta^2_x\rho^2}) }}{(d-\sigma^2_x)(1+\frac{d-\sigma^2_x}{ \eta^2_x \rho^2})},
\end{equation*}
$\alpha$ can be written as: 
% \begin{eqnarray}\label{eq:closed_form_alpha1}
%   \label{eq:alpha_final}
%   \alpha= \tfrac{(e-\sigma_{xy})(1+\frac{d-\sigma^2_x}{ \eta^2_x \rho^2})\pm \sqrt{\left[(e-\sigma_{xy})^2-(d-\sigma^2_x)(f-\sigma^2_y)\right](1+\frac{d-\sigma^2_x}{ \eta^2_x\rho^2}) }}{(d-\sigma^2_x)(1+\frac{d-\sigma^2_x}{ \eta^2_x \rho^2})}
% \end{eqnarray}  
% and, 
\begin{align}\label{eq:alpha_delta_2sln}
&\alpha=\frac{(e-\sigma_{xy})} {(d-\sigma^2_x)}
        \quad 
        \pm \delta(\rho)
        % \frac{\sqrt{\left[(e-\sigma_{xy})^2-(d-\sigma^2_x)(f-\sigma^2_y)\right](1+\frac{d-\sigma^2_x}{ \eta^2_x\rho^2}) }}{(d-\sigma^2_x)(1+\frac{d-\sigma^2_x}{ \eta^2_x \rho^2})}
\end{align}

With this we have identified (at most) two possible point estimates for $\alpha$ for a given $\rho$. Fig.~\ref{fig:alpha_rho_2solutions} depicts the possible solutions for $\alpha$ in the range $|\rho| \leq 1$.
\begin{figure}
  \centering
 \includegraphics[width=\linewidth]{figures/rho_alpha.png}
  \caption{$\alpha$ as a function of $\rho$ and $\eta_y$. See Eq.~\ref{eq:alpha_delta_2sln}.}
  \label{fig:alpha_rho_2solutions}
\end{figure}
From Lemma~\ref{lem:lemma1}, we know that $d-\sigma_x^2=-\eta_x^2 < 0$, so that $1+\frac{d-\sigma^2_x}{ \eta^2_x \rho^2} = 1-\frac{1}{\rho^2} <0$ for $0<|\rho|<1$.
Hence both factors in the denominator of $\delta(\rho)$ are negative, and consequently $\delta(\rho) >0$ for all such values of $\rho$ and all samples from SCMs consistent with Eqs.~\ref{eq:scmx}, \ref{eq:scmy} and~\ref{eq:scmSigma}. 

With $\delta(\rho) >0$ for all $0<|\rho|<1$, and given the constraints in Eq.~\ref{eq:eta_y_constraint}:
 
        \begin{align}\label{eq:alpha_closedform_2}
        \alpha(\rho)=\Bigg\{\begin{matrix} \frac{e-\sigma_{xy}} {d-\sigma^2_x} - \delta(\rho) & \quad & \rho>0 \\
        \\
       \frac{e-\sigma_{xy}} {d-\sigma^2_x} + \delta(\rho) & \quad & \rho<0
        \end{matrix}
    \end{align}
Intuitively, with constraints on feasible values for $\eta_y$, $\eta_y>0$, summarised by Eq.~\ref{eq:eta_y_constraint}, we have eliminated one of the two possible solutions for $\alpha(\rho)$. This leaves us with $\alpha=\alpha(\rho)$ as a deterministic bijective function of $\rho$.
\hfill$\square$

\subsubsection{Proof of Theorem \ref{thm:id}}
\begin{itemize}[wide=0.5em, leftmargin =*, nosep, before = \leavevmode]
    \item[(i)] Follows from the proof of Theorem~\ref{thm:feasible}, Eq.~\ref{eq:feasible_alpha_tau1}.
    
    \item[(ii)] Follows from the proof of Theorem~\ref{thm:quad} and the condition for the existence of a real solution of a quadratic equation, $\alpha \in \mathbb{R}$, Eq.~\ref{eq:delta_pos}. 
    
    \item[(iii)] It naturally follows that a solution for $\alpha$ proposed by Theorem~\ref{thm:quad} is only valid if it lies within the feasible area defined by Theorem~\ref{thm:feasible}. In other words, Theorem~\ref{thm:quad} identifies all possible values of $\alpha$, the average causal effect of $x$ on $y$, that are consistent with the observed data (and their covariance matrices). Those structures which require a higher influence of $Z$ on $y$, larger than allowed by $\tau$, are invalid.
\end{itemize}
\hfill$\square$

\subsection{comparing $\sigma^2_x$ and $d := 
        \mathbf{\Sigma}_{\mathbf{xZ}}\mathbf{\Sigma}_{\mathbf{Z}}^{-1}\mathbf{\Sigma}_{\mathbf{Zx}} $}

Let us start with a simple scenario, $d_z=2$.
\begin{eqnarray*}
 d &:=& 
        \mathbf{\Sigma}_{\mathbf{xZ}}\mathbf{\Sigma}_{\mathbf{Z}}^{-1}\mathbf{\Sigma}_{\mathbf{Zx}} \\
        &=& \begin{bmatrix}\sigma_{xz_1} & \sigma_{xz_2}\end{bmatrix}
        \begin{bmatrix}
        \sigma_{z_1}^2 & \sigma_{z_1z_2}\\
        \sigma_{z_1z_2} & \sigma_{z_2}^2
        \end{bmatrix}^{-1}
        \begin{bmatrix}\sigma_{xz_1}\\\sigma_{xz_2}\end{bmatrix}\\
        &=& \frac{\sigma_{xz_1}^2 \sigma_{z_2}^2 
            +\sigma_{xz_2}^2 \sigma_{z_1}^2  
            -2\sigma_{xz_1}\sigma_{xz_2} \sigma_{z_1z_2}}
            {\sigma_{z_1}^2\sigma_{z_2}^2-\sigma_{z_1z_2}^2}
\end{eqnarray*}
% NOTE(review): for a valid joint covariance of (x, Z) the Schur complement
% sigma_x^2 - d is non-negative, so the conditions below can hold at most with
% equality; confirm the intended claim against Lemma 1.
\begin{itemize}
    \item [(i)] Assume $\sigma_{xz_1} = \sigma_{xz_2}=\sigma_{xz}$. 
    \begin{align*}
        d=\frac{\sigma_{xz}^2 \sigma_{z_2}^2 
            +\sigma_{xz}^2 \sigma_{z_1}^2  
            -2\sigma_{xz}^2\sigma_{z_1z_2}}
            {\sigma_{z_1}^2\sigma_{z_2}^2-\sigma_{z_1z_2}^2}
        =\frac{\sigma_{xz}^2 \sigma_{(z_1 - z_2)}^2}
            {\sigma_{z_1}^2\sigma_{z_2}^2-\sigma_{z_1z_2}^2}
    \end{align*}
    Hence, if, for example, $\sigma_{xz}=0.5$ and $\sigma_{x}^2= 1$, then $d-\sigma_x^2 \geq 0$ requires $\sigma_{(z_1 - z_2)}^2 \geq 4\left(\sigma_{z_1}^2\sigma_{z_2}^2-\sigma_{z_1z_2}^2\right)$, where $\sigma_{(z_1 - z_2)}^2 = \left[\frac{\sum^m_i (z^i_1 - z^i_2)^2}{m-1}- \left(\mu_{z_1}- \mu_{z_2}\right)^2\right]$.
   
    \item [(ii)] Assume $\sigma_{xz_1} = -\sigma_{xz_2}=\sigma_{xz}$, so that $d=\frac{\sigma_{xz}^2 \sigma_{(z_1 + z_2)}^2}{\sigma_{z_1}^2\sigma_{z_2}^2-\sigma_{z_1z_2}^2}$.
    For a similar setting, i.e. $\sigma_{xz}=0.5$ and $\sigma_{x}^2= 1$, $d-\sigma_x^2 \geq 0$ requires $\sigma_{(z_1 + z_2)}^2 \geq 4\left(\sigma_{z_1}^2\sigma_{z_2}^2-\sigma_{z_1z_2}^2\right)$.
    
    \item [(iii)] Assume $\sigma_{z_1z_2} =0$
    %, and $\frac{\sigma_{xz_1}^2}{\sigma_{xz_2}^2}=\frac{\sigma_{z_1}^2}{\sigma_{z_2}^2}=C.$
    ; then $d=\frac{\sigma_{xz_1}^2}{\sigma_{z_1}^2} + \frac{\sigma_{xz_2}^2}{\sigma_{z_2}^2}$, and $d - \sigma_{x}^2 \geq 0$ whenever $\frac{\sigma_{xz_1}^2}{\sigma_{z_1}^2} + \frac{\sigma_{xz_2}^2}{\sigma_{z_2}^2} \geq \sigma_{x}^2$.
\end{itemize}
With $d_z \geq 3$, it becomes more complicated to identify the setting where $d-\sigma_{x}^2 \geq 0$, but as shown here for $d_z=2$, such settings are possible. 