
\subsection{Special Cases}
\label{appD1}

We provide three additional experiments under the following special cases: (1) no effect between ${M}$ and ${N}$, (2) no effect between $\{{M},{N}\}$ and $Y$, and (3) an effect only through $X \rightarrow {M} \rightarrow {N} \rightarrow Y$.

{\bf (1). No effect between ${M}$ and ${N}$.}
We consider the situation where there is no effect between ${M}$ and ${N}$.


{\bf Setting.}
We consider the following linear SCM:
\begin{equation}
\begin{gathered}
Y:=X+{M}+ {N}+ C+U^Y,\\
%{N}:=X+ {M}+ C+U^{{N}},\\
{N}:=X+ C+U^{{N}},\\
{M}:=X+C+U^{{M}}, \quad X:=C+U^X, \quad C:=U^C,
\end{gathered}
\end{equation}
where $U^C\sim {\cal N}(0,1)$, $U^X\sim {\cal N}(0,1)$, $U^Y\sim {\cal N}(0,1)$, $U^{{M}} \sim {\cal N}(0,1)$, and $U^{{N}} \sim {\cal N}(0,1)$ are mutually independent standard normal random variables.
This SCM satisfies Assumptions \ref{SCAS}, \ref{ASM}, \ref{SUP1}, \ref{AS1}, and \ref{AS1}'.
We let $x'=0$, $x=1$, $y=0$, $c=0$, and ${\cal E}=\emptyset$.
We simulate 1000 times with the sample size $N=20$, $N=100$, and $N=10000$.



{\bf Results.}
The ground truth of $\text{\normalfont T-PNS}$ is $0.458$.
The ground truth of $\text{\normalfont PNS}^{X \rightarrow Y}$ is $0.082$ and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.083$ (95\%CI: $[0.003,0.213]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.081$ (95\%CI: $[0.044,0.127]$),\\\vspace{0.1cm}
\textbf{$N=10000$}: $0.082$ (95\%CI: $[0.078,0.086]$).
\end{center}
The ground truth of $\text{\normalfont PNS}^{X \rightarrow {N}  \rightarrow Y}$ is $0.158$ and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.158$ (95\%CI: $[0.030,0.350]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.158$ (95\%CI: $[0.102,0.221]$),\\\vspace{0.1cm}
\textbf{$N=10000$}: $0.158$ (95\%CI: $[0.151,0.164]$).
\end{center}
The ground truth of $\text{\normalfont PNS}^{X \rightarrow {M} \rightarrow {N}  \rightarrow Y}$ is $0.000$ and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.018$ (95\%CI: $[0.000,0.090]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.008$ (95\%CI: $[0.000,0.038]$),\\\vspace{0.1cm}
\textbf{$N=10000$}: $0.001$ (95\%CI: $[0.000,0.004]$).
\end{center}
The ground truth of $\text{\normalfont PNS}^{X \rightarrow {M}  \rightarrow Y}$ is $0.218$ and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.199$ (95\%CI: $[0.057,0.353]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.211$ (95\%CI: $[0.154,0.265]$),\\\vspace{0.1cm}
\textbf{$N=10000$}: $0.217$ (95\%CI: $[0.212,0.223]$).
\end{center}
All means of the estimators are close to the ground truth. 
However, estimators for small sample sizes have wide 95\% CIs.




{\bf (2). No effect between $\{{M},{N}\}$ and $Y$.}
We consider the situation where there is no effect between $\{{M},{N}\}$ and $Y$.


{\bf Setting.}
We consider the following linear SCM:
\begin{equation}
\begin{gathered}
Y:=X+ C+U^Y,\\
{N}:=X+ {M}+ C+U^{{N}},\\
{M}:=X+C+U^{{M}}, \quad X:=C+U^X, \quad C:=U^C,
\end{gathered}
\end{equation}
where $U^C\sim {\cal N}(0,1)$, $U^X\sim {\cal N}(0,1)$, $U^Y\sim {\cal N}(0,1)$, $U^{{M}} \sim {\cal N}(0,1)$, and $U^{{N}} \sim {\cal N}(0,1)$ are mutually independent standard normal random variables.
This SCM satisfies Assumptions \ref{SCAS}, \ref{ASM}, \ref{SUP1}, \ref{AS1}, and \ref{AS1}'.
We let $x'=0$, $x=1$, $y=0$, $c=0$, and ${\cal E}=\emptyset$.
We simulate 1000 times with the sample size $N=20$, $N=100$, and $N=10000$.



{\bf Results.}
The ground truth of $\text{\normalfont T-PNS}$ is $0.346$.
The ground truth of $\text{\normalfont PNS}^{X \rightarrow Y}$ is $0.346$ and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.282$ (95\%CI: $[0.037,0.481]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.314$ (95\%CI: $[0.207,0.400]$),\\\vspace{0.1cm}
\textbf{$N=10000$}: $0.339$ (95\%CI: $[0.328,0.347]$).
\end{center}
The ground truth of $\text{\normalfont PNS}^{X \rightarrow {N}  \rightarrow Y}$ is $0.000$ and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.027$ (95\%CI: $[0.000,0.185]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.011$ (95\%CI: $[0.000,0.074]$),\\\vspace{0.1cm}
\textbf{$N=10000$}: $0.001$ (95\%CI: $[0.000,0.007]$).
\end{center}
The ground truth of $\text{\normalfont PNS}^{X \rightarrow {M} \rightarrow {N}  \rightarrow Y}$ is $0.000$ and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.011$ (95\%CI: $[0.000,0.103]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.005$ (95\%CI: $[0.000,0.042]$),\\\vspace{0.1cm}
\textbf{$N=10000$}: $0.000$ (95\%CI: $[0.000,0.004]$).
\end{center}
The ground truth of $\text{\normalfont PNS}^{X \rightarrow {M}  \rightarrow Y}$ is $0.000$ and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.025$ (95\%CI: $[0.000,0.168]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.012$ (95\%CI: $[0.000,0.071]$),\\\vspace{0.1cm}
\textbf{$N=10000$}: $0.001$ (95\%CI: $[0.000,0.007]$).
\end{center}
All means of the estimators are close to the ground truth. 
However, estimators for small sample sizes have wide 95\% CIs.




{\bf (3). Only effect through $X \rightarrow {M} \rightarrow {N} \rightarrow Y$.}
We consider the situation where $X$ affects $Y$ only through the path $X \rightarrow {M} \rightarrow {N} \rightarrow Y$.



{\bf Setting.}
We consider the following linear SCM:
\begin{equation}
\begin{gathered}
Y:= {N}+ C+U^Y,\\
{N}:={M}+ C+U^{{N}},\\
{M}:=X+C+U^{{M}}, \quad X:=C+U^X, \quad C:=U^C,
\end{gathered}
\end{equation}
where $U^C\sim {\cal N}(0,1)$, $U^X\sim {\cal N}(0,1)$, $U^Y\sim {\cal N}(0,1)$, $U^{{M}} \sim {\cal N}(0,1)$, and $U^{{N}} \sim {\cal N}(0,1)$ are mutually independent standard normal random variables.
This SCM satisfies Assumptions \ref{SCAS}, \ref{ASM}, \ref{SUP1}, \ref{AS1}, and \ref{AS1}'.
We let $x'=0$, $x=1$, $y=0$, $c=0$, and ${\cal E}=\emptyset$.
We simulate 1000 times with the sample size $N=20$, $N=100$, and $N=10000$.



{\bf Results.}
The ground truth of $\text{\normalfont T-PNS}$ is $0.219$.
The ground truth of $\text{\normalfont PNS}^{X \rightarrow Y}$ is $0.000$ and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.017$ (95\%CI: $[0.000,0.124]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.008$ (95\%CI: $[0.000,0.049]$),\\\vspace{0.1cm}
\textbf{$N=10000$}: $0.001$ (95\%CI: $[0.000,0.004]$).
\end{center}
The ground truth of $\text{\normalfont PNS}^{X \rightarrow {N}  \rightarrow Y}$ is $0.000$ and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.021$ (95\%CI: $[0.000,0.144]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.008$ (95\%CI: $[0.000,0.050]$),\\\vspace{0.1cm}
\textbf{$N=10000$}: $0.001$ (95\%CI: $[0.000,0.005]$).
\end{center}
The ground truth of $\text{\normalfont PNS}^{X \rightarrow {M} \rightarrow {N}  \rightarrow Y}$ is $0.219$ and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.146$ (95\%CI: $[0.000,0.293]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.189$ (95\%CI: $[0.123,0.247]$),\\\vspace{0.1cm}
\textbf{$N=10000$}: $0.215$ (95\%CI: $[0.208,0.222]$).
\end{center}
The ground truth of $\text{\normalfont PNS}^{X \rightarrow {M}  \rightarrow Y}$ is $0.000$ and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.034$ (95\%CI: $[0.000,0.189]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.014$ (95\%CI: $[0.000,0.068]$),\\\vspace{0.1cm}
\textbf{$N=10000$}: $0.001$ (95\%CI: $[0.000,0.007]$).
\end{center}
All means of the estimators are close to the ground truth. 
However, estimators for small sample sizes have wide 95\% CIs.




\subsection{Sensitivity Analysis for Violation of Monotonicity}
\label{appD2}

We conduct a sensitivity analysis to assess the impact of violations of the monotonicity assumption.

{\bf Setting.}
We consider the following SCM:
\begin{equation}
\begin{gathered}
Y:=X+{M}+ {N}+ C+\alpha U^Y +(1-\alpha) (U^Y)^4,\\
{N}:=X+ {M}+ C+U^{{N}},\\
{M}:=X+C+U^{{M}}, \quad X:=C+U^X, \quad C:=U^C,
\end{gathered}
\end{equation}
where $U^C\sim {\cal N}(0,1)$, $U^X\sim {\cal N}(0,1)$, $U^Y\sim {\cal N}(0,1)$, $U^{{M}} \sim {\cal N}(0,1)$, and $U^{{N}} \sim {\cal N}(0,1)$ are mutually independent standard normal random variables.
%This SCM satisfies Assumptions \ref{SCAS}, \ref{ASM}, \ref{SUP1}, \ref{AS1}, and 4.3'.
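This SCM violates the monotonicity assumption whenever $\alpha<1$, because $\alpha U^Y +(1-\alpha) (U^Y)^4$ is then not monotone in $U^Y$.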
We let $x'=0$, $x=1$, $y=0$, $c=0$, and ${\cal E}=\emptyset$.
We simulate 1000 times with the sample size $N=20$, $N=100$, and $N=10000$.
We examine the cases $\alpha = 0.5$ and $\alpha = 0$, which correspond to a moderate violation and a strong violation of monotonicity, respectively.
The case where $\alpha = 1$ corresponds to the setting described in Section 5.


{\bf Results ($\alpha=0.5$; moderate violation).}
The ground truth of $\text{\normalfont T-PNS}$ is $0.365$.
The ground truth of $\text{\normalfont PNS}^{X \rightarrow Y}$ is $0.039$ and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.048$ (95\%CI: $[0.000,0.188]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.048$ (95\%CI: $[0.000,0.115]$),\\\vspace{0.1cm}
\textbf{$N=10000$}: $0.048$ (95\%CI: $[0.040,0.057]$).
\end{center}
The ground truth of $\text{\normalfont PNS}^{X \rightarrow {N}  \rightarrow Y}$ is $0.073$ and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.053$ (95\%CI: $[0.000,0.176]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.056$ (95\%CI: $[0.000,0.104]$),\\\vspace{0.1cm}
\textbf{$N=10000$}: $0.056$ (95\%CI: $[0.050,0.062]$).
\end{center}
The ground truth of $\text{\normalfont PNS}^{X \rightarrow {M} \rightarrow {N}  \rightarrow Y}$ is $0.111$, and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.078$ (95\%CI: $[0.000,0.214]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.070$ (95\%CI: $[0.000,0.135]$),\\\vspace{0.1cm}
\textbf{$N=10000$}: $0.063$ (95\%CI: $[0.055,0.071]$).
\end{center}
The ground truth of $\text{\normalfont PNS}^{X \rightarrow {M}  \rightarrow Y}$ is $0.142$ and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.101$ (95\%CI: $[0.000,0.253]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.080$ (95\%CI: $[0.000,0.163]$),\\\vspace{0.1cm}
\textbf{$N=10000$}: $0.069$ (95\%CI: $[0.057,0.081]$).
\end{center}





{\bf Results ($\alpha=0$; strong violation).}
The ground truth of $\text{\normalfont T-PNS}$ is $0.330$.
The ground truth of $\text{\normalfont PNS}^{X \rightarrow Y}$ is $0.035$ and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.048$ (95\%CI: $[0.000,0.201]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.041$ (95\%CI: $[0.000,0.125]$),\\\vspace{0.1cm}
\textbf{$N=10000$}: $0.032$ (95\%CI: $[0.022,0.043]$).
\end{center}
The ground truth of $\text{\normalfont PNS}^{X \rightarrow {N}  \rightarrow Y}$ is $0.064$ and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.038$ (95\%CI: $[0.000,0.149]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.034$ (95\%CI: $[0.000,0.091]$),\\\vspace{0.1cm}
\textbf{$N=10000$}: $0.034$ (95\%CI: $[0.027,0.042]$).
\end{center}
The ground truth of $\text{\normalfont PNS}^{X \rightarrow {M} \rightarrow {N}  \rightarrow Y}$ is $0.101$, and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.048$ (95\%CI: $[0.000,0.184]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.040$ (95\%CI: $[0.000,0.106]$),\\\vspace{0.1cm}
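% NOTE(review): the point estimate below equals the upper bound of its 95% CI; verify both values against the simulation output.
\textbf{$N=10000$}: $0.044$ (95\%CI: $[0.028,0.044]$).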
\end{center}
The ground truth of $\text{\normalfont PNS}^{X \rightarrow {M}  \rightarrow Y}$ is $0.130$ and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.069$ (95\%CI: $[0.000,0.232]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.049$ (95\%CI: $[0.000,0.137]$),\\\vspace{0.1cm}
\textbf{$N=10000$}: $0.038$ (95\%CI: $[0.026,0.048]$).
\end{center}

The bias becomes large under strong violations of monotonicity.







\subsection{Binary Outcome}
\label{appD3}



We conduct additional experiments using a logistic model for binary outcomes.

{\bf Setting.}
We consider the following SCM:
$Y$ is drawn from $\{0,1\}$ with the conditional probability
\begin{align}
\mathbb{P}(Y=1 \mid X,{M},{N},C)=\frac{1}{1+\exp(-10(X+{M}+ {N}+ C))},
\end{align}
and
\begin{equation}
\begin{gathered}
{N}:=X+ {M}+ C+U^{{N}},\\
{M}:=X+C+U^{{M}}, \quad X:=C+U^X, \quad C:=U^C,
\end{gathered}
\end{equation}
where $U^C\sim {\cal N}(0,1)$, $U^X\sim {\cal N}(0,1)$, $U^{{M}} \sim {\cal N}(0,1)$, and $U^{{N}} \sim {\cal N}(0,1)$ are mutually independent standard normal random variables.
This SCM satisfies Assumptions \ref{SCAS}, \ref{ASM}, \ref{SUP1}, \ref{AS1}, and \ref{AS1}'.
We estimate the model parameters using logistic regression.
We let $x'=0$, $x=1$, $y=0$, $c=0$, and ${\cal E}=\emptyset$.
We simulate 1000 times with the sample size $N=20$, $N=100$, and $N=10000$.





{\bf Results.}
The ground truth of $\text{\normalfont T-PNS}$ is $0.466$.
The ground truth of $\text{\normalfont PNS}^{X \rightarrow Y}$ is $0.054$ and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.092$ (95\%CI: $[0.000,0.950]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.054$ (95\%CI: $[0.000,0.159]$),\\\vspace{0.1cm}
\textbf{$N=10000$}: $0.053$ (95\%CI: $[0.048,0.058]$).
\end{center}
The ground truth of $\text{\normalfont PNS}^{X \rightarrow {N}  \rightarrow Y}$ is $0.098$ and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.080$ (95\%CI: $[0.000,0.359]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.096$ (95\%CI: $[0.013,0.202]$),\\\vspace{0.1cm}
\textbf{$N=10000$}: $0.096$ (95\%CI: $[0.089,0.103]$).
\end{center}
The ground truth of $\text{\normalfont PNS}^{X \rightarrow {M} \rightarrow {N}  \rightarrow Y}$ is $0.141$, and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.110$ (95\%CI: $[0.000,0.306]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.130$ (95\%CI: $[0.000,0.232]$),\\\vspace{0.1cm}
\textbf{$N=10000$}: $0.141$ (95\%CI: $[0.137,0.146]$).
\end{center}
The ground truth of $\text{\normalfont PNS}^{X \rightarrow {M}  \rightarrow Y}$ is $0.173$ and the estimates are
\begin{center}
\textbf{$N=20$}:\, \, \, \, $0.149$ (95\%CI: $[0.000,0.439]$),\\\vspace{0.1cm}
\textbf{$N=100$}:\, \, \,  $0.182$ (95\%CI: $[0.031,0.329]$),\\\vspace{0.1cm}
\textbf{$N=10000$}: $0.178$ (95\%CI: $[0.167,0.190]$).
\end{center}
The estimates obtained from logistic regression are reliable when the sample size is large.