
We represent a single or vector variable with a capital letter $(X)$ and its realized value with a small letter $(x)$.
Let $\mathbb{I}(\cdot)$ be an indicator function that takes $1$ if the statement in $(\cdot)$ is true and $0$ otherwise, and $\mathbbm{1}(\cdot)$ be a delta function.
Let $\Omega_Y$ be the domain of variable $Y$,
$\mathbb{E}[Y]$ be the expectation of $Y$, 
$\mathbb{P}(Y\prec y)$ be the cumulative distribution function (CDF) of continuous variable $Y$, and $\mathfrak{p}_Y(y)$ be the probability density function (PDF) of continuous variable $Y$.
We use $X \indep Y|C$ to denote that $X$ and $Y$ are conditionally independent given $C$.
We use $\preceq$ to denote a total order. {In the univariate case, the total order $\preceq$ reduces to the standard order $\leq$.}
A formal definition of total order is given in Appendix \ref{appA}.


{\bf Structural causal models (SCM).}
We use the language of SCMs as our basic %semantic and inferential 
framework and follow the standard definition \citep{Pearl09}.
An SCM ${\cal M}$ is a tuple $\left<{\boldsymbol V},{\boldsymbol U}, {\cal F}, \mathbb{P}_{\boldsymbol U} \right>$, where ${\boldsymbol U}$ is a set of exogenous (unobserved) variables following a distribution $\mathbb{P}_{\boldsymbol U}$, and ${\boldsymbol V}$ is a set of endogenous (observable) variables whose values are determined by structural functions ${\cal F}=\{f_{V_i}\}_{V_i \in {\boldsymbol V}}$ such that $v_i:= f_{V_i}({\mathbf{pa}}_{V_i},{\boldsymbol u}_{V_i})$ where ${\mathbf{PA}}_{V_i} \subseteq {\boldsymbol V}$ and $\boldsymbol{U}_{V_i} \subseteq {\boldsymbol U}$. 
Each SCM ${\cal M}$ induces an observational distribution $\mathbb{P}_{\boldsymbol V}$ over ${\boldsymbol V}$, and a causal graph $G({\cal M})$ %over ${\boldsymbol V}$ 
in which there exists a directed edge from every variable in ${\mathbf{PA}}_{V_i}$ and $\boldsymbol{U}_{V_i}$ to $V_i$. 
An intervention of setting a set of endogenous variables ${\boldsymbol X}$ to constants ${\boldsymbol x}$, denoted by $do({\boldsymbol x})$, replaces the original equations of ${\boldsymbol X}$
 by the constants ${\boldsymbol x}$ and induces a \textit{sub-model}  ${\cal M}_{{\boldsymbol x}}$.
We denote the potential outcome $Y$ under intervention $do({\boldsymbol x})$ by $Y_{{\boldsymbol x}}({\boldsymbol u})$, which is the solution of $Y$ in the sub-model ${\cal M}_{{\boldsymbol x}}$ given ${\boldsymbol U}={\boldsymbol u}$. 





%\begin{figure}[tb]
%\vspace{-0.5cm}
   % \hspace{0.3cm}
%    \centering
 %   \scalebox{0.8}{
%\begin{tikzpicture}
    % x node set with absolute coordinates
 %   \node[mynode] (x) at (0,0) {$X$};
   % \node[mynode] (y) at (3,0) {$Y$};
  %  \node[mynode] (u) at (1.5,1) {$C$};
    %\node[mynode] (m) at (1.5,-1) {$M$};

    % Directed edge
    %\path (x) edge[->] (y);
    %\path (x) edge[dotted,<->,bend right] (y);
%    \path (z) edge[->] (x);
    %\path (u) edge[->] (y);
%    \path (u) edge[dotted,<->,bend left] (y);
    %\path (u) edge[->]  (x);
%\path (x) edge[dotted,<->,bend left] (u);

%\path (x) edge[->] (m);
%\path (m) edge[->] (y);
%\path (u) edge[->] (m);
%\end{tikzpicture}
%}
%\vspace{-0cm}
 %   \caption{A causal graph representing SCM ${\cal M}$.}
  %  \label{DAG1}
   % \end{figure}



%{\bf Causal mediation analysis.} 
%\jin{Delete or shorten this part}
%\st{Causal mediation analysis reveals the strength of different pathways between treatment and outcome through a mediator.
%For the causal mediation analysis, researchers often consider the following SCM ${\cal M}_1$:}
%\begin{equation}
%\begin{gathered}
%Y:=f_Y(X,{M},C,U^Y), {M}:=f_{{M}}(X,C,U^{{M}}), \\
%X:=f_X(C,U^X), C:=f_C(U^C),
%\end{gathered}
%\end{equation}
%\st{where all variables can be vectors, and $U^X$, $U^C$, $U^Y$, and $U^{{M}}$ are latent exogenous variables.
%We assume that the domains $\Omega_Y$ and $\Omega_{U^Y} \times \Omega_{U^{{M}}}$ are totally ordered sets with $\preceq$.}
%\citet{Pearl2001} defined the total, controlled direct, natural direct, and natural indirect effects for general (nonlinear and nonparametric) SCM ${\cal M}_1$. 
%\begin{definition}[TE, CDE, NDE, and NIE] \citep{Pearl2001}
%\label{def1}
%\st{The total, controlled direct, natural direct, and natural indirect effects (TE, CDE, NDE, and NIE) are defined by
%\begin{enumerate}
%\setlength{\itemsep}{2pt}
%\setlength{\parskip}{2pt}
%    \item Total Effect (TE):
%$\text{\normalfont TE}(y;x',x)\defeq\mathbb{E}[Y_{x}]-\mathbb{E}[Y_{x'}]$,
    %$\text{\normalfont TE}(y;x',x)\defeq\mathbb{P}(Y_{x'}\prec y)-\mathbb{P}(Y_{x}\prec y)$
%    \item Controlled Direct Effect (CDE):
%$\text{\normalfont CDE}(y;x',x,{m})\defeq\mathbb{E}[Y_{x,{{m}}}]-\mathbb{E}[Y_{x',{{m}}}]$,
    %$\text{\normalfont CDE}(y;x',x,m)\defeq\mathbb{P}(Y_{x',{m}}\prec y)-\mathbb{P}(Y_{x,{m}}\prec y)$
 %   \item Natural Direct Effect (NDE): 
% $\text{\normalfont NDE}(y;x',x)\defeq\mathbb{E}[Y_{x,{{M}_{x'}}}]-\mathbb{E}[Y_{x'}]$, and
    %\mathbb{E}[Y_{x}]-\mathbb{E}[Y_{x',{M_{x}}}]$
    %$\text{\normalfont NDE}(y;x',x)\defeq\mathbb{P}(Y_{x',{M_{x}}} \prec y)-\mathbb{P}(Y_{x} \prec y)$
    %\item Natural Indirect Effect (NIE):
%    $\text{\normalfont NIE}(y;x',x)\defeq\mathbb{E}[Y_{x',{{M}_{x}}}]-\mathbb{E}[Y_{x'}]$.}
    %\mathbb{E}[Y_{x',{M_{x}}}]-\mathbb{E}[Y_{x'}]$
    %$\text{\normalfont NIE}(y;x',x)\defeq\mathbb{P}(Y_{x'} \prec y)-\mathbb{P}(Y_{x',{M_{x}}} \prec y)$
%\end{enumerate}
%\end{definition}
%\noindent CDE represents the causal effect of changing the treatment from $x'$ to $x$ had the value of the mediator been fixed at a certain value.
%NDE represents the causal effect of changing the treatment from $x'$ to $x$  had the value of the mediator been kept to the same value $M_{x'}$ that $M$ attains under $x'$. 
%NIE represents the causal effect of changing the mediator from $M_{x'}$ to $M_{x}$ had the value of the treatment been fixed to $x'$.
%TE can be decomposed into NDE and NIE by $\text{\normalfont TE}(y;x',x)=\text{\normalfont NDE}(y;x',x)-\text{\normalfont NIE}(y;x,x')=\text{\normalfont NIE}(y;x',x)-\text{\normalfont NDE}(y;x,x')$. 
%\st{These direct and indirect effects can be identified from observational distributions under various settings }\citep{Pearl2001,Avin2005,Shpitser2008,Malinsky2019,Imai2010b}. 

{\bf Probabilities of causation (PoC) and mediation analysis for PoC.}
\citet{Kawakami2024} considered the following SCM:
\begin{equation}
\begin{gathered}
Y:=f_Y(X,C,U^Y), X:=f_X(C,U^X), C:=f_C(U^C),
\end{gathered}
\end{equation}
where all variables can be vectors, and $U^X$, $U^C$, and $U^Y$ are latent exogenous variables, and
defined the (multivariate  conditional) PoC for vectors of continuous or discrete variables as follows:
\begin{definition}[PNS with Evidence] \citep{Kawakami2024}
\label{def41}
%For any $x',x \in \Omega_X$, $y \in \Omega_Y$, and $c \in \Omega_C$, 
The 
%(multivariate  conditional) 
PNS with evidence is defined as 
%\begin{equation}
$\text{\normalfont PNS}(y;x',x,{\cal E},c)\defeq\mathbb{P}(Y_{x'} \prec y \preceq Y_{x}|{\cal E},C=c)$. 
%\end{equation}
%\begin{equation}
%\text{\normalfont PN}(y;x',x,{\cal E},c)\defeq\mathbb{P}(Y_{x'} \prec y |y \preceq Y,X=x,{\cal E},C=c),
%\end{equation}
%\begin{equation}
%\text{\normalfont PS}(y;x',x,{\cal E},c)\defeq\mathbb{P}(y \preceq Y_{x} |Y \prec y,X=x',{\cal E},C=c).
%\end{equation}
\end{definition}
In the above definition, {$C$ and ${\cal E}$ represent the information used to characterize a specific targeted subpopulation.
$C$ consists of subjects’ pre-treatment covariates, and ${\cal E}$ contains information about post-treatment variables, commonly referred to as evidence.
$\text{\normalfont PNS}(y;x',x,{\cal E},c)$ provides a measure of the necessity and sufficiency of $x$ w.r.t. $x'$ to produce $Y \succeq y$ given $C= c$ and evidence ${\cal E}$, that is, when $X$ is set to $X=x$, the event $Y \succeq y$ occurs; when $X$ is set to $X=x'$, the event $Y \succeq y$ does not occur.}
{Note that PNS with ${\cal E}=(y \preceq Y, X=x)$ coincides with the probability of necessity (PN), and PNS with ${\cal E}=(Y \prec y, X=x')$ coincides with the probability of sufficiency (PS) \citep{Kawakami2024med}.}

%\noindent $\text{\normalfont PNS}(y;x',x,{\cal E},c)$ provides a measure of the necessity and sufficiency of $x$ w.r.t. $x'$ to produce $Y\succeq y$ given $C=c$ and ${\cal E}$.
%$\text{\normalfont PNS}(y;x',x,{\cal E},c)$ include PN and PS, which is defined as $\text{\normalfont PN}(y;x',x,c)\defeq\mathbb{P}(Y_{x'} \prec y |y \preceq Y,X=x,C=c)$ and $\text{\normalfont PS}(y;x',x,c)\defeq\mathbb{P}(y \preceq Y_{x} |Y \prec y,X=x',C=c)$.
%$\text{\normalfont PN}(y;x',x,c)$ and $\text{\normalfont PS}(y;x',x,c)$ provide a measure of the necessity and sufficiency, respectively, of $x$ w.r.t. $x'$ to produce $Y\succeq y$ given $C=c$.
%$\text{\normalfont PS}(y;x',x,c)$ provides a measure of the sufficiency of $x$ w.r.t. $x'$ to produce $Y\succeq y$ given $C=c$.
We will often call $\text{\normalfont PNS}$ \textit{total PNS (T-PNS)} and denote it by $\text{\normalfont T-PNS}(y;x',x,{\cal E},c)$  for convenience. 
%Figure \ref{fig2} (a) shows the situation of potential outcomes in T-PNS.
%When treatment $X$ and outcome $Y$ are binary, 
%PNS, PS, and PS become (setting $y=1$) 
%$\text{\normalfont PNS}(c)=\mathbb{P}(Y_{0}=0,Y_{1}=1|C=c)$,
%$\text{\normalfont PN}(c)=\mathbb{P}(Y_{0}=0|Y=1,X=1,C=c)$, and 
%$\text{\normalfont PS}(c)=\mathbb{P}(Y_{1}=1|Y=0,X=0,C=c)$
%for any $c \in \Omega_C$, which reduce to Pearl's (1999) original definition when $C=\emptyset$.
%In the studies \citep{Dawid2017,Cuellar2020}, PN is called PoC.

Recently, \citet{Kawakami2024med} considered the following SCM ${\cal M}_1${, corresponding to the causal graph in Figure~\ref{DAG0}}:
\begin{equation}
\begin{gathered}
Y:=f_Y(X,{M},C,U^Y), {M}:=f_{{M}}(X,C,U^{{M}}), \\
X:=f_X(C,U^X), C:=f_C(U^C),
\end{gathered}
\end{equation}
where all variables can be vectors, and $U^X$, $U^C$, $U^Y$, and $U^{{M}}$ are latent exogenous variables.

\citet{Kawakami2024med} defined the (conditional) controlled direct, natural direct, and natural indirect probabilities of necessity and sufficiency with evidence.
%to answer the questions (Q-a) and (Q-b)
%as below.
\begin{definition}[CD-PNS, ND-PNS, and NI-PNS with Evidence]
\label{def3}
%For each $x',x \in \Omega_X$, $m \in \Omega_M$, $y \in \Omega_Y$, and $c \in \Omega_C$, 
The controlled direct, natural direct, and natural indirect %probabilities of necessity and sufficiency 
PNS (CD-PNS, ND-PNS, and NI-PNS) with evidence w.r.t. $M$ are defined by
%\begin{align}
$\text{\normalfont CD-PNS}(y;x',x,m,{\cal E},c)\defeq\mathbb{P}(Y_{x',m} \prec y \preceq Y_{x,m}|{\cal E},C=c)$, 
$\text{\normalfont ND-PNS}(y;x',x,{\cal E},c)\defeq\mathbb{P}(Y_{x'} \prec y \preceq Y_{x}, Y_{x',M_{x}} \prec y|{\cal E},C=c)$, and
$\text{\normalfont NI-PNS}(y;x',x,{\cal E},c)\defeq\mathbb{P}(Y_{x'} \prec y \preceq Y_{x},y \preceq Y_{x',M_{x}}|{\cal E},C=c)$.
%\end{align}
\end{definition}
%, including the evidence of PN and PS.
ND-PNS and NI-PNS can answer the causal questions (Q-a) and (Q-b), respectively.
$\text{\normalfont T-PNS}$ is decomposed as $\text{\normalfont ND-PNS}+\text{\normalfont NI-PNS}$.
However, their applicability is restricted to the single mediator case, limiting their ability to capture more complex mediation pathways involving additional mediators.




\begin{figure}[tb]
%\vspace{-0.5cm}
   % \hspace{0.3cm}
    \centering
    \scalebox{1}{
\begin{tikzpicture}
    % x node set with absolute coordinates
    \node[mynode] (x) at (0,0) {$X$};
    \node[mynode] (y) at (4,0) {$Y$};
    \node[mynode] (u) at (2,1.25) {$C$};
    \node[mynode] (m) at (2,-1.25) {${M}$};
    
    %\node[mynode] (m2) at (3,-1.5) {${N}$};

    % Directed edge
    \path (x) edge[->] (y);
    %\path (x) edge[dotted,<->,bend right] (y);
%    \path (z) edge[->] (x);
    \path (u) edge[->] (y);
%    \path (u) edge[dotted,<->,bend left] (y);
    \path (u) edge[->]  (x);
%\path (x) edge[dotted,<->,bend left] (u);

\path (x) edge[->] (m);
\path (m) edge[->] (y);
\path (u) edge[->] (m);


%\path (x) edge[->] (m2);
%\path (m) edge[->] (m2);
%\path (u) edge[->] (m2);
%\path (m2) edge[->] (y);
\end{tikzpicture}
}
%\vspace{-0cm}
    \caption{A causal graph representing SCM ${\cal M}_1$.}
    \label{DAG0}
    \end{figure}


\begin{figure}[tb]
%\vspace{-0.5cm}
   % \hspace{0.3cm}
    \centering
    \scalebox{1}{
\begin{tikzpicture}
    % x node set with absolute coordinates
    \node[mynode] (x) at (0,0) {$X$};
    \node[mynode] (y) at (4,0) {$Y$};
    \node[mynode] (u) at (2,1.25) {$C$};
    \node[mynode] (m) at (1,-1.5) {${M}$};
    
    \node[mynode] (m2) at (3,-1.5) {${N}$};

    % Directed edge
    \path (x) edge[->] (y);
    %\path (x) edge[dotted,<->,bend right] (y);
%    \path (z) edge[->] (x);
    \path (u) edge[->] (y);
%    \path (u) edge[dotted,<->,bend left] (y);
    \path (u) edge[->]  (x);
%\path (x) edge[dotted,<->,bend left] (u);

\path (x) edge[->] (m);
\path (m) edge[->] (y);
\path (u) edge[->] (m);


\path (x) edge[->] (m2);
\path (m) edge[->] (m2);
\path (u) edge[->] (m2);
\path (m2) edge[->] (y);
\end{tikzpicture}
}
%\vspace{-0cm}
    \caption{A causal graph representing SCM ${\cal M}_2$.}
    \label{DAG1}
    \end{figure}






{\bf Causal mediation analysis for two mediators.}
%\citet{Daniel2015} and \citet{Zhou2023} have studied the causal mediation analysis with multiple mediators.
Researchers often consider the following SCM ${\cal M}_2$ with two mediators, corresponding to the causal graph in Figure~\ref{DAG1}:
\begin{equation}
\begin{gathered}
Y:=f_Y(X,{M},{N},C,U^Y), {N}:=f_{{N}}(X,{M},C,U^{{N}}),\\ {M}:=f_{{M}}(X,C,U^{{M}}),X:=f_X(C,U^X),C:=f_C(U^C),
\end{gathered}
\end{equation}
where all variables can be vectors, 
and $U^X$, $U^C$, $U^Y$, $U^{{M}}$, and $U^{{N}}$ are latent exogenous variables.
We assume that the domains $\Omega_Y$ and $\Omega_{U^Y} \times \Omega_{U^{{M}}} \times \Omega_{U^{{N}}}$ are totally ordered sets with $\preceq$.
SCM ${\cal M}_2$ assumes that the two mediators are causally ordered, i.e., ${M}$ is a cause of ${N}$.


One of the most widely used models in mediation analysis with multiple mediators is a linear SCM ${\cal M}^{L2}$ %with normal distribution 
%\citep{Baron1986} 
consisting of 
%Especially, the linear SCM with normal distribution ${\cal M}^L$ consists of 
$Y:=\alpha_0+\alpha_1 X+\alpha_2 {M}+\alpha_3 {N}+\alpha_4 C+U^Y$, ${N}:=\beta_0+\beta_1 X+\beta_2 {M}+\beta_3 C+U^{{N}}$, and ${M}:=\gamma_0+\gamma_1 X+\gamma_2 C+U^{{M}}$, where $U^C\sim {\cal N}(0,\sigma_C)$, $U^X\sim {\cal N}(0,\sigma_X)$, $U^Y\sim {\cal N}(0,\sigma_Y)$, $U^{{M}} \sim {\cal N}(0,\sigma_{{M}})$, $U^{{N}} \sim {\cal N}(0,\sigma_{{N}})$, and these exogenous variables are mutually independent.
${\cal N}(\mu,\sigma)$ means a normal distribution whose mean is $\mu$ and standard deviation is $\sigma$.
%${\cal M}^L$ is the most widely used model in the mediation analysis \citep{Baron1986}.
%Under SCM ${\cal M}^L$, the total effect of $X$ on $Y$ is $\alpha_1+\beta_1\alpha_2$, the indirect effect is $\beta_1\alpha_2$, and the direct effect is $\alpha_1$.


Then, \citet{Daniel2015} defined the 
%\hl{56}\jin{??} 
natural path-specific causal effects for binary treatment using the expectation of the counterfactuals, e.g.,
$\mathbb{E}[Y_{1,{M}_{1},{N}_{1,{M}_{0}}}]-\mathbb{E}[Y_{1,{M}_{1},{N}_{0,{M}_{0}}}]$.
They impose the following assumption to identify the path-specific causal effects.
%$\mathbb{P}\Big(Y_{x,{M}_{x'},{N}_{x'',{M}_{x'''}}}>y\Big)$.
\begin{assumption}%[Assumptions for Path-Specific Effects]
\label{SCAS}
The following conditional independence statements hold:
%\begin{equation}
%\begin{gathered}
${\normalfont (1)} \{Y_{x,{m},{n}},{M}_x,{N}_{x,{m}}\} \indep X|C=c$,
${\normalfont (2)} \{Y_{x,{m},{n}},{N}_{x,{m}}\} \indep {M}|C=c,X=x$, and
${\normalfont (3)} Y_{x,{m},{n}} \indep {N}|C=c,X=x,{M}={m}$,
%\end{gathered}
%\end{equation}
for any ${m} \in \Omega_{{M}}$, ${n} \in \Omega_{{N}}$, $x \in \Omega_X$, and $c \in \Omega_C$, where $\mathfrak{p}_{X|C}(x|c)>0$, $\mathfrak{p}_{{M}|C,X}({m}|c,x)>0$, $\mathfrak{p}_{{N}|C,X,{M}}({n}|c,x'',{{m}}')>0$, and $\mathfrak{p}_{{M}_{x'''}|C,{M}_{x'}}({{m}}'|c,{m})>0$ for any ${m}, {{m}}' \in \Omega_{{M}}$, ${n} \in \Omega_{{N}}$, $x, x', x'', x''' \in \Omega_X$, and $c \in \Omega_C$.
\end{assumption}
These independence conditions hold when there are no unmeasured confounders (or bidirected edges) for the relationships $\{X,{M},{N}\} \rightarrow Y$, $\{X,{M}\} \rightarrow {N}$, and $X \rightarrow {M}$.
The consistency conditions of $\{X,{M},{N}\}$ on $Y$, $X$ on ${M}$, and $\{X,{M}\}$ on ${N}$ assumed by \citet{Daniel2015} hold under SCM ${\cal M}_2$.

\begin{lemma}%[$\mathbb{P}\Big(Y_{x,{M}_{x'},{N}_{x'',{M}_{x'''}}}\prec y\Big)$] 
\citep{Daniel2015}
\label{lem2}
Under SCM ${\cal M}_2$  and Assumption \ref{SCAS}, 
the conditional CDF of potential outcome $\mathbb{P}(Y_{x,{M}_{x'},{N}_{x'',{M}_{x'''}}}\prec y|C=c)$ is given by
\begin{align}
\label{eq3}
&\mathbb{P}(Y_{x,{M}_{x'},{N}_{x'',{M}_{x'''}}}\prec y|C=c)=\int_{\Omega_{{M}}}\int_{\Omega_{{M}}}\int_{\Omega_{{N}}}\nonumber\\
&\hspace{0.5cm}\mathbb{P}(Y\prec y|X=x,{M}={m},{N}={n},C=c)\nonumber\\
&\hspace{0.5cm}\times\mathfrak{p}_{{N}|C,X,{M}}({n}|c,x'',{{m}}')\ \mathfrak{p}_{{M}_{x'''}|C,{M}_{x'}}({{m}}'|c,{m})\nonumber\\
&\hspace{0.5cm}\times\mathfrak{p}_{{M}|C,X}({m}|c,x')\ d{n}d{m}d{{m}}'
\end{align}
for any $x, x', x'', x''' \in \Omega_X$, $y \in \Omega_Y$, and $c \in \Omega_C$.
\end{lemma}
This lemma does not imply the identification of $\mathbb{P}(Y_{x,{M}_{x'},{N}_{x'',{M}_{x'''}}}\prec y|C=c)$.
Instead, it states that $\mathbb{P}(Y_{x,{M}_{x'},{N}_{x'',{M}_{x'''}}}\prec y|C=c)$ is identifiable if $\mathfrak{p}_{{M}_{x'''}|C,{M}_{x'}}({{m}}'|c,{m})$ is known or identifiable.
{Appendix \ref{appA3} presents the explicit form of the distribution of $Y_{x,{M}_{x'},{N}_{x'',{M}_{x'''}}}$ derived under two simple SCMs.}



Furthermore, \citet{Daniel2015} showed three special cases in which $\mathfrak{p}_{{M}_{x'''}|C,{M}_{x'}}({{m}}'|c,{m})$ is identifiable.
First, if $x'=x'''$, then $\mathfrak{p}_{{M}_{x'''}|C,{M}_{x'}}({{m}}'|c,{m})=\mathbbm{1}({m}={{m}}')$ holds.
Second, if there exists no effect of ${M}$ on ${N}$, then
%{\small
%\begin{align}
$\mathbb{P}(Y_{x,{M}_{x'},{N}_{x'',{M}_{x'''}}}\prec y|C=c)=\int_{\Omega_{{M}}}\int_{\Omega_{{N}}}\mathbb{P}(Y\prec y|X=x,{M}={m},{N}={n},C=c)\mathfrak{p}_{{N}|C,X}({n}|c,x'')\mathfrak{p}_{{M}|C,X}({m}|c,x')d{n}d{m}$
%\end{align}
%}
holds.
Third, if we assume a specific model with Gaussian noise, i.e., ${M}|X,C \sim {\cal N}(f(X,C;\alpha),\sigma)$, then we can identify $\mathfrak{p}_{{M}_{x'''}|C,{M}_{x'}}({{m}}'|c,{m})$, where $f(X,C;\alpha)$ represents a parametric model.








%[why do you need $Y_x' < y$? That is , why do you insist on T-PNS when considering NDE?]

%\yuta{
%Alternatively, one may define ND-PNS and NI-PNS as
%$\text{\normalfont ND-PNS'}(y;x',x,{\cal E},c)\defeq\mathbb{P}(Y_{x',M_{x}} \prec y \preceq Y_{x}|{\cal E},C=c)$, and
%$\text{\normalfont NI-PNS'}(y;x',x,{\cal E},c)\defeq\mathbb{P}(Y_{x'} \prec y \preceq Y_{x',M_{x}}|{\cal E},C=c)$.
%Since we have
%\begin{align}
%&\mathbb{P}(Y_{x',M_{x}} \prec y \preceq Y_{x}|{\cal E},c)\\
%&=\mathbb{P}(Y_{x'} \prec y,Y_{x',M_{x}} \prec y \preceq Y_{x}|{\cal E},c)\\
%&+\mathbb{P}(y\preceq Y_{x'},Y_{x',M_{x}} \prec y \preceq Y_{x}|{\cal E},c),
%\end{align}
%and 
%\begin{align}
%&\mathbb{P}(Y_{x'} \prec y \preceq Y_{x',M_{x}}|{\cal E},c)\\
%&=\mathbb{P}(Y_x \prec y,Y_{x'} \prec y \preceq Y_{x',M_{x}}|{\cal E},c)\\
%&+\mathbb{P}(y\preceq Y_x,Y_{x'} \prec y \preceq Y_{x',M_{x}}|{\cal E},c),
%\end{align}
%then the decomposition relationship $\text{\normalfont T-PNS}(y;x',x,{\cal E},c)=\text{\normalfont ND-PNS'}(y;x',x,{\cal E},c)+\text{\normalfont NI-PNS'}(y;x',x,{\cal E},c)$ does not hold.
%We have 
%\begin{align}
%&\text{\normalfont ND-PNS'}(y;x',x,{\cal E},c)+\text{\normalfont NI-PNS'}(y;x',x,{\cal E},c)\\
%&=\text{\normalfont T-PNS}(y;x',x,{\cal E},c)+\mathbb{P}(Y_x \prec y,Y_{x'} \prec y).
%\end{align}
%}




%\yuta{The definitions of ND-PNS and NI-PNS, when formulated without the term $Y_{x'} \prec y$, lead to an unintuitive result.
%When $\mathbb{P}(Y_{x'} \prec y,Y_{x',M_{x}} \prec y \preceq Y_{x})=0$, $\mathbb{P}(y\preceq Y_{x'},Y_{x',M_{x}} \prec y \preceq Y_{x})>0$, $\mathbb{P}(Y_x \prec y,Y_{x'} \prec y \preceq Y_{x',M_{x}})>0$, and $\mathbb{P}(y\preceq Y_x,Y_{x'} \prec y \preceq Y_{x',M_{x}})=0$, 
%we have $\text{\normalfont ND-PNS'}(y;x',x,{\cal E},c)>0$, $\text{\normalfont NI-PNS'}(y;x',x,{\cal E},c)>0$, and $\text{\normalfont T-PNS}(y;x',x,{\cal E},c)=0$.
%This means the treatment $x$ is necessary and sufficient w.r.t. $x'$ to provoke the event $y \preceq Y$ through directly and indirectly, respectively, to some extent.
%However, the treatment $x$ is not necessary and sufficient w.r.t. $x'$ to provoke the event $y \preceq Y$ along with both paths.
%This is an unintuitive result.}


%[It looks like the AAAI definitions are more like (ND-PNS AND T-PNS) and  (NI-PNS AND T-PNS).]



%\yuta{We denote the counterfactual conditions of ``total necessity and sufficiency" (T-NS), ``natural direct necessity and sufficiency" (ND-NS), and ``natural indirect necessity and sufficiency" (NI-NS) as
%\begin{align}
%&\text{\normalfont T-NS}(y;x',x)=\mathbb{I}(Y_{x'} \prec y \preceq Y_{x})\\
%&\text{\normalfont ND-NS}(y;x',x,x^*)=\mathbb{I}(Y_{x',M_{x^*}} \prec y \preceq Y_{x,M_{x^*}}),\\
%&\text{\normalfont NI-NS}(y;x',x,x^*)=\mathbb{I}(Y_{x^*,M_{x'}} \prec y \preceq Y_{x^*,M_{x}}).
%\end{align}
%$\text{\normalfont ND-NS}(y;x',x,x^*)$ represents the treatment $x$ is necessary and sufficient w.r.t. $x'$ to provoke the event $y \preceq Y$ while keeping the mediator value as ${M}_{x^*}$.
%$\text{\normalfont NI-NS}(y;x',x,x^*)$ represents ${M}_{x}$ is necessary and sufficient w.r.t. ${M}_{x'}$ to provoke the event $y \preceq Y$ while setting the treatment as $x^*$.
%Then, the definitions of ND-PNS and NI-PNS are given as $\text{\normalfont ND-PNS}(y;x',x,{\cal E},c)=\mathbb{P}(\text{\normalfont T-NS}(y;x',x)\times \text{\normalfont ND-NS}(y;x',x,x)=1|{\cal E},C=c)$ and $\text{\normalfont NI-PNS}(y;x',x,{\cal E},c)=\mathbb{P}(\text{\normalfont T-NS}(y;x',x)\times \text{\normalfont NI-NS}(y;x',x,x')=1|{\cal E},C=c)$.}





%\yuta{
%More generally, the definitions of ND-PNS and NI-PNS can be expressed as $\text{\normalfont ND-PNS}(y;x',x,x^*,{\cal E},c)=\mathbb{P}(\text{\normalfont T-NS}(y;x',x)\times \text{\normalfont ND-NS}(y;x',x,x^*)=1|{\cal E},C=c)$ and $\text{\normalfont NI-PNS}(y;x',x,x^*,{\cal E},c)=\mathbb{P}(\text{\normalfont T-NS}(y;x',x)\times \text{\normalfont NI-NS}(y;x',x,x^*)=1|{\cal E},C=c)$ for $x^* \in \{x',x\}$.
%}




%[ND-PNS was defined based on NDE(x,x') instead of NDE(x',x).]


%\yuta{[When we define $\text{\normalfont ND-PNS}(y;x',x,{\cal E},c)\defeq\mathbb{P}(Y_{x'} \prec y \preceq Y_{x}, Y_{x,M_{x'}} \prec y|{\cal E},C=c)$, 
%$\text{\normalfont ND-PNS}(y;x,x',{\cal E},c)\defeq\mathbb{P}(Y_{x} \prec y \preceq Y_{x'}, Y_{x',M_{x}} \prec y|{\cal E},C=c)$, which does not coincide with AAAI definition.
%When we define $\text{\normalfont ND-PNS}(y;x',x,{\cal E},c)\defeq\mathbb{P}(Y_{x} \prec y \preceq Y_{x'}, Y_{x,M_{x'}} \prec y|{\cal E},C=c)$, 
%$\text{\normalfont ND-PNS}(y;x,x',{\cal E},c)\defeq\mathbb{P}(Y_{x'} \prec y \preceq Y_{x}, Y_{x',M_{x}} \prec y|{\cal E},C=c)$, which coincides with AAAI definition.]}



