

In this section, we study the (central) moments of causal effects $Y_1 - Y_0$ to address (\textbf{Question 1}). %We examine the causal effect $Y_1 - Y_0$.
%We examine the comparison of two potential outcomes $(Y_1, Y_0)$. % in the setting where $\Omega_X = \{0,1\}$.


\subsection{Definition of the moments of causal effects} % of momemts of causal effects}
\label{sec-mce}
%{\bf Definition of the moment of causal effects.}
We define the moments of causal effects in the same manner as the moments of random variables.
\begin{definition}[The moments of causal effects]
For each $m\geq 1$,
the $m$-th moment of causal effect $Y_1-Y_0$ is defined as 
\begin{equation}
\mu^{(m)}\defeq\mathbb{E}\Big[(Y_1-Y_0)^m\Big].
\end{equation}
\end{definition}
The $m$-th moment of the causal effect is defined as the expectation of the $m$-th power of the causal effect $Y_1 - Y_0$.
The first moment, $\mu^{(1)}=\mathbb{E}[Y_1 - Y_0]$, is the ACE.
%When $m \geq 2$, $\mu^{(m)}$ is not equal to $\mathbb{E}[Y_1^m - Y_0^m]$, as discussed in \citep{Hernan2024, Kuroki2024}. Under the exogeneity assumption (Assumption \ref{ASEXO2}), $\mathbb{E}[Y_1^m - Y_0^m]$ is identifiable as $\mathbb{E}[Y^m | X = 1] - \mathbb{E}[Y^m | X = 0]$. However, $\mu^{(m)}$ remains unidentifiable because both $Y_1$ and $Y_0$ are never simultaneously observed for any subject \citep{Holland1986, Hernan2024}. For example, the second moment of the causal effect, $\mu^{(2)}$, is given by $\mathbb{E}[Y_1^2]-2\mathbb{E}[Y_0 Y_1]+\mathbb{E}[Y_0^2]$. However, the term $\mathbb{E}[Y_0 Y_1]$ is not identifiable because $Y_0$ and $Y_1$ are never observed simultaneously for any subject.





We present two examples to illustrate what the moments of causal effects specifically measure in simple SCMs.


{\bf Example 1.} (Homogeneous ICE)
Consider a simple linear SCM given by $Y=X+U^Y$ where $\mathbb{E}[U^Y]=0$.
In this model, the ICE is equal to $1$ for every subject, meaning that the causal effect is homogeneous.
Consequently, all of the $m$-th moments of the causal effect are also equal to $1$.
Note that %$\mathbb{E}[Y^m]=\mathbb{E}[(X+U^Y)^m]$ and 
$\mathbb{E}[Y_1^m-Y_0^m]=\mathbb{E}[(1+U^Y)^m-(U^Y)^m]$ {varies with $m$.} 

{\bf Example 2.} (Heterogeneous ICE)
Consider a linear SCM with an interaction term between $X$ and $U^Y$, $Y=X(U^Y+1)+1$ where $\mathbb{E}[U^Y]=0$.
In this model, $\text{ICE} = Y_1 - Y_0 = U^Y+1$, which varies across subjects, making the causal effect heterogeneous.
The $m$-th moment of the causal effect  is given by $\mathbb{E}[(U^Y+1)^m]$.
In comparison, %$\mathbb{E}[Y^m]=\mathbb{E}[(X(U^Y+1)+1)^m]$ and 
$\mathbb{E}[Y_1^m-Y_0^m]=\mathbb{E}[(U^Y+2)^m-1]$.


%\yuta{For a continuous outcome, several studies \citep{DiNardo1996,Kennedy2023d} aim to estimate the PDF of $Y_x$, i.e., $\mathfrak{p}_{Y_x}$. However, identifying the moments of causal effects requires the joint PDF of $(Y_0, Y_1)$, i.e., $\mathfrak{p}_{(Y_0,Y_1)}$. $\mu^{(m)}$ is given by $\int_{\Omega_Y}(y_1-y_0)^m\mathfrak{p}_{(Y_0,Y_1)}(y_0,y_1)dy_0dy_1$.
%\citep{Hoshino2020} studied the identification problem of the joint PDF of $(Y_0,Y_1)$ under various parametric specifications.}

%\yuta{Since the joint CDF of $(Y_0, Y_1)$, i.e., $\mathbb{P}(Y_0 < y_0, Y_1 < y_1)$, is identified as $\min\{\mathbb{P}(Y_0 < y_0), \mathbb{P}(Y_1 < y_1)\}$ under Assumption \ref{MONO2}, the joint PDF of $(Y_0, Y_1)$ is then given by $\mathfrak{p}_{(Y_0,Y_1)}(y_0,y_1)=\frac{\partial^2\mathbb{P}(Y_0<y_0,Y_1<y_1)}{\partial_{y_0}\partial_{y_1}}=\frac{\partial^2\min\{\mathbb{P}(Y_0 < y_0), \mathbb{P}(Y_1 < y_1)\}}{\partial_{y_0}\partial_{y_1}}$ if it exists.}






%\subsection{Central momemts of causal effects}


%\yuta{The second central moments of causal effects (variance) are discussed in \citep{Hernan2024}.}
%\yuta{\citet{Heckman1997} showed the identification of ICE, under the rank invariance assumption, which states that ``$\mathbb{P}(Y_0<y_0)=\mathbb{P}(Y_1<y_1)$ holds  for almost every subject whose potential outcomes are $(Y_1,Y_0)=(y_1,y_0)$" in the case of a continuous outcome. Then, they also provide the identification of the variance of causal effects by identifying ICE. Their results are restricted to the case of continuous outcomes.}
%, whereas our Assumption \ref{MONO2} is applicable to discrete or binary outcomes.}






%We define the central moments of causal effects in a general form.
The central moments of causal effects are defined as the moments of causal effects measured relative to their mean.
%{\bf Definition of the central moment of causal effects.}
\begin{definition}[The central moment of causal effects]
For each $m\geq 1$,
the $m$-th central moment of causal effect $Y_1-Y_0$ is defined as
\begin{equation}
\overline{\mu}^{(m)}\defeq\mathbb{E}\Big[\Big\{(Y_1-Y_0)-(\mathbb{E}[Y_1]-\mathbb{E}[Y_0])\Big\}^m\Big].
\end{equation}
\end{definition}
%The $m$-th central moment of $Y_1 - Y_0$ is defined as the expectation of the $m$-th power of the deviation of $Y_1 - Y_0$ from its mean, given by $(Y_1-Y_0)-(\mathbb{E}[Y_1]-\mathbb{E}[Y_0])$.
The first central moment of causal effects is always $0$ since we have $\overline{\mu}^{(1)}=\mathbb{E}[(Y_1-Y_0)]-\mathbb{E}[(\mathbb{E}[Y_1]-\mathbb{E}[Y_0])]=0$.
When $m\geq 2$, $\overline{\mu}^{(m)}$ is not equal to $\mathbb{E}[(Y_1-\mathbb{E}[Y_1])^m]-\mathbb{E}[(Y_0-\mathbb{E}[Y_0])^m]$ as discussed in \citep{Wiedermann2022}. 


We revisit Examples 1 and 2 in Section~\ref{sec-mce}  to illustrate  the central moments of causal effects. % specifically measure in simple SCMs.


{\bf Example 1 (continued).} (Homogeneous ICE)
%Revisiting Example 1, 
In SCM given by $Y=X+U^Y$ where $\mathbb{E}[U^Y]=0$, the $m$-th central moment is equal to $0$ for any $m \geq 1$, indicating that the causal effect is homogeneous.




{\bf Example 2 (continued).} (Heterogeneous ICE)
%Revisiting Example 2, 
In SCM $Y=X(U^Y+1)+1$ where $\mathbb{E}[U^Y]=0$, the $m$-th central moment is given by $\mathbb{E}[(U^Y)^m]$ for all $m \geq 1$.
The central moments of causal effects correspond to the (central) moments of the random variable $U^Y$.


Higher-order moments of causal effects may provide useful information on the distribution of the causal effects. The central moments of causal effects can be used to compute important and well-known statistics such as the variance $\overline{\mu}^{(2)}$, standard deviation $\sqrt{\overline{\mu}^{(2)}}$, skewness ${\overline{\mu}^{(3)}}/{{\overline{\mu}^{(2)}}^{3/2}}$, and kurtosis ${\overline{\mu}^{(4)}}/{{\overline{\mu}^{(2)}}^{2}}$ of the causal effects.
%The variance and standard deviation of causal effects are derived from the second central moment of the causal effect \citep{Heckman1997,Hernan2024}.
%i.e.,
%\begin{equation}
%$\overline{\mu}_2$,
%\end{equation}
%which appears in \citep{Hernan2024}.
%Standard deviation of causal effect is given by $\sqrt{\overline{\mu}_2}$.
Variance and standard deviation quantify the dispersion of a distribution.
If the variance of causal effects is large, the causal effects may deviate significantly from ACE for some subjects. %, posing a risk of much larger or smaller values.
When the variance of causal effects is small, ICE is close to ACE for most subjects. 
%If the variance of causal effects is 0, it implies that ICE is constant and homogeneous if the causal effects almost surely, where ``almost surely" means with probability 0.
%Then, it is possible to test the homogeneity of causal effects by checking whether $\overline{\mu}_2$ is equal to 0 or not.
%The homogeneity of causal effects is the essential property for applying the results of the averages to each subject \citep{Holland1986,Imbens1994,Swanson2013}, and the homogeneity test of causal effects (risk differences) for binary variables was studied in \citep{Gart1990,Lipsitz1998,Geng2001}.
%The skewness of the causal effect is determined by the combination of the second and third central moments of causal effects.
%, i.e., ${\overline{\mu}_3}/{\overline{\mu}_2^{3/2}}$.
Skewness is a measure of the asymmetry of a probability distribution. %\citep{Joanes1998,Doane2011}.
If the causal effect is positively skewed, the right tail of the distribution of the causal effect is longer.
If the causal effect is negatively skewed, the left tail of the distribution is longer.
Kurtosis is a measure of the tailedness or peakedness of a distribution.  %\citep{Pearson1905,Balanda1988,Joanes1998,Hippel2005}.
%The kurtosis of the causal effect is determined by the second and fourth central moments of the causal effect.
%, i.e., ${\overline{\mu}_4}/{\overline{\mu}_2^{2}}$.
High kurtosis values indicate the presence of outliers in causal effects \citep{Westfall2014}.



%Variance of causal effects is given by the second central moment of causal effect.
%, i.e.,
%\begin{equation}
%$\overline{\mu}^{(2)}$,
%\end{equation}
%which appears in \citep{Hernan2024}.
%Standard deviation of causal effect is given by $\sqrt{\overline{\mu}^{(2)}}$.
%Variance and standard deviation are measures of dispersion.
%If the variance of causal effects is relatively large, there is a significant risk of taking much larger or smaller values than ACE.
%When the variance of causal effects is relatively small, ICE is close to ACE for any subject.
%If the variance of causal effects is 0, it implies that ICE is constant and homogeneous if the causal effects almost surely, where ``almost surely" means with probability 0.
%Then, it is possible to test the homogeneity of causal effects by checking whether $\overline{\mu}^{(2)}$ is equal to 0 or not.
%The homogeneity of causal effects is the essential property for applying the results of the averages to each subject \citep{Holland1986,Imbens1994,Swanson2013}, and the homogeneity test of causal effects (risk differences) for binary variables was studied in \citep{Gart1990,Lipsitz1998,Geng2001}.
%Skewness of causal effect is given by the combination of the second and third central moments of causal effects, i.e., $\frac{\overline{\mu}^{(3)}}{{\overline{\mu}^{(2)}}^{3/2}}$.
%Skewness is a measure of the asymmetry of the probability distribution \citep{Joanes1998,Doane2011}.
%If the causal effect is positively skewed, the right tail of the distribution of causal effects is longer.
%If the causal effect is negatively skewed, the left tail of the distribution of causal effects is longer.
%Kurtosis is a measure of the tailedness or peakedness of the probability distribution \citep{Pearson1905,Balanda1988,Joanes1998,Hippel2005}.
%The kurtosis of the causal effect is given by the second and fourth central moments of the causal effect, i.e., $\frac{\overline{\mu}^{(4)}}{{\overline{\mu}^{(2)}}^{2}}$.
%High kurtosis values indicate the presence of outliers in causal effects \citep{Westfall2014}.


%The implications of higher-order moments of random variables than five have rarely been discussed. However, the higher order of moments of causal effects may also provide useful information on the distribution.


\subsection{Identification of the moments of causal effects}

Under %SCM ${\cal M}$ and 
the exogeneity assumption (Assumption \ref{ASEXO2}), the first moment of causal effects is identifiable as $\mathbb{E}[Y|X=1]-\mathbb{E}[Y|X=0]$ \citep{Holland1986}.
In this section, we discuss the identification  of the higher moments of causal effects. % where $m\geq 2$.

When $m \geq 2$, $\mu^{(m)}$ is not equal to $\mathbb{E}[Y_1^m - Y_0^m]$, as discussed in \citep{Hernan2024, Kuroki2024}. Under Assumption \ref{ASEXO2}, $\mathbb{E}[Y_1^m - Y_0^m]$ is identifiable as $\mathbb{E}[Y^m | X = 1] - \mathbb{E}[Y^m | X = 0]$. However, $\mu^{(m)}$ remains unidentifiable.  
For example, the second moment of the causal effect, $\mu^{(2)}$, is given by $\mathbb{E}[Y_1^2]-2\mathbb{E}[Y_0 Y_1]+\mathbb{E}[Y_0^2]$, where the term $\mathbb{E}[Y_0 Y_1]$ is not identifiable. 

%{\bf Lemmas related to the moment of causal effects.}
To prepare for the identification of the moments of causal effects,
 we first decompose $(Y_1-Y_0)^m$ into two parts as follows:
\begin{lemma}
\label{lem1}
Under SCM ${\cal M}$, %given $m\geq 1$, 
we have
\begin{align}
\label{eq5}
%\begin{aligned}
&(Y_1-Y_0)^m=(Y_1-Y_0)^m\mathbb{I}(Y_1>Y_0)\nonumber\\
&\hspace{3cm}+(-1)^m(Y_0-Y_1)^m\mathbb{I}(Y_0>Y_1)\nonumber\\
&=\int_{{\Omega_Y}^m} \mathbb{I}(Y_0<y_1\leq Y_1,Y_0<y_2\leq Y_1,\dots,\nonumber\\
&\hspace{3.5cm}Y_0<y_m\leq Y_1)dy_1\dots dy_m\nonumber\\
&+(-1)^m\int_{{\Omega_Y}^m} \mathbb{I}(Y_1<y_1\leq Y_0,Y_1<y_2\leq Y_0,\dots,\nonumber\\
&\hspace{3.5cm}Y_1<y_m\leq Y_0)dy_1\dots dy_m.
%\end{aligned}
\end{align}
\end{lemma}

The first part corresponds to subjects with a positive ICE, where $Y_1 - Y_0 > 0$, and the second part corresponds to subjects with a negative ICE, where $Y_1 - Y_0 < 0$.


%We present two examples to illustrate how $(Y_1-Y_0)^m$ is concretely decomposed.

%{\bf Example 1 (continued).} (Homogeneous ICE)
%Revisiting Example 1, the first part is $(Y_1-Y_0)^m\mathbb{I}(Y_1>Y_0)=1$ and the second part is $(-1)^m(Y_1-Y_0)^m\mathbb{I}(Y_0>Y_1)=0$ for any $m \geq 1$.


%{\bf Example 2 (continued).} (Heterogeneous ICE)
%Revisiting Example 2, the first part is $(Y_1-Y_0)^m\mathbb{I}(Y_1>Y_0)=U^Y^m\mathbb{I}(U^Y>0)$ and the second part is $(-1)^m(Y_1-Y_0)^m\mathbb{I}(Y_0>Y_1)=(-1)^m(-U^Y)^m\mathbb{I}(U^Y<0)=U^Y^m\mathbb{I}(U^Y<0)$ for any $m \geq 1$.

We make the following assumption:
\begin{assumption}[Finiteness of integrals]
\label{exi1}
Under SCM ${\cal M}$, for $m\geq 1$, 
$\mu^{(m)}<\infty$ and
$\int_{{\Omega_Y}^m} \mathbb{P}(Y_i<y_1\leq Y_j,Y_i<y_2\leq Y_j,\dots,Y_i<y_m\leq Y_j)dy_1\dots dy_m<\infty$ hold for $(i,j)\in\{(0,1),(1,0)\}$.
\end{assumption}


%\begin{lemma}
%\label{lem2}
Under SCM ${\cal M}$ and Assumption \ref{exi1},  taking the expectation on both sides of  Eq.~\eqref{eq5}, we have
\begin{align}
\label{eq6}
%\begin{aligned}
\mu^{(m)}
&=\int_{{\Omega_Y}^m} \mathbb{P}(Y_0<y_1\leq Y_1,Y_0<y_2\leq Y_1,\dots,\nonumber\\
&\hspace{3cm}Y_0<y_m\leq Y_1)dy_1\dots dy_m\nonumber\\
&+(-1)^m\int_{{\Omega_Y}^m} \mathbb{P}(Y_1<y_1\leq Y_0,Y_1<y_2\leq Y_0,\dots,\nonumber\\
&\hspace{3cm}Y_1<y_m\leq Y_0)dy_1\dots dy_m.
%\end{aligned}
\end{align}
%\end{lemma}
The identification of the moments of causal effects then reduces to the identification of $\mathbb{P}(Y_0<y_1\leq Y_1,Y_0<y_2\leq Y_1,\dots,Y_0<y_m\leq Y_1)$ and $\mathbb{P}(Y_1<y_1\leq Y_0,Y_1<y_2\leq Y_0,\dots,Y_1<y_m\leq Y_0)$. The identification of this type of joint distribution of potential outcomes was discussed in \citep{Kawakami2024}, based on which we obtain the following result: 
%We show the identification theorem under relatively plausible assumptions (Assumptions \ref{ASEXO2},  and \ref{MONO2}).
\begin{theorem}[Identification of the moments of causal effect]
\label{theo1}
Under SCM ${\cal M}$ and Assumptions \ref{ASEXO2},  \ref{MONO2}, and \ref{exi1},  the $m$-th moment of causal effect $Y_1-Y_0$ is identifiable by $\mu^{(m)}=\sigma^{(m)}$, where
\begin{align}
\label{eq10}
%\begin{aligned}
&\sigma^{(m)}=\int_{{\Omega_Y}^m} \max\Big\{\min_{p=1,\dots,m}\{\mathbb{P}(Y<y_p|X=0)\}\nonumber\\
&\hspace{0.2cm}-\max_{p=1,\dots,m}\{\mathbb{P}(Y<y_p|X=1)\},0\Big\}dy_1\dots dy_m\nonumber\\
&+(-1)^m\int_{{\Omega_Y}^m} \max\Big\{\min_{p=1,\dots,m}\{\mathbb{P}(Y<y_p|X=1)\}\nonumber\\
&\hspace{0.2cm}-\max_{p=1,\dots,m}\{\mathbb{P}(Y<y_p|X=0)\},0\Big\}dy_1\dots dy_m.
%\end{aligned}
\end{align}
\end{theorem}
Theorem~\ref{theo1} says that the moments of causal effects can be expressed in terms of  conditional CDFs. 
For $m=1$, Eq.~\eqref{eq10} reduces to ACE$=\mathbb{E}[Y_1-Y_0]=\int_{\Omega_Y}\{\mathbb{P}(Y<y_1|X=0)-\mathbb{P}(Y<y_1|X=1)\}dy_1$   %, which represents the relationship between ACE and the distributional causal effect $\mathbb{P}(Y<y_1|X=0)-\mathbb{P}(Y<y_1|X=1)$, shown in 
\citep{Ju2010}, 
which  does not require Assumption \ref{MONO2} to hold.
%Note that the above relationship does not require Assumption \ref{MONO2}.


For $m=2$, the second moment of causal effects $\mu^{(2)}$ is given by $\int_{\Omega_Y} \int_{\Omega_Y} \max\{\min\{\mathbb{P}(Y<y_1|X=0),\mathbb{P}(Y<y_2|X=0)\}-\max\{\mathbb{P}(Y<y_1|X=1),\mathbb{P}(Y<y_2|X=1)\},0\}dy_1dy_2
+\int_{\Omega_Y} \int_{\Omega_Y} 
 \max\{\min\{\mathbb{P}(Y<y_1|X=1),\mathbb{P}(Y<y_2|X=1)\}-\max\{\mathbb{P}(Y<y_1|X=0),\mathbb{P}(Y<y_2|X=0)\},0\}dy_1dy_2$.


\subsection{Bounding the moments of causal effects}

The monotonicity Assumption \ref{MONO2} may sometimes be considered implausible by researchers.
Therefore, we derive bounds for the moments of causal effects that do not  rely on Assumption \ref{MONO2}.

We first provide bounds of the joint distribution of the potential outcomes $\mathbb{P}(Y_j<y_1\leq Y_i,Y_j<y_2\leq Y_i,\dots,Y_j<y_m\leq Y_i)$ using Fr\'{e}chet inequalities \citep{Frechet1935,Frechet1960}.
\begin{lemma}
\label{lem3}
Under SCM ${\cal M}$ and Assumptions \ref{ASEXO2} and \ref{exi1}, 
we have $l(y_1,\dots,y_m;i,j)\leq \mathbb{P}(Y_j<y_1\leq Y_i,Y_j<y_2\leq Y_i,\dots,Y_j<y_m\leq Y_i) \leq u(y_1,\dots,y_m;i,j)$, 
where 
\begin{align}
&l(y_1,\dots,y_m;i,j)=\max\Big\{\sum_{p=1,\dots,m}\mathbb{P}(Y<y_p|X=j)\nonumber\\
&\hspace{0.5cm}-\sum_{p=1,\dots,m}\mathbb{P}(Y<y_p|X=i)-m+1,0\Big\},\\
&u(y_1,\dots,y_m;i,j)=\min\Big\{\min_{p=1,\dots,m}\{\mathbb{P}(Y<y_p|X=j)\},\nonumber\\
&\hspace{1.5cm}1-\max_{p=1,\dots,m}\{\mathbb{P}(Y<y_p|X=i)\}\Big\}
\end{align}
for $(i,j) \in \{(1,0),(0,1)\}$ and any $y_1, \dots, y_m \in \Omega_Y$.
\end{lemma}


Then, we have the following theorem.
\begin{theorem}[Bounds of the moments of causal effect]
\label{theo2}
Under SCM ${\cal M}$ and Assumptions \ref{ASEXO2} and \ref{exi1},  we have $\sigma_L^{(m)} \leq \mu^{(m)} \leq \sigma_U^{(m)}$, where

(A). When $m$ is an even number,
\begin{align}
\label{eq13}
%\begin{aligned}
&\sigma_L^{(m)}=\int_{{\Omega_Y}^m} l(y_1,\dots,y_m;1,0)dy_1\dots dy_m\nonumber\\
&\hspace{1.5cm}+\int_{{\Omega_Y}^m} l(y_1,\dots,y_m;0,1)dy_1\dots dy_m,\\
&\sigma_U^{(m)}=\int_{{\Omega_Y}^m} u(y_1,\dots,y_m;1,0)dy_1\dots dy_m\nonumber\\
&\hspace{1.5cm}+\int_{{\Omega_Y}^m} u(y_1,\dots,y_m;0,1)dy_1\dots dy_m.
\end{align}

(B). When $m$ is an odd number,
\begin{align}
%\begin{aligned}
&\sigma_L^{(m)}=\int_{{\Omega_Y}^m} l(y_1,\dots,y_m;1,0)dy_1\dots dy_m\nonumber\\
&\hspace{1.5cm}-\int_{{\Omega_Y}^m} u(y_1,\dots,y_m;0,1)dy_1\dots dy_m,\\
\label{eq16}
&\sigma_U^{(m)}=\int_{{\Omega_Y}^m} u(y_1,\dots,y_m;1,0)dy_1\dots dy_m\nonumber\\
&\hspace{1.5cm}-\int_{{\Omega_Y}^m} l(y_1,\dots,y_m;0,1)dy_1\dots dy_m.
\end{align}
\end{theorem}
If $\sigma_U^{(m)}=\infty$ and $\sigma_L^{(m)}=-\infty$, then the bounds are uninformative about $\mu^{(m)}$.





{The upper bound of the Fr\'{e}chet inequalities is always sharp for all $m\geq 1$ \citep{Nelsen2007}; thus, the function $u(y_1,\dots,y_m;i,j)$ in Lemma~\ref{lem3} is sharp for all $m\geq 1$.
In contrast, the lower bound of the Fr\'{e}chet inequalities is not always sharp except when $m=1$; hence, the function $l(y_1,\dots,y_m;i,j)$ in Lemma~\ref{lem3} is not necessarily sharp when $m\geq 2$. 
As a result, only the upper bounds of the moments of causal effects are sharp when $m$ is even.
In all other cases, our bounds of the moments of causal effects are not sharp.}




\textbf{Remark.} We present a similar identification theorem and bounds on the central moments of causal effects in Appendix \ref{appB}.
Additionally, the skewness and kurtosis of causal effects are also bounded, as shown in Appendix \ref{appB}.

