In this appendix, we provide the details of all estimators used in the body of the paper and establish their consistency.


{\bf Details of the estimators in the body of the paper.}
The empirical CDFs and expectations are given by
\begin{gather}
\hat{\mathbb{P}}(Y<y|X=x)=\frac{\sum_{i=1}^N\mathbb{I}(Y_i<y,X_i=x)}{\sum_{i=1}^N\mathbb{I}(X_i=x)},\, \, \, \, \,
\hat{\mathbb{E}}[Y|X=x]=\frac{\sum_{i=1}^NY_i\mathbb{I}(X_i=x)}{\sum_{i=1}^N\mathbb{I}(X_i=x)}
\end{gather}
for any $x \in \Omega_X$ and $y \in \Omega_Y$.
We generate $\{y^1_{k^1}\}_{k^1=1}^{N_1}, \{y^2_{k^2}\}_{k^2=1}^{N_2}, \dots, \{y^m_{k^m}\}_{k^m=1}^{N_m}$ by i.i.d.\ sampling from the uniform distribution $U[a,b]$ with $a=\min(Y)$ and $b=\max(Y)$, and use these samples for Monte Carlo integration.




For $m=1,\dots$, the estimators $\hat{\sigma}^{(m)}$ and $\hat{\bar{\sigma}}^{(m)}$ are 
\begin{align}
&\hat{\sigma}^{(m)}=\frac{(b-a)^m}{N_1\dots N_m}\sum_{k^1=1}^{N_1}\dots\sum_{k^m=1}^{N_m}
\max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<{y^p_{k^p}}|X=0)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<{y^p_{k^p}}|X=1)\},0\Big\}\nonumber\\
&+(-1)^m\frac{(b-a)^m}{N_1\dots N_m}\sum_{k^1=1}^{N_1}\dots\sum_{k^m=1}^{N_m}
\max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<{y^p_{k^p}}|X=1)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<{y^p_{k^p}}|X=0)\},0\Big\},\nonumber\\
&\hat{\bar{\sigma}}^{(m)}=\frac{(b-a)^m}{N_1\dots N_m}\sum_{k^1=1}^{N_1}\dots\sum_{k^m=1}^{N_m}
\max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=0]<{y^p_{k^p}}|X=0)\}\nonumber\\
&\hspace{8cm}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=1]<{y^p_{k^p}}|X=1)\},0\Big\}\nonumber\\
&+(-1)^m\frac{(b-a)^m}{N_1\dots N_m}\sum_{k^1=1}^{N_1}\dots\sum_{k^m=1}^{N_m}
\max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=1]<{y^p_{k^p}}|X=1)\}\nonumber\\
&\hspace{8cm}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=0]<{y^p_{k^p}}|X=0)\},0\Big\}.
\end{align}



For $m=1,\dots$, the estimators $\hat{\sigma}_L^{(m)}$ and $\hat{\sigma}_U^{(m)}$ are given below.


(A). When $m$ is an even number,
\begin{align}
&\hat{\sigma}_L^{(m)}=\frac{(b-a)^m}{N_1\dots N_m}\sum_{k^1=1}^{N_1}\dots\sum_{k^m=1}^{N_m} \Big\{\hat{l}(y^1_{k^1},\dots,y^m_{k^m};1,0)+\hat{l}(y^1_{k^1},\dots,y^m_{k^m};0,1)\Big\},\\
&\hat{\sigma}_U^{(m)}=\frac{(b-a)^m}{N_1\dots N_m}\sum_{k^1=1}^{N_1}\dots\sum_{k^m=1}^{N_m} \Big\{\hat{u}(y^1_{k^1},\dots,y^m_{k^m};1,0)+\hat{u}(y^1_{k^1},\dots,y^m_{k^m};0,1)\Big\},
\end{align}
where 
\begin{align}
&\hat{l}(y_1,\dots,y_m;i,j)=\max\Big\{\sum_{p=1,\dots,m}\hat{\mathbb{P}}(Y<y_p|X=j)-\sum_{p=1,\dots,m}\hat{\mathbb{P}}(Y<y_p|X=i)-m+1,0\Big\},\\
&\hat{u}(y_1,\dots,y_m;i,j)=\min\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=j)\},1-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=i)\}\Big\}.
\end{align}

(B). When $m$ is an odd number,
\begin{align}
&\hat{\sigma}_L^{(m)}=\frac{(b-a)^m}{N_1\dots N_m}\sum_{k^1=1}^{N_1}\dots\sum_{k^m=1}^{N_m} \Big\{\hat{l}(y^1_{k^1},\dots,y^m_{k^m};1,0)-\hat{u}(y^1_{k^1},\dots,y^m_{k^m};0,1)\Big\},\\
&\hat{\sigma}_U^{(m)}=\frac{(b-a)^m}{N_1\dots N_m}\sum_{k^1=1}^{N_1}\dots\sum_{k^m=1}^{N_m} \Big\{\hat{u}(y^1_{k^1},\dots,y^m_{k^m};1,0)-\hat{l}(y^1_{k^1},\dots,y^m_{k^m};0,1)\Big\}.
\end{align}



For $m=1,\dots$, the estimators $\hat{\bar{\sigma}}_L^{(m)}$ and $\hat{\bar{\sigma}}_U^{(m)}$ are given below.


(A). When $m$ is an even number,
\begin{align}
&\hat{\bar{\sigma}}_L^{(m)}=\frac{(b-a)^m}{N_1\dots N_m}\sum_{k^1=1}^{N_1}\dots\sum_{k^m=1}^{N_m} \Big\{\hat{\bar{l}}(y^1_{k^1},\dots,y^m_{k^m};1,0)+\hat{\bar{l}}(y^1_{k^1},\dots,y^m_{k^m};0,1)\Big\},\\
&\hat{\bar{\sigma}}_U^{(m)}=\frac{(b-a)^m}{N_1\dots N_m}\sum_{k^1=1}^{N_1}\dots\sum_{k^m=1}^{N_m} \Big\{\hat{\bar{u}}(y^1_{k^1},\dots,y^m_{k^m};1,0)+\hat{\bar{u}}(y^1_{k^1},\dots,y^m_{k^m};0,1)\Big\},
\end{align}
where 
\begin{align}
&\hat{\bar{l}}(y_1,\dots,y_m;i,j)=\max\Big\{\sum_{p=1,\dots,m}\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=j]<y_p|X=j)\nonumber\\
&\hspace{6cm}-\sum_{p=1,\dots,m}\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=i]<y_p|X=i)-m+1,0\Big\},\\
&\hat{\bar{u}}(y_1,\dots,y_m;i,j)=\min\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=j]<y_p|X=j)\},\nonumber\\
&\hspace{6cm}1-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=i]<y_p|X=i)\}\Big\}.
\end{align}

(B). When $m$ is an odd number,
\begin{align}
&\hat{\bar{\sigma}}_L^{(m)}=\frac{(b-a)^m}{N_1\dots N_m}\sum_{k^1=1}^{N_1}\dots\sum_{k^m=1}^{N_m} \Big\{\hat{\bar{l}}(y^1_{k^1},\dots,y^m_{k^m};1,0)-\hat{\bar{u}}(y^1_{k^1},\dots,y^m_{k^m};0,1)\Big\},\\
&\hat{\bar{\sigma}}_U^{(m)}=\frac{(b-a)^m}{N_1\dots N_m}\sum_{k^1=1}^{N_1}\dots\sum_{k^m=1}^{N_m} \Big\{\hat{\bar{u}}(y^1_{k^1},\dots,y^m_{k^m};1,0)-\hat{\bar{l}}(y^1_{k^1},\dots,y^m_{k^m};0,1)\Big\}.
\end{align}

The estimators $\hat{\sigma}(i,j;k,h)$ and $\hat{\bar{\sigma}}(i,j;k,h)$ are 
\begin{align}
\hat{\sigma}(i,j;k,h)&=\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\max\Big\{\min\{\hat{\mathbb{P}}(Y<y^1_{k^1}|X=j),\hat{\mathbb{P}}(Y<y^2_{k^2}|X=h)\}\nonumber\\
&\hspace{5cm}-\max\{\hat{\mathbb{P}}(Y<y^1_{k^1}|X=i),\hat{\mathbb{P}}(Y<y^2_{k^2}|X=k)\},0\Big\}\nonumber\\
&-\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\max\Big\{\min\{\hat{\mathbb{P}}(Y<y^1_{k^1}|X=i),\hat{\mathbb{P}}(Y<y^2_{k^2}|X=h)\}\nonumber\\
&\hspace{5cm}-\max\{\hat{\mathbb{P}}(Y<y^1_{k^1}|X=j),\hat{\mathbb{P}}(Y<y^2_{k^2}|X=k)\},0\Big\}\nonumber\\
&-\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\max\Big\{\min\{\hat{\mathbb{P}}(Y<y^1_{k^1}|X=j),\hat{\mathbb{P}}(Y<y^2_{k^2}|X=k)\}\nonumber\\
&\hspace{5cm}-\max\{\hat{\mathbb{P}}(Y<y^1_{k^1}|X=i),\hat{\mathbb{P}}(Y<y^2_{k^2}|X=h)\},0\Big\}\nonumber\\
&+\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\max\Big\{\min\{\hat{\mathbb{P}}(Y<y^1_{k^1}|X=i),\hat{\mathbb{P}}(Y<y^2_{k^2}|X=k)\}\nonumber\\
&\hspace{5cm}-\max\{\hat{\mathbb{P}}(Y<y^1_{k^1}|X=j),\hat{\mathbb{P}}(Y<y^2_{k^2}|X=h)\},0\Big\},
\end{align}
\begin{align}
\hat{\bar{\sigma}}(i,j;k,h)
&=\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\max\Big\{\min\{\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=j]<y^1_{k^1}|X=j),\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=h]<y^2_{k^2}|X=h)\}\nonumber\\
&\hspace{3cm}-\max\{\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=i]<y^1_{k^1}|X=i),\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=k]<y^2_{k^2}|X=k)\},0\Big\}\nonumber\\
&-\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\max\Big\{\min\{\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=i]<y^1_{k^1}|X=i),\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=h]<y^2_{k^2}|X=h)\}\nonumber\\
&\hspace{3cm}-\max\{\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=j]<y^1_{k^1}|X=j),\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=k]<y^2_{k^2}|X=k)\},0\Big\}\nonumber\\
&-\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\max\Big\{\min\{\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=j]<y^1_{k^1}|X=j),\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=k]<y^2_{k^2}|X=k)\}\nonumber\\
&\hspace{3cm}-\max\{\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=i]<y^1_{k^1}|X=i),\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=h]<y^2_{k^2}|X=h)\},0\Big\}\nonumber\\
&+\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\max\Big\{\min\{\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=i]<y^1_{k^1}|X=i),\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=k]<y^2_{k^2}|X=k)\}\nonumber\\
&\hspace{3cm}-\max\{\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=j]<y^1_{k^1}|X=j),\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=h]<y^2_{k^2}|X=h)\},0\Big\}.
\end{align}





The estimators $\hat{\sigma}_L(i,j;k,h)$ and $\hat{\sigma}_U(i,j;k,h)$ are 
\begin{align}
\hat{\sigma}_L(i,j;k,h)
&=\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\hat{l}(y^1_{k^1},y^2_{k^2};i,j,k,h)-\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\hat{u}(y^1_{k^1},y^2_{k^2};j,i,k,h)\nonumber\\
&\hspace{1cm}-\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\hat{u}(y^1_{k^1},y^2_{k^2};i,j,h,k)+\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\hat{l}(y^1_{k^1},y^2_{k^2};j,i,h,k),\\
\hat{\sigma}_U(i,j;k,h)
&=\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\hat{u}(y^1_{k^1},y^2_{k^2};i,j,k,h)-\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\hat{l}(y^1_{k^1},y^2_{k^2};j,i,k,h)\nonumber\\
&\hspace{1cm}-\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\hat{l}(y^1_{k^1},y^2_{k^2};i,j,h,k)+\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\hat{u}(y^1_{k^1},y^2_{k^2};j,i,h,k),
\end{align}
where
\begin{align}
&\hat{l}(y_1,y_2;i,j,k,h)\nonumber\\
&=\max\Big\{\hat{\mathbb{P}}(Y<y_1|X=j)-\hat{\mathbb{P}}(Y <y_1|X=i)+\hat{\mathbb{P}}(Y<y_2|X=h)-\hat{\mathbb{P}}(Y<y_2|X=k)-1,0\Big\},\\
&\hat{u}(y_1,y_2;i,j,k,h)\nonumber\\
&=\min\Big\{\min\{\hat{\mathbb{P}}(Y<y_1|X=j),\hat{\mathbb{P}}(Y<y_2|X=h)\},1-\max\{\hat{\mathbb{P}}(Y<y_1|X=i),\hat{\mathbb{P}}(Y<y_2|X=k)\}\Big\}.
\end{align}



The estimators $\hat{\bar{\sigma}}_L(i,j;k,h)$ and $\hat{\bar{\sigma}}_U(i,j;k,h)$ are 
\begin{align}
\hat{\bar{\sigma}}_L(i,j;k,h)
&=\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\hat{\bar{l}}(y^1_{k^1},y^2_{k^2};i,j,k,h)-\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\hat{\bar{u}}(y^1_{k^1},y^2_{k^2};j,i,k,h)\nonumber\\
&\hspace{1cm}-\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\hat{\bar{u}}(y^1_{k^1},y^2_{k^2};i,j,h,k)+\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\hat{\bar{l}}(y^1_{k^1},y^2_{k^2};j,i,h,k),\\
\hat{\bar{\sigma}}_U(i,j;k,h)
&=\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\hat{\bar{u}}(y^1_{k^1},y^2_{k^2};i,j,k,h)-\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\hat{\bar{l}}(y^1_{k^1},y^2_{k^2};j,i,k,h)\nonumber\\
&\hspace{1cm}-\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\hat{\bar{l}}(y^1_{k^1},y^2_{k^2};i,j,h,k)+\frac{(b-a)^2}{N_1N_2}\sum_{k^1=1}^{N_1}\sum_{k^2=1}^{N_2}\hat{\bar{u}}(y^1_{k^1},y^2_{k^2};j,i,h,k),
\end{align}
where
\begin{align}
\hat{\bar{l}}(y_1,y_2;i,j,k,h)
&=\max\Big\{\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=j]<y_1|X=j)-\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=i]<y_1|X=i)\nonumber\\
&\hspace{1cm}+\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=h]<y_2|X=h)-\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=k]<y_2|X=k)-1,0\Big\},\\
\hat{\bar{u}}(y_1,y_2;i,j,k,h)
&=\min\Big\{\min\{\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=j]<y_1|X=j),\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=h]<y_2|X=h)\},\nonumber\\
&\hspace{1cm}1-\max\{\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=i]<y_1|X=i),\hat{\mathbb{P}}(Y-\hat{\mathbb{E}}[Y|X=k]<y_2|X=k)\}\Big\}.
\end{align}

{\bf Consistency of the estimators for the moments of causal effects.}
First, the estimation errors of the empirical CDFs and expectations are $\displaystyle O_p\left(1/\sqrt{N}\right)$ for any $x \in \Omega_X$ and $y \in \Omega_Y$.
From the delta method \citep{Doob1935,Fang2018},
both $\max\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=0)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=1)\},0\}$ and $\max\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=1)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=0)\},0\}$ follow $ O_p\left(1/\sqrt{N^m}\right)$, {almost surely} w.r.t. $\Omega_Y^m$.
For any $m=1,\dots$, we have
\begin{align}
&\Big|\hat{\sigma}^{(m)}-\sigma^{(m)}\Big|\nonumber\\
&=\Bigg|\Bigg\{\frac{(b-a)^m}{N_1\dots N_m}\sum_{k^1=1}^{N_1}\dots\sum_{k^m=1}^{N_m}
\max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<{y^p_{k^p}}|X=0)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<{y^p_{k^p}}|X=1)\},0\Big\}\nonumber\\
&+(-1)^m\frac{(b-a)^m}{N_1\dots N_m}\sum_{k^1=1}^{N_1}\dots\sum_{k^m=1}^{N_m}
\max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<{y^p_{k^p}}|X=1)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<{y^p_{k^p}}|X=0)\},0\Big\}\Bigg\}\nonumber\\
&-\Bigg\{\sigma^{(m)}=\int_{{\Omega_Y}^m} \max\Big\{\min_{p=1,\dots,m}\{\mathbb{P}(Y<y_p|X=0)\}-\max_{p=1,\dots,m}\{\mathbb{P}(Y<y_p|X=1)\},0\Big\}dy_1\dots dy_m\nonumber\\
&\hspace{1cm}+(-1)^m\int_{{\Omega_Y}^m} \max\Big\{\min_{p=1,\dots,m}\{\mathbb{P}(Y<y_p|X=1)\}-\max_{p=1,\dots,m}\{\mathbb{P}(Y<y_p|X=0)\},0\Big\}dy_1\dots dy_m\Bigg\}\Bigg|\nonumber\\
&=\Bigg|\Bigg\{\frac{(b-a)^m}{N_1\dots N_m}\sum_{k^1=1}^{N_1}\dots\sum_{k^m=1}^{N_m}
\max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<{y^p_{k^p}}|X=0)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<{y^p_{k^p}}|X=1)\},0\Big\}\nonumber\\
&+(-1)^m\frac{(b-a)^m}{N_1\dots N_m}\sum_{k^1=1}^{N_1}\dots\sum_{k^m=1}^{N_m}
\max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<{y^p_{k^p}}|X=1)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<{y^p_{k^p}}|X=0)\},0\Big\}\Bigg\}\nonumber\\
&-\Bigg\{\int_{{\Omega_Y}^m} \max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=0)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=1)\},0\Big\}dy_1\dots dy_m\nonumber\\
&\hspace{1cm}+(-1)^m\int_{{\Omega_Y}^m} \max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=1)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=0)\},0\Big\}dy_1\dots dy_m\Bigg\}\nonumber\\
&+\Bigg\{\int_{{\Omega_Y}^m} \max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=0)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=1)\},0\Big\}dy_1\dots dy_m\nonumber\\
&\hspace{1cm}+(-1)^m\int_{{\Omega_Y}^m} \max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=1)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=0)\},0\Big\}dy_1\dots dy_m\Bigg\}\nonumber\\
&-\Bigg\{\int_{{\Omega_Y}^m} \max\Big\{\min_{p=1,\dots,m}\{\mathbb{P}(Y<y_p|X=0)\}-\max_{p=1,\dots,m}\{\mathbb{P}(Y<y_p|X=1)\},0\Big\}dy_1\dots dy_m\nonumber\\
&\hspace{1cm}+(-1)^m\int_{{\Omega_Y}^m} \max\Big\{\min_{p=1,\dots,m}\{\mathbb{P}(Y<y_p|X=1)\}-\max_{p=1,\dots,m}\{\mathbb{P}(Y<y_p|X=0)\},0\Big\}dy_1\dots dy_m\Bigg\}\Bigg|\nonumber\\
&\leq\Bigg|\Bigg\{\frac{(b-a)^m}{N_1\dots N_m}\sum_{k^1=1}^{N_1}\dots\sum_{k^m=1}^{N_m}
\max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<{y^p_{k^p}}|X=0)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<{y^p_{k^p}}|X=1)\},0\Big\}\nonumber\\
&+(-1)^m\frac{(b-a)^m}{N_1\dots N_m}\sum_{k^1=1}^{N_1}\dots\sum_{k^m=1}^{N_m}
\max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<{y^p_{k^p}}|X=1)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<{y^p_{k^p}}|X=0)\},0\Big\}\Bigg\}\nonumber\\
&-\Bigg\{\int_{{\Omega_Y}^m} \max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=0)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=1)\},0\Big\}dy_1\dots dy_m\nonumber\\
&\hspace{1cm}+(-1)^m\int_{{\Omega_Y}^m} \max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=1)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=0)\},0\Big\}dy_1\dots dy_m\Bigg\}\Bigg|\nonumber\\
&+\Bigg|\Bigg\{\int_{{\Omega_Y}^m} \max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=0)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=1)\},0\Big\}dy_1\dots dy_m\nonumber\\
&\hspace{1cm}+(-1)^m\int_{{\Omega_Y}^m} \max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=1)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=0)\},0\Big\}dy_1\dots dy_m\Bigg\}\nonumber\\
&-\Bigg\{\int_{{\Omega_Y}^m} \max\Big\{\min_{p=1,\dots,m}\{\mathbb{P}(Y<y_p|X=0)\}-\max_{p=1,\dots,m}\{\mathbb{P}(Y<y_p|X=1)\},0\Big\}dy_1\dots dy_m\nonumber\\
&\hspace{1cm}+(-1)^m\int_{{\Omega_Y}^m} \max\Big\{\min_{p=1,\dots,m}\{\mathbb{P}(Y<y_p|X=1)\}-\max_{p=1,\dots,m}\{\mathbb{P}(Y<y_p|X=0)\},0\Big\}dy_1\dots dy_m\Bigg\}\Bigg|\nonumber\\
&=\Bigg|\Bigg\{\frac{(b-a)^m}{N_1\dots N_m}\sum_{k^1=1}^{N_1}\dots\sum_{k^m=1}^{N_m}
\max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<{y^p_{k^p}}|X=0)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<{y^p_{k^p}}|X=1)\},0\Big\}\nonumber\\
&+(-1)^m\frac{(b-a)^m}{N_1\dots N_m}\sum_{k^1=1}^{N_1}\dots\sum_{k^m=1}^{N_m}
\max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<{y^p_{k^p}}|X=1)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<{y^p_{k^p}}|X=0)\},0\Big\}\Bigg\}\nonumber\\
&-\Bigg\{\int_{{\Omega_Y}^m} \max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=0)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=1)\},0\Big\}dy_1\dots dy_m\nonumber\\
&\hspace{1cm}+(-1)^m\int_{{\Omega_Y}^m} \max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=1)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=0)\},0\Big\}dy_1\dots dy_m\Bigg\}\Bigg|\nonumber\\
&+\Bigg|\int_{{\Omega_Y}^m}\Bigg\{\max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=0)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=1)\},0\Big\}\nonumber\\
&\hspace{4cm}+(-1)^m\max\Big\{\min_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=1)\}-\max_{p=1,\dots,m}\{\hat{\mathbb{P}}(Y<y_p|X=0)\},0\Big\}\nonumber\\
&-\max\Big\{\min_{p=1,\dots,m}\{\mathbb{P}(Y<y_p|X=0)\}-\max_{p=1,\dots,m}\{\mathbb{P}(Y<y_p|X=1)\},0\Big\}\nonumber\\
&\hspace{2cm}-(-1)^m\max\Big\{\min_{p=1,\dots,m}\{\mathbb{P}(Y<y_p|X=1)\}-\max_{p=1,\dots,m}\{\mathbb{P}(Y<y_p|X=0)\},0\Big\}\Bigg\}dy_1\dots dy_m\Bigg|\nonumber\\
&= O_p\left(\sum_{i=1}^m\frac{1}{\sqrt{N_i}}\right)+ O_p\left(\frac{1}{\sqrt{N^m}}\right).
\end{align}
Then, under SCM ${\cal M}$ and Assumptions~\ref{ASEXO2}, \ref{MONO2}, and \ref{exi1}, the estimation error of $\hat{\sigma}^{(m)}$ is $\displaystyle O_p\left(1/\sqrt{N^m}+\sum\nolimits_{i=1}^m1/\sqrt{N_i}\right)$.
Similarly, under SCM ${\cal M}$ and Assumptions~\ref{ASEXO2}, \ref{MONO2}, and \ref{exi1}, the estimation errors of $\hat{\sigma}_L^{(m)}$ and $\hat{\sigma}_U^{(m)}$ are $\displaystyle O_p\left(1/\sqrt{N^m}+\sum\nolimits_{i=1}^m1/\sqrt{N_i}\right)$.
Under SCM ${\cal M}$ and Assumptions~\ref{ASEXO2}, \ref{MONO2}, and \ref{exi2}, the estimation errors of $\hat{\sigma}(i,j;k,h)$, $\hat{\sigma}_L(i,j;k,h)$, and $\hat{\sigma}_U(i,j;k,h)$ are $\displaystyle O_p\left(1/\sqrt{N^2}+\sum\nolimits_{p=1}^21/\sqrt{N_p}\right)$.
We can make $N_1,\dots,N_m$ as large as computational resources allow.
Letting $N_1,\dots,N_m \rightarrow \infty$, the estimation errors of $\hat{\sigma}^{(m)}$, $\hat{\sigma}_L^{(m)}$, and $\hat{\sigma}_U^{(m)}$ are $\displaystyle O_p\left(1/\sqrt{N^m}\right)$, and those of $\hat{\sigma}(i,j;k,h)$, $\hat{\sigma}_L(i,j;k,h)$, and $\hat{\sigma}_U(i,j;k,h)$ are $\displaystyle O_p\left(1/\sqrt{N^2}\right)$.

{\bf Consistency of the estimators for the central moments of causal effects.}
First, the estimation errors of the empirical CDFs and expectations are $\displaystyle O_p\left(1/\sqrt{N}\right)$ for any $x \in \Omega_X$ and $y \in \Omega_Y$.
For the central moment, we make an additional assumption.
\begin{assumption}
\label{Lip}
$\mathbb{P}(Y<y|X=x)$ is differentiable in $y$ for any $x \in \Omega_X$, almost surely w.r.t. $\Omega_Y$.
\end{assumption}
Then, under SCM ${\cal M}$ and Assumptions~\ref{ASEXO2}, \ref{MONO2}, \ref{exi3}, and \ref{Lip},
the estimation errors of $\hat{\bar{\sigma}}^{(m)}$, $\hat{\bar{\sigma}}_L^{(m)}$, and $\hat{\bar{\sigma}}_U^{(m)}$ are $\displaystyle O_p\left(1/\sqrt{N^{2m}}+\sum\nolimits_{i=1}^m1/\sqrt{N_i}\right)$.
Under SCM ${\cal M}$ and Assumptions~\ref{ASEXO2}, \ref{MONO2}, \ref{exi4}, and \ref{Lip},
the estimation errors of $\hat{\bar{\sigma}}(i,j;k,h)$, $\hat{\bar{\sigma}}_L(i,j;k,h)$, and $\hat{\bar{\sigma}}_U(i,j;k,h)$ are $\displaystyle O_p\left(1/\sqrt{N^4}+\sum\nolimits_{p=1}^21/\sqrt{N_p}\right)$.
Letting $N_1,\dots,N_m \rightarrow \infty$,
the estimation errors of $\hat{\bar{\sigma}}^{(m)}$, $\hat{\bar{\sigma}}_L^{(m)}$, and $\hat{\bar{\sigma}}_U^{(m)}$ are $\displaystyle O_p\left(1/\sqrt{N^{2m}}\right)$, and those of $\hat{\bar{\sigma}}(i,j;k,h)$, $\hat{\bar{\sigma}}_L(i,j;k,h)$, and $\hat{\bar{\sigma}}_U(i,j;k,h)$ are $\displaystyle O_p\left(1/\sqrt{N^4}\right)$.

Thus, all estimators for the moments and central moments of causal effects are consistent.



