

In this section, we study the (central) product moments of causal effects to address (\textbf{Question 2}).




%Researchers frequently compare multiple potential outcomes, including cases with more than three, as discussed in \citep{Bartholomew1959, Page1963, Imbens2000, Imai2004}. We consider the comparison of the $R$ potential outcomes $\{Y_1,Y_2,\dots,Y_R\}$ with $\Omega_X=\{1,\dots,R\}$.
Let $\Omega_X=\{1,\dots,R\}$. 
The causal effect of changing $X=j$ to $X=i$ is given by $Y_i-Y_j$, and the causal effect of changing $X=h$ to $X=k$ is given by $Y_k-Y_h$.
We study the %relationship and 
association between the two causal effects $Y_i-Y_j$ and $Y_k-Y_h$.



\subsection{Definition of the product moment of causal effects}

We define the product moment of two causal effects analogously to the product moment of two random variables.
\begin{definition}[The product moment of causal effects]
The product moment of causal effects is defined by %\jin{I suggest changing the notation to $\rho_{i,j;k,h}$}
\begin{equation}
\rho_{i,j;k,h}\defeq\mathbb{E}\Big[(Y_i-Y_j)(Y_k-Y_h)\Big].
\end{equation}
\end{definition}


We present three examples to illustrate the product moments of causal effects %are specifically measured 
in simple SCMs.


{\bf Example 1 (continued).} (Homogeneous ICE)
%Revisiting Example 1, 
In the SCM given by $Y=X+U^Y$, where $\mathbb{E}[U^Y]=0$, 
the product moment of $Y_1-Y_0$ and $Y_0-Y_{-1}$ is equal to $1$.

{\bf Example 2 (continued).} (Heterogeneous ICE)
%Revisiting Example 2, 
In the SCM $Y=X(U^Y+1)+1$, where $\mathbb{E}[U^Y]=0$, 
the product moment of $Y_1-Y_0$ and $Y_0-Y_{-1}$ is equal to $\mathbb{E}[(U^Y+1)^2]>0$.


{\bf Example 3.} (Heterogeneous and nonlinear ICE)
We consider a nonlinear SCM with an interaction term between $X^2$ and $U^Y$: $Y=X^2(U^Y+1)+1$, where $\mathbb{E}[U^Y]=0$. We have $Y_1-Y_0=U^Y+1$ and $Y_0-Y_{-1}=-(U^Y+1)$, so both causal effects are heterogeneous.
The product moment of $Y_1-Y_0$ and $Y_0-Y_{-1}$ is equal to $\mathbb{E}[-(U^Y+1)^2]<0$.




%\yuta{The product moment of causal effects for $Y_i-Y_j$ and $Y_h-Y_k$ reveals the association between the two causal effects.
%When $\mathbb{E}[(Y_i-Y_j)(Y_k-Y_h)]$ is positive, subjects with larger $Y_i-Y_j$ tend to have larger $ Y_h-Y_k$.
%When $\mathbb{E}[(Y_i-Y_j)(Y_k-Y_h)]$ is negative, subjects with larger $Y_i-Y_j$ tend to have smaller $ Y_h-Y_k$.}

%\yuta{The product moments provide insights into the patterns of the signs of causal effects.
%The signs of $Y_i-Y_j$ and $Y_h-Y_k$ follow four possible patterns:
%\begin{enumerate}
%    \item $Y_i-Y_j>0$ and $Y_h-Y_k>0$.
%    \item $Y_i-Y_j>0$ and $Y_h-Y_k\leq 0$.
%    \item $Y_i-Y_j\leq 0$ and $Y_h-Y_k>0$.
%    \item $Y_i-Y_j\leq 0$ and $Y_h-Y_k\leq 0$.
%\end{enumerate}
%When the product moment of $Y_i-Y_j$ and $Y_h-Y_k$ is positive, }

%\subsection{The central product moment of causal effects}


%We assess the covariance and correlation of causal effects to examine the relationship between the two causal effects. We define the covariance, which represents the central product moment, and the correlation as follows:
We examine the covariance and correlation of two causal effects. 
\begin{definition}[Covariance of causal effects]
We define the covariance (central product moment of causal effects) as 
\begin{equation}
\begin{aligned}
\overline{\rho}_{i,j;k,h}\defeq&\mathbb{E}\Big[\Big\{(Y_i-Y_j)-(\mathbb{E}[Y_i]-\mathbb{E}[Y_j])\Big\}\\
&\hspace{0.5cm}\times\Big\{(Y_k-Y_h)-(\mathbb{E}[Y_k]-\mathbb{E}[Y_h])\Big\}\Big].
\end{aligned}
\end{equation}
\end{definition}
\begin{definition}[Correlation of causal effects]
We define the correlation of causal effects as 
\begin{equation}
\begin{aligned}
&\overline{\tau}_{i,j;k,h}\defeq\overline{\rho}_{i,j;k,h} \\%\mathbb{E}\Big[\Big\{(Y_i-Y_j)-(\mathbb{E}[Y_i]-\mathbb{E}[Y_j])\Big\}\\
%&\hspace{1cm}\times\Big\{(Y_k-Y_h)-(\mathbb{E}[Y_k]-\mathbb{E}[Y_h])\Big\}\Big]\\
&\hspace{0cm}\Bigg/\bigg\{\sqrt{\mathbb{E}\Big[\Big\{(Y_i-Y_j)-(\mathbb{E}[Y_i]-\mathbb{E}[Y_j])\Big\}^2\Big]}\\
&\hspace{0.5cm}\times\sqrt{\mathbb{E}\Big[\Big\{(Y_k-Y_h)-(\mathbb{E}[Y_k]-\mathbb{E}[Y_h])\Big\}^2\Big]}
\bigg\}.
\end{aligned}
\end{equation}
\end{definition}
Correlation is a measure of association between two variables \citep{Pearson1905}. Similarly, the correlation of causal effects quantifies the association between two causal effects.

%If the causal effects $Y_i-Y_j$ and $Y_h-Y_k$ are positively correlated, individuals with larger $Y_i-Y_j$ than the average tend to have larger $Y_h-Y_k$ than the average. If the causal effects $Y_i-Y_j$ and $Y_h-Y_k$ are negatively correlated, individuals with larger $Y_i-Y_j$ than the average  tend to have smaller $Y_h-Y_k$ than the average. If the causal effects $Y_i-Y_j$ and $Y_h-Y_k$ are uncorrelated, there is no linear relationship between $Y_h-Y_k$ and $Y_i-Y_j$.

For instance, 
when comparing three treatments $X = 0,1,2$, researchers often evaluate their respective averages $\mathbb{E}[Y_0], \mathbb{E}[Y_1],$ and $\mathbb{E}[Y_2]$.
When $\mathbb{E}[Y_1 - Y_0] > 0$ and $\mathbb{E}[Y_2 - Y_1] > 0$, it is concluded that, on average, both changes, from $X = 0$ to $X = 1$ and from $X = 1$ to $X = 2$, have positive effects.
The correlation of causal effects provides more detailed insights.
When the correlation between $Y_1 - Y_0$ and $Y_2 - Y_1$ is negative, patients with larger causal effects $Y_1 - Y_0$ than the average tend to have smaller causal effects $Y_2 - Y_1$ than the average.
Conversely, when patients have smaller causal effects $Y_1 - Y_0$ than the average, they tend to have larger causal effects $Y_2 - Y_1$ than the average.

We present three examples to illustrate  the covariance and correlation of causal effects. % specifically measure relationships in simple SCMs.


{\bf Example 1 (continued).} (Homogeneous ICE)
%Revisiting Example 1, 
In the SCM given by $Y=X+U^Y$, where $\mathbb{E}[U^Y]=0$, 
the covariance of $Y_1-Y_0$ and $Y_0-Y_{-1}$ is equal to $0$.
%This implies that $Y_1-Y_0$ and $Y_0-Y_{-1}$ do not have a positive or negative correlation.

{\bf Example 2 (continued).} (Heterogeneous ICE)
%Revisiting Example 2, 
In the SCM $Y=X(U^Y+1)+1$, where $\mathbb{E}[U^Y]=0$, 
the covariance of $Y_1-Y_0$ and $Y_0-Y_{-1}$ is equal to $\mathbb{E}[(U^Y)^2]>0$ 
and their correlation is $1$; that is, the two causal effects are positively correlated.

{\bf Example 3 (continued).} (Heterogeneous and nonlinear ICE)
%Revisiting Example 3, 
In the SCM $Y=X^2(U^Y+1)+1$, where $\mathbb{E}[U^Y]=0$, the covariance of $Y_1-Y_0$ and $Y_0-Y_{-1}$ is equal to $\mathbb{E}[-(U^Y)^2]<0$ 
and their correlation is $-1$; that is, the two causal effects are negatively correlated.




\subsection{Identification of the product moment of causal effects}



%{\bf Lemmas related to the moment of causal effects.}
To prepare the discussion on the identification  of the product moment of causal effects, we decompose the product of causal effects $(Y_i-Y_j)$ and $(Y_k-Y_h)$ into four parts.
\begin{lemma}
\label{lem4}
Under SCM ${\cal M}$, %for any $i,j,k,h \in \{1,\dots,R\}$, 
we have
\begin{align}
\label{eq20}
%\begin{aligned}
&(Y_i-Y_j)(Y_k-Y_h)\nonumber\\
&=(Y_i-Y_j)(Y_k-Y_h)\mathbb{I}(Y_i>Y_j,Y_k>Y_h)\nonumber\\
&-(Y_j-Y_i)(Y_k-Y_h)\mathbb{I}(Y_j>Y_i,Y_k>Y_h)\nonumber\\
&-(Y_i-Y_j)(Y_h-Y_k)\mathbb{I}(Y_i>Y_j,Y_h>Y_k)\nonumber\\
&+(Y_j-Y_i)(Y_h-Y_k)\mathbb{I}(Y_j>Y_i,Y_h>Y_k)\nonumber\\
&=\int_{\Omega_Y}\int_{\Omega_Y} \mathbb{I}(Y_j<y_1\leq Y_i,Y_h<y_2\leq Y_k)dy_1 dy_2\nonumber\\
&-\int_{\Omega_Y}\int_{\Omega_Y} \mathbb{I}(Y_i<y_1\leq Y_j,Y_h<y_2\leq Y_k)dy_1 dy_2\nonumber\\
&-\int_{\Omega_Y}\int_{\Omega_Y} \mathbb{I}(Y_j<y_1\leq Y_i,Y_k<y_2\leq Y_h)dy_1 dy_2\nonumber\\
&+\int_{\Omega_Y}\int_{\Omega_Y} \mathbb{I}(Y_i<y_1\leq Y_j,Y_k<y_2\leq Y_h)dy_1 dy_2.
%\end{aligned}
\end{align}
\end{lemma}
%The first part is for subjects who have positive ICE $Y_i-Y_j>0$ and positive ICE $Y_k-Y_h>0$, the second part is for subjects who have negative ICE $Y_i-Y_j<0$ and positive ICE $Y_k-Y_h>0$, the third part is for subjects who have positive ICE $Y_i-Y_j>0$ and negative ICE $Y_k-Y_h<0$, and the fourth part is for subjects who have negative ICE $Y_i-Y_j<0$ and negative ICE $Y_k-Y_h<0$.
The above decomposition consists of four parts based on the signs of ICE. 
%\begin{enumerate}
%    \item Subjects with positive  $Y_i - Y_j > 0$  and positive  $Y_k - Y_h > 0$.
%    \item Subjects with negative  $Y_i - Y_j < 0$  and positive  $Y_k - Y_h > 0$.
%    \item Subjects with positive  $Y_i - Y_j > 0$  and negative  $Y_k - Y_h <0$.
%    \item Subjects with negative  $Y_i - Y_j < 0$  and negative  $Y_k - Y_h < 0$.
%\end{enumerate}
%We present three examples to illustrate how the product of causal effects is concretely decomposed.
%{\bf Example 1.} (Homogeneous ICE)
%Revisiting Example 1, considering $(Y_1-Y_0)(Y_0-Y_{-1})$, the first part is $1$, the second part is $0$, the third part is $0$, and the fourth part is $0$, respectively.
%{\bf Example 2.} (Heterogeneous ICE)
%Revisiting Example 2, considering $(Y_1-Y_0)(Y_0-Y_{-1})$, the first part is $(U^Y+1)^2\mathbb{I}(U^Y+1>0)$, the second part is $0$, the third part is $0$, and the fourth part is $(U^Y+1)^2\mathbb{I}(0>U^Y+1)$, respectively.
%{\bf Example 3.} (Heterogeneous and nonlinear ICE)
%Revisiting Example 3, considering $(Y_1-Y_0)(Y_0-Y_{-1})$, the first part is $-(U^Y+1)^2\mathbb{I}(U^Y+1>0)$, the second part is $0$, the third part is $0$, and the fourth part is $-(U^Y+1)^2\mathbb{I}(0>U^Y+1)$, respectively.
We make the following assumption:
\begin{assumption}[Finiteness of integrals]
\label{exi2}
Under SCM ${\cal M}$,
$|\rho_{i,j;k,h}|<\infty$ and 
$\int_{\Omega_Y}\int_{\Omega_Y} \mathbb{P}(Y_j<y_1\leq Y_i,Y_h<y_2\leq Y_k)dy_1 dy_2<\infty$ hold for any $i,j,k,h \in \{1,\dots,R\}$.
%$\int_{\Omega_Y}\int_{\Omega_Y} \mathbb{P}(Y_i<y_1\leq Y_j,Y_h<y_2\leq Y_k)dy_1 dy_2<\infty$,
%$\int_{\Omega_Y}\int_{\Omega_Y} \mathbb{P}(Y_j<y_1\leq Y_i,Y_k<y_2\leq Y_h)dy_1 dy_2<\infty$, and $\int_{\Omega_Y}\int_{\Omega_Y} \mathbb{P}(Y_i<y_1\leq Y_j,Y_k<y_2\leq Y_h)dy_1 dy_2<\infty$ hold.
\end{assumption}

%\begin{lemma}
%\label{lem5}
Under SCM ${\cal M}$ and Assumption \ref{exi2}, %for any $i,j,k,h \in \{1,\dots,R\}$, 
taking the expectation on both sides of  Eq.~\eqref{eq20}, we have
\begin{align}
\label{eq21}
%\begin{aligned}
&\rho_{i,j;k,h}\nonumber\\
&=\int_{\Omega_Y}\int_{\Omega_Y} \mathbb{P}(Y_j<y_1\leq Y_i,Y_h<y_2\leq Y_k)dy_1 dy_2\nonumber\\
&-\int_{\Omega_Y}\int_{\Omega_Y} \mathbb{P}(Y_i<y_1\leq Y_j,Y_h<y_2\leq Y_k)dy_1 dy_2\nonumber\\
&-\int_{\Omega_Y}\int_{\Omega_Y} \mathbb{P}(Y_j<y_1\leq Y_i,Y_k<y_2\leq Y_h)dy_1 dy_2\nonumber\\
&+\int_{\Omega_Y}\int_{\Omega_Y} \mathbb{P}(Y_i<y_1\leq Y_j,Y_k<y_2\leq Y_h)dy_1 dy_2.
%\end{aligned}
\end{align}
%\end{lemma}


%The identification of the product moment of causal effects then reduces to the identification problem of the joint distribution of the potential outcomes $\mathbb{P}(Y_j<y_1\leq Y_i,Y_h<y_2\leq Y_k)$, $\mathbb{P}(Y_i<y_1\leq Y_j,Y_h<y_2\leq Y_k)$, $\mathbb{P}(Y_j<y_1\leq Y_i,Y_k<y_2\leq Y_h)$, and $\mathbb{P}(Y_i<y_1\leq Y_j,Y_k<y_2\leq Y_h)$, which were discussed in \citep{Kawakami2024}.
The identification of joint distributions of  potential outcomes in the form of  $\mathbb{P}(Y_j<y_1\leq Y_i,Y_h<y_2\leq Y_k)$ was discussed in \citep{Kawakami2024}, based on which we obtain the following result:
%We show the identification theorem using relatively plausible assumptions (Assumptions \ref{ASEXO2},  \ref{homo}, and \ref{MONO2}). 
\begin{theorem}[Identification of the product moments of causal effects]
\label{theo3}
Under SCM ${\cal M}$ and Assumptions \ref{ASEXO2}, \ref{MONO2}, and \ref{exi2}, %for any $i,j,k,h \in \{1,\dots,R\}$, 
the product moment of $(Y_i-Y_j)$ and $(Y_k-Y_h)$ is identifiable by $\rho_{i,j;k,h}=\sigma(i,j;k,h)$, where
\begin{align}
\label{eq22}
%\begin{aligned}
&\sigma(i,j;k,h)\nonumber\\
&=\int_{{\Omega_Y}^2}\max\Big\{\min\{\mathbb{P}(Y<y_1|X=j),\mathbb{P}(Y<y_2|X=h)\}\nonumber\\
&\hspace{0.2cm}-\max\{\mathbb{P}(Y<y_1|X=i),\mathbb{P}(Y<y_2|X=k)\},0\Big\}dy_1dy_2\nonumber\\
&-\int_{{\Omega_Y}^2}\max\Big\{\min\{\mathbb{P}(Y<y_1|X=i),\mathbb{P}(Y<y_2|X=h)\}\nonumber\\
&\hspace{0.2cm}-\max\{\mathbb{P}(Y<y_1|X=j),\mathbb{P}(Y<y_2|X=k)\},0\Big\}dy_1dy_2\nonumber\\
&-\int_{{\Omega_Y}^2}\max\Big\{\min\{\mathbb{P}(Y<y_1|X=j),\mathbb{P}(Y<y_2|X=k)\}\nonumber\\
&\hspace{0.2cm}-\max\{\mathbb{P}(Y<y_1|X=i),\mathbb{P}(Y<y_2|X=h)\},0\Big\}dy_1dy_2\nonumber\\
&+\int_{{\Omega_Y}^2}\max\Big\{\min\{\mathbb{P}(Y<y_1|X=i),\mathbb{P}(Y<y_2|X=k)\}\nonumber\\
&\hspace{0.2cm}-\max\{\mathbb{P}(Y<y_1|X=j),\mathbb{P}(Y<y_2|X=h)\},0\Big\}dy_1dy_2.
%\end{aligned}
\end{align}
\end{theorem}



\subsection{Bounding the product moment of causal effects}

The monotonicity Assumption \ref{MONO2} may sometimes be considered implausible by researchers. 
%For example, Example 2 does not satisfy Assumption \ref{MONO2} when $\Omega_{X}=\{-1,0,1\}$.
Therefore, we derive bounds for the product moment of causal effects that do not rely on Assumption \ref{MONO2}.


%Assumption \ref{MONO2} is sometimes implausible for researchers.
%For example,Example 2 does not satisfy Assumption \ref{MONO2} for $\Omega_{X}=\{-1,0,1\}$.
%Thus, we provide the bounds of the product moment of causal effects without Assumption \ref{MONO2}.


We first derive  bounds for the joint distribution of  potential outcomes $\mathbb{P}(Y_j<y_1\leq Y_i,Y_h<y_2\leq Y_k)$.
\begin{lemma}
\label{lem6}
Under SCM ${\cal M}$ and Assumptions \ref{ASEXO2} and \ref{exi2}, for any $i,j,k,h \in \{1,\dots,R\}$ and $y_1, y_2 \in \Omega_Y$,
we have $l(y_1,y_2;i,j,k,h)\leq \mathbb{P}(Y_j<y_1\leq Y_i,Y_h<y_2\leq Y_k)\leq u(y_1,y_2;i,j,k,h)$, where
\begin{align}
&l(y_1,y_2;i,j,k,h)=\nonumber\\
&\hspace{0cm}\max\Big\{\mathbb{P}(Y<y_1|X=j)-\mathbb{P}(Y <y_1|X=i)\nonumber\\
&\hspace{0cm}+\mathbb{P}(Y<y_2|X=h)-\mathbb{P}(Y<y_2|X=k)-1,0\Big\},\\
&u(y_1,y_2;i,j,k,h)=\nonumber\\
&\hspace{0cm}\min\Big\{\min\{\mathbb{P}(Y<y_1|X=j),\mathbb{P}(Y<y_2|X=h)\},\nonumber\\
&\hspace{0cm}1-\max\{\mathbb{P}(Y<y_1|X=i),\mathbb{P}(Y<y_2|X=k)\}\Big\}.
\end{align}
%for each $i,j,k,h \in \{1,\dots,R\}$ and $y_1, y_2 \in \Omega_Y$.
\end{lemma}
Then, we have the following theorem.
\begin{theorem}[Bounds of the product moments of causal effects]
\label{theo4}
Under SCM ${\cal M}$ and Assumptions \ref{ASEXO2} and \ref{exi2}, for any $i,j,k,h \in \{1,\dots,R\}$, we have $\sigma_L(i,j;k,h) \leq \rho_{i,j;k,h} \leq \sigma_U(i,j;k,h)$, where
\begin{align}
\label{eq25}
%\begin{aligned}
\sigma_L(i,j;k,h)\nonumber
&=\int_{{\Omega_Y}^2}l(y_1,y_2;i,j,k,h)dy_1dy_2\nonumber\\
&-\int_{{\Omega_Y}^2}u(y_1,y_2;j,i,k,h)dy_1dy_2\nonumber\\
&-\int_{{\Omega_Y}^2}u(y_1,y_2;i,j,h,k)dy_1dy_2\nonumber\\
&+\int_{{\Omega_Y}^2}l(y_1,y_2;j,i,h,k)dy_1dy_2,\\
\label{eq26}
\sigma_U(i,j;k,h)\nonumber
&=\int_{{\Omega_Y}^2}u(y_1,y_2;i,j,k,h)dy_1dy_2\nonumber\\
&-\int_{{\Omega_Y}^2}l(y_1,y_2;j,i,k,h)dy_1dy_2\nonumber\\
&-\int_{{\Omega_Y}^2}l(y_1,y_2;i,j,h,k)dy_1dy_2\nonumber\\
&+\int_{{\Omega_Y}^2}u(y_1,y_2;j,i,h,k)dy_1dy_2.
%\end{aligned}
\end{align}
\end{theorem}
If $\sigma_U(i,j;k,h)=\infty$ and $\sigma_L(i,j;k,h)=-\infty$, then the bounds are uninformative about $\rho_{i,j;k,h}$.
{The above bounds for product moments are not sharp.}



\textbf{Remark.}  We present a similar identification theorem and bounds for the central product moment (covariance) of causal effects in Appendix \ref{appC}. 
Additionally, the correlation of causal effects is also bounded, as shown in Appendix \ref{appC}.


