\documentclass{uai2025} % for initial submission
%\documentclass[accepted]{uai2025} % after acceptance, for a revised version; 
% also before submission to see how the non-anonymous paper would look like 
       

% \removed{<text>}: swallows its single argument and typesets nothing.
\newcommand{\removed}[1]{}
\usepackage{times}
\usepackage{soul}
\usepackage{url}
%\usepackage{hyperref}
\usepackage[utf8]{inputenc}
%\usepackage[small]{caption}
\usepackage{graphicx}
\usepackage{amsmath}
\usepackage{amsthm}
\usepackage{booktabs}
\usepackage{algorithm}
\usepackage{algorithmic}
%\usepackage[switch]{lineno}
\usepackage{stackengine}
% \defeq: relation symbol made of an equals sign with a small \Delta stacked
% 1pt above it (\stackon and \ensurestackMath come from stackengine);
% \mathrel gives it relation spacing.
\def\defeq{\mathrel{\ensurestackMath{\stackon[1pt]{=}{\scriptscriptstyle\Delta}}}}


\usepackage{algorithm}
\usepackage{algorithmic}

% Set the typeface to Times Roman
\usepackage{times}

%\usepackage{hyperref}
\usepackage{url}

\usepackage{amsmath}
%\usepackage{wrapfig,lipsum,booktabs}

\usepackage{amssymb}
\usepackage{mathtools}
\usepackage{amsthm}


\usepackage{algorithmic}

\usepackage{lscape}
% if you use cleveref..
\usepackage[capitalize,noabbrev]{cleveref}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% THEOREMS
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
\theoremstyle{plain}

% Todonotes is useful during development; simply uncomment the next line
%    and comment out the line below the next line to turn off comments
%\usepackage[disable,textsize=tiny]{todonotes}
\usepackage[textsize=tiny]{todonotes}
\usepackage{multirow}

\usepackage{ascmac}
%\usepackage{fancybx}
\usepackage{float}
\usepackage{perpage}
\MakeSorted{figure}
\MakeSorted{table}

\usepackage{url}
\usepackage{natbib}
\usepackage{chapterbib}

\usepackage{color}
\usepackage{tikz}
% TikZ node styles: both are small drawn circles; they differ only in fill.
\tikzset{%
mynode/.style={circle,minimum width=.5ex, fill=none,draw}, % outlined circle, no filling
myfillnode/.style={circle,minimum width=.5ex, fill=lightgray,draw}, % outlined circle, filled with light gray
}
\usepackage{amssymb}
\usepackage{natbib}

% Text-mode shortcuts for upright Roman numerals; the negative \hspace tightens
% the gap between letters. Each body opens its own $...$, so use these in
% running text rather than inside math mode.
% NOTE(review): the digit in a macro name does not always match the numeral it
% prints (\0 prints I, \6 prints lowercase iv) -- confirm the intended naming.
\newcommand{\0}{$\mathrm{I}$} % prints I
\newcommand{\2}{$\mathrm{I}\hspace{-1.2pt}\mathrm{I}$} % prints II
\newcommand{\3}{$\mathrm{I}\hspace{-1.2pt}\mathrm{I}\hspace{-1.2pt}\mathrm{I}$} % prints III
\newcommand{\4}{$\mathrm{I}\hspace{-1.2pt}\mathrm{V}$} % prints IV
% Disabled lowercase variants (the \3 and \4 below would clash with the
% uppercase definitions above if re-enabled):
%\newcommand{\3}{$\mathrm{i}$}
%\newcommand{\4}{$\mathrm{i}\hspace{-0.8pt}\mathrm{i}$}
%\newcommand{\5}{$\mathrm{i}\hspace{-0.8pt}\mathrm{i}\hspace{-0.8pt}\mathrm{i}$}
\newcommand{\6}{$\mathrm{i}\hspace{-0.8pt}\mathrm{v}$} % prints lowercase iv
% \indep: double-perpendicular symbol built from two \perp glyphs pulled
% together by three negative thin spaces (\!); conventionally read as
% "is independent of". Math mode only, since \perp is a math symbol.
\newcommand{\indep}{\perp \!\!\! \perp}
\usepackage{amsmath}               
\usepackage{lscape}
\usepackage{algorithm}
%\usepackage[dvipdfmx]{graphicx}
%\bibliographystyle{unsrtnat}
%\DeclareMathOperator*{\argmin}{arg\,min}
%\DeclareMathOperator*{\argmax}{arg\,max}
\usepackage{color}
\usepackage{tikz}
% The \icmltitle you define below is probably too long as a header.
% Therefore, a short form for the running title is supplied here:
\usepackage{amsmath,amsthm}
% Theorem-like environments (amsthm). No shared-counter optional argument is
% given, so each environment is numbered by its own independent counter.
\newtheorem{theorem}{Theorem}
\newtheorem{definition}{Definition}
\newtheorem{assumption}{Assumption}
\newtheorem{lemma}{Lemma}
\newtheorem{proposition}{Proposition}
\newtheorem{corollary}{Corollary}
\usepackage{multirow}
\usepackage{comment}
\usepackage{here}
\allowdisplaybreaks[4]
%\usepackage{bbm}
\usepackage{caption}
\usepackage{bbding}
\usepackage{arydshln}
\usepackage{afterpage}

%\usepackage{algpseudocode}
\usepackage{mathrsfs}
% \plim: upright math operator printed as "p-lim"; the starred declaration
% places sub/superscripts below/above the operator in display style.
\DeclareMathOperator*{\plim}{p-lim}

% Colored inline annotation macros (presumably per-coauthor drafting notes --
% confirm before relying on the attribution):
%   \jin{..}   blue text wrapped in double square brackets
%   \jina{..}  blue text
%   \yuta{..}  red text
%   \error{..} green text
\newcommand{\jin}[1]{\textcolor{blue}{[[#1]]}}
\newcommand{\jina}[1]{\textcolor{blue}{#1}}
\newcommand{\yuta}[1]{\textcolor{red}{#1}}
\newcommand{\error}[1]{\textcolor{green}{#1}}
\usepackage{soul}


% If accepted, instead use the following line for the camera-ready submission:
%\usepackage[accepted]{icml2024}

% For theorems and such
\usepackage{amsmath}
\usepackage{amssymb}
\usepackage{mathtools}
\usepackage{amsthm}
                 
%% There is a class option to choose the math font
% \documentclass[mathfont=ptmx]{uai2024} % ptmx math instead of Computer
                                         % Modern (has noticeable issues)
% \documentclass[mathfont=newtx]{uai2024} % newtx fonts (improves upon
                                          % ptmx; less tested, no support)
% NOTE: Only keep *one* line above as appropriate, as it will be replaced
%       automatically for papers to be published. Do not make any other
%       change above this note for an accepted version.

%% Choose your variant of English; be consistent
\usepackage[american]{babel}
% \usepackage[british]{babel}

%% Some suggested packages, as needed:
\usepackage{natbib} % has a nice set of citation styles and commands
    \bibliographystyle{plainnat}
    \renewcommand{\bibsection}{\subsubsection*{References}}
\usepackage{mathtools} % amsmath with fixes and additions
% \usepackage{siunitx} % for proper typesetting of numbers and units
\usepackage{booktabs} % commands to create good-looking tables
\usepackage{tikz} % nice language for creating drawings and diagrams

%% Provided macros
% \smaller: Because the class footnote size is essentially LaTeX's \small,
%           redefining \footnotesize, we provide the original \footnotesize
%           using this macro.
%           (Use only sparingly, e.g., in drawings, as it is quite small.)

%% Self-defined macros
% \swap[<sep>]{<a>}{<b>}: prints <b>, then <sep> (default "-"), then <a>.
\newcommand{\swap}[3][-]{#3#1#2} % just an example

\title{Moments of Causal Effects}

% The standard author block has changed for UAI 2024 to provide
% more space for long author lists and allow for complex affiliations
%
% All author information is automatically removed by the class for the
% anonymous submission version of your paper, so you can already add your
% information below.
%
% Add authors
\author[1]{\href{mailto:<jj@example.edu>?Subject=Your UAI 2024 paper}{Jane~J.~von~O'L\'opez}{}}
\author[1]{Harry~Q.~Bovik}
\author[1,2]{Further~Coauthor}
\author[3]{Further~Coauthor}
\author[1]{Further~Coauthor}
\author[3]{Further~Coauthor}
\author[3,1]{Further~Coauthor}
% Add affiliations after the authors
\affil[1]{%
    Computer Science Dept.\\
    Cranberry University\\
    Pittsburgh, Pennsylvania, USA
}
\affil[2]{%
    Second Affiliation\\
    Address\\
    …
}
\affil[3]{%
    Another Affiliation\\
    Address\\
    …
  }
  
\begin{document}



Thank you for your valuable feedback and positive review of our paper.

>Comment:
In practice, how well will we accept the SCM with two mediators at the first place?

Our response:
Causal mediation analysis of the total effect $E[Y_{x}-Y_{x'}]$ with two or more mediators has been studied across various fields, including AI [Avin et al., 2005; Shpitser and Pearl, 2008], medicine [Albert and Nelson, 2011; VanderWeele and Vansteelandt, 2014;  Daniel et al., 2015; Vansteelandt and Daniel, 2017], and political science [Zhou and Yamamoto, 2023]. For example, Daniel et al. (2015) studied the effect of heavy drinking in the previous year on systolic blood pressure, mediated through body mass index (BMI) and gamma-glutamyl transpeptidase (GGT).
The linear structural causal model (SCM) given in the last paragraph on page 2  represents one of the most widely used frameworks in mediation analysis involving multiple mediators [e.g., Daniel et al., 2015]. 
This commonly used model satisfies the stated assumptions.

>Comment:
(i) In Figure 1, plot SCM ${\cal M}_1$ in addition to ${\cal M}_2$ will help readibility.

Our response:
We will add a causal graph representing SCM ${\cal M}_1$ in Figure 1.

>Comment:
(ii) This paper is notation heavy, the potential outcomes and total order can be quite dense for applied researchers. (Maybe) the authors can start with univariate case and then naturally extend to multivariate setting.

Our response:
We will add the following sentence after the sentence "We use $\preceq$ to denote a total order." in Section 2:

"In the univariate case, the total order $\preceq$ reduces to the standard order $\leq$."

The notation remains nearly unchanged if we use $\leq$.

>Comment:
(iii) Consider adding illustrative example (for example, linear SCM).
I really like the 4 questions trying to answer in the first page, something more concrete along this line will be good to have.

Our response:
We will revise the paper to use the linear SCM as an illustrative example wherever appropriate.

>Comment:
(i) If the assumptions do not hold, can we bound the probability of causation in certain settings?

Our response:
We will add a discussion of bounding along the following lines: In settings where the monotonicity assumption does not hold, we can aim to derive bounds for the path-specific PNS [Tian and Pearl, 2000] [1]. One approach is to use Fréchet inequalities [2]. Deriving such bounds for the path-specific PNS is left for future work.

[1]  Li, Ang, and Judea Pearl. "Probabilities of causation with nonbinary treatment and effect." Proceedings of the AAAI Conference on Artificial Intelligence. Vol. 38. No. 18. 2024.

[2] Fréchet, Maurice. "Sur les tableaux dont les marges et des bornes sont données." Revue de l'Institut international de statistique (1960): 10-32.

>Comment:
(ii) Are the assumptions minimum in order for identification result to hold?

Our response:
We have avoided imposing any apparently unnecessary assumptions. Monotonicity is a common assumption for achieving identification in the literature; however, we are not aware of any claim about the necessity of this condition.

>Comment:
(iii) If paths $X \rightarrow M \rightarrow Y$ and $X \rightarrow N \rightarrow Y$ are not causal, can we answer all the questions building upon previous one mediator result?


Our response:
When the only causal path is $X \rightarrow M \rightarrow N \rightarrow Y$, (Q-a1) reduces to (Q-a) and (Q-b1) reduces to (Q-b) by treating $\{M,N\}$ as a single variable.
We can answer the questions using the one-mediator results.

>Comment:
(iv) Which assumptions are testable?

Our response: 
To our understanding, these assumptions are not testable from observational data alone.














%\jina{When the path $X \rightarrow M \rightarrow Y$ or $X \rightarrow N \rightarrow Y$ doesn't exist, (Q-a1) reduces to (Q-a) and (Q-b2) reduces (Q-b). We can answer the questions using the one-mediator results. }
%\jin{Is the above answer applicable for the case that the only caual path is $X \rightarrow M \rightarrow N \rightarrow Y$?}



%\yuta{When the path $X \rightarrow N \rightarrow Y$ doesn't exist, (Q-a1) reduces to (Q-a) and (Q-b2) reduces (Q-b). When the path $X \rightarrow M \rightarrow Y$ doesn't exist, (Q-a1) reduces to (Q-a) and (Q-a2) reduces (Q-b) by treating $\{M,N\}$ as a single variable. When the only path $X \rightarrow M \rightarrow N \rightarrow Y$ exist, (Q-a1) reduces to (Q-a) and (Q-b1) reduces (Q-b) by treating $\{M,N\}$ as a single variable. We can answer the questions using the one-mediator results.}



%None of the assumptions are testable. Thus, violations of monotonicity and the presence of confounders between treatment and mediator, mediator and outcome, or treatment and outcome always pose risks in the analysis.



%If you are referring to the case where there is no arrow between $M$ and $N$, then the answer is no. Even if there is no arrow between $M$ and $N$, the questions still depend on both variables, and our path-specific PNS relies on both $M$ and $N$. \jin{But (Q-a1) and (Q-b1) reduce to (Q-a) and (Q-b) respectively by treating  $\{M,N\}$ as a single variable.  }
%\jin{I think the reviewer refers to the case where paths $X \rightarrow M \rightarrow Y$ and $X \rightarrow N \rightarrow Y$ don't exist (?). In this case, can we treat {M, N} as a single variable and use the previous one mediator result?  }

%\yuta{Even when the case where paths $X \rightarrow M \rightarrow Y$ and $X \rightarrow N \rightarrow Y$ don't exist, we cannot answer (Q-a1), (Q-a2), (Q-b1), or (Q-b2) using previous one-mediator results, since these questions explicitly presume the presence of two mediators. \jin{But (Q-a1) and (Q-b1) reduce to (Q-a) and (Q-b) respectively by treating  $\{M,N\}$ as a single variable.  }
%Instead, we can answer (Q-a) and (Q-b) by previous one mediator result for single mediator $M$, $N$, or the joint mediator set $\{M,N\}$. \jin{It's unclear to me what (Q-a) and (Q-b) means in this setting, even less what "we can answer (Q-a) and (Q-b) by previous one mediator result" means. }}

%\jin{Ignore the following from the rebuttal.}

%\yuta{
%When the path $X \rightarrow N \rightarrow Y$ doesn't exist, (Q-a1) reduces to (Q-a) and (Q-b2) reduces (Q-b). Since we have $Y_{x',{M}_{x},{N}_{x,{M}_{x}}}=Y_{x',{M}_{x}}$ and $Y_{x',{M}_{x},{N}_{x',{M}_{x'}}}=Y_{x',{M}_{x}}$ when the path $X \rightarrow N \rightarrow Y$ doesn't exist, the path-specific PNS become
%\begin{align}
%&\text{\normalfont PNS}^{X \rightarrow Y}(y;x',x,{\cal E},c)\defeq\mathbb{P}(Y_{x'} \prec y \preceq Y_{x}, Y_{x',{M}_{x}} \prec y,\nonumber\\
%&\hspace{3cm} Y_{x',{M}_{x},{N}_{x,{M}_{x}}} \prec y|{\cal E},C=c)\\
%&=\mathbb{P}(Y_{x'} \prec y \preceq Y_{x}, Y_{x',{M}_{x}} \prec y),\\
%&\text{\normalfont PNS}^{X \rightarrow {N} \rightarrow  Y}(y;x',x,{\cal E},c)\defeq\nonumber\\
%&\hspace{1cm}\mathbb{P}(Y_{x'} \prec y \preceq Y_{x}, Y_{x',{M}_{x}} \prec y,\nonumber\\
%&\hspace{3cm} y \preceq  Y_{x',{M}_{x},{N}_{x,{M}_{x}}}|{\cal E},C=c)=0,\\
%&\text{\normalfont PNS}^{X \rightarrow {M} \rightarrow {N} \rightarrow  Y}(y;x',x,{\cal E},c)\defeq\nonumber\\
%&\hspace{1cm}\mathbb{P}(Y_{x'} \prec y \preceq Y_{x},y \preceq Y_{x',{M}_{x}},\nonumber\\
%&\hspace{2.5cm}Y_{x',{M}_{x},{N}_{x',{M}_{x'}}} \prec y|{\cal E},C=c)=0,\\
%&\text{\normalfont PNS}^{X \rightarrow {M}  \rightarrow  Y}(y;x',x,{\cal E},c)\defeq\nonumber\\
%&\hspace{1cm}\mathbb{P}(Y_{x'} \prec y \preceq Y_{x},y \preceq Y_{x',{M}_{x}},\nonumber\\
%&\hspace{2.5cm}y \preceq Y_{x',{M}_{x},{N}_{x',{M}_{x'}}}|{\cal E},C=c)\\
%&=\mathbb{P}(Y_{x'} \prec y \preceq Y_{x},y \preceq Y_{x',{M}_{x}}).
%\end{align}
%Then, $\text{\normalfont PNS}^{X \rightarrow Y}(y;x',x,{\cal E},c)$ and $\text{\normalfont PNS}^{X \rightarrow {M}  \rightarrow  Y}(y;x',x,{\cal E},c)$ reduce to ND-PNS and NI-PNS with evidence.
%}


%\yuta{
%When the path $X \rightarrow M \rightarrow Y$ doesn't exist, (Q-a1) reduces to (Q-a) and (Q-a2) reduces (Q-b) by treating $\{M,N\}$ as a single variable.
%Since we have $Y_{x',{M}_{x},{N}_{x,{M}_{x}}}=Y_{x',{N}_{x,{M}_{x}}}$ and $Y_{x',{M}_{x},{N}_{x',{M}_{x'}}}=Y_{x',{N}_{x',{M}_{x'}}}$ when the path $X \rightarrow M \rightarrow Y$ doesn't exist, the path-specific PNS become
%\begin{align}
%&\text{\normalfont PNS}^{X \rightarrow Y}(y;x',x,{\cal E},c)\defeq\mathbb{P}(Y_{x'} \prec y \preceq Y_{x}, Y_{x',{M}_{x}} \prec y,\nonumber\\
%&\hspace{3cm} Y_{x',{M}_{x},{N}_{x,{M}_{x}}} \prec y|{\cal E},C=c)\\
%&=\mathbb{P}(Y_{x'} \prec y \preceq Y_{x},Y_{x',{N}_{x,{M}_{x}}} \prec y|{\cal E},C=c),\\
%&\text{\normalfont PNS}^{X \rightarrow {N} \rightarrow  Y}(y;x',x,{\cal E},c)\defeq\nonumber\\
%&\hspace{1cm}\mathbb{P}(Y_{x'} \prec y \preceq Y_{x}, Y_{x',{M}_{x}} \prec y,\nonumber\\
%&\hspace{3cm} y \preceq  Y_{x',{M}_{x},{N}_{x,{M}_{x}}}|{\cal E},C=c)\\
%&=\mathbb{P}(Y_{x'} \prec y \preceq Y_{x}, y \preceq  Y_{x',{N}_{x,{M}_{x}}}|{\cal E},C=c),\\
%&\text{\normalfont PNS}^{X \rightarrow {M} \rightarrow {N} \rightarrow  Y}(y;x',x,{\cal E},c)\defeq\nonumber\\
%&\hspace{1cm}\mathbb{P}(Y_{x'} \prec y \preceq Y_{x},y \preceq Y_{x',{M}_{x}},\nonumber\\
%&\hspace{2.5cm}Y_{x',{M}_{x},{N}_{x',{M}_{x'}}} \prec y|{\cal E},C=c)=0,\\
%&\text{\normalfont PNS}^{X \rightarrow {M}  \rightarrow  Y}(y;x',x,{\cal E},c)\defeq\nonumber\\
%&\hspace{1cm}\mathbb{P}(Y_{x'} \prec y \preceq Y_{x},y \preceq Y_{x',{M}_{x}},\nonumber\\
%&\hspace{2.5cm}y \preceq Y_{x',{M}_{x},{N}_{x',{M}_{x'}}}|{\cal E},C=c)=0.
%\end{align}
%Then, $\text{\normalfont PNS}^{X \rightarrow Y}(y;x',x,{\cal E},c)$ and $\text{\normalfont PNS}^{X \rightarrow {N} \rightarrow  Y}(y;x',x,{\cal E},c)$ reduce to ND-PNS and NI-PNS with evidence by treating $\{M,N\}$ as a single variable.
%}

%\yuta{Then, when paths $X \rightarrow M \rightarrow Y$ and $X \rightarrow N \rightarrow Y$ don't exist, we can answer all the questions in this paper by one-mediator results.}


\end{document}

%All assumptions in this paper are extensions of those used in simpler cases, such as the single-mediator setting. We present a linear structural causal model (SCM) with two mediators on page 2 (right column), which represents one of the most widely used frameworks in mediation analysis involving multiple mediators. This commonly used model satisfies the stated assumptions.





%\jin{Does this make sense? a good idea?}
%\yuta{[Yes, I will provide the explicit form of Definition 3.1 using linear SCM.]}
%The experimental settings presented in the main body of the paper and in Appendix D serve as illustrative examples. We also provide the corresponding estimates of our proposed measures within these settings.

%The settings on Appendix D show the three illustrative cases: (1) no effect between ${M}$ and ${N}$, (2) no effect between $\{{M},{N}\}$ and $Y$, and (3) only effect through $X \rightarrow {M} \rightarrow {N} \rightarrow Y$.

%\jin{Remove the following.}

%We can provide the bounds of our path-specific PNS with no evidence using Frécht inequalities. For example, $\text{\normalfont PNS}^{X \rightarrow Y}(y;x',x,\emptyset,c)$
%\defeq\mathbb{P}(Y_{x'} \prec y \preceq Y_{x}, Y_{x',{M}_{x}} \prec y,Y_{x',{M}_{x},{N}_{x,{M}_{x}}} \prec y|C=c)$ is bounded by $\max\{\mathbb{P}(Y_{x'} \prec y|C=c)+\mathbb{P}(y \preceq Y_{x}|C=c)+\mathbb{P}(Y_{x',{M}_{x}} \prec y|C=c)+\mathbb{P}(Y_{x',{M}_{x},{N}_{x,{M}_{x}}} \prec y|C=c)-3,0\} \leq \text{\normalfont PNS}^{X \rightarrow Y}(y;x',x,\emptyset,c) \leq \min\{\mathbb{P}(Y_{x'} \prec y|C=c),\mathbb{P}(y \preceq Y_{x}|C=c),\mathbb{P}(Y_{x',{M}_{x}} \prec y|C=c),\mathbb{P}(Y_{x',{M}_{x},{N}_{x,{M}_{x}}} \prec y|C=c)\}$.


%We will provide all cases and add the following discussion.

%"The bounds derived from the Fréchet inequalities are not sharp [1], and obtaining tighter bounds remains a challenging mathematical problem. Some studies [2,3] provide improved Fréchet–Hoeffding bounds by incorporating additional information. This will be a future work."

%[1] Nelsen, Roger B. An introduction to copulas. springer, 2006.


%[2] Lux, Thibaut, and Antonis Papapantoleon. "Improved Fréchet–Hoeffding bounds on d-copulas and applications in model-free finance." (2017): 3633-3671.

%[3] Bartl, Daniel, et al. "Marginal and dependence uncertainty: bounds, optimal transport, and sharpness." arXiv preprint arXiv:1709.00641 (2017).





%We do not claim that the assumptions in our theorems are necessary conditions; however, we have avoided imposing any apparently unnecessary assumptions.
