
%In this section, we show the backgrounds and notations in this paper.
We represent each variable with a capital letter $(X)$ and its realized value with a small letter $(x)$.
Let $\mathbb{I}(x)$ be the indicator function, which takes the value $1$ if $x$ is true and $0$ if $x$ is false.
Let $\Omega_Y$ denote the domain of $Y$,
$\mathbb{E}[Y]$ the expectation of $Y$, $\mathbb{P}(Y\leq y)$ the cumulative distribution function (CDF) of a continuous variable $Y$, and $\mathbb{P}(Y)$ the probability of a discrete variable $Y$.
%In addition, let $\mathbb{P}(Y\leq y|X=x)$ and $\mathbb{P}(Y= y|X=x)$ be the conditional CDF and probability given $X=x$.
We write $X \indep Y|C$ if $X$ and $Y$ are conditionally independent given $C$.


{\bf Total order over vector space.} 
We denote a total order on vectors of variables by $\prec$. 
For example, under the lexicographical order \citep{Harzheim2005}, two-dimensional vectors are ordered as $(y_1, y_2) \prec_{\text{lexi}} (y'_1, y'_2)$ if ``$y_1 < y'_1$'', or ``$y_1 = y'_1$ and $y_2 < y'_2$''. 
A formal definition of the lexicographical order is given in Appendix~\ref{app0}.


{\bf Structural Causal Models (SCM).} We use the language of SCMs as our basic semantic and inferential framework \citep{Pearl09}.
An SCM ${\cal M}$ is a tuple $\left<{\boldsymbol V},{\boldsymbol U}, {\cal F}, \mathbb{P}_{\boldsymbol U} \right>$, where ${\boldsymbol U}$ is a set of exogenous (unobserved) variables following a distribution $\mathbb{P}_{\boldsymbol U}$, and ${\boldsymbol V}$ is a set of endogenous (observable) variables whose values are determined by structural functions ${\cal F}=\{f_{V_i}\}_{V_i \in {\boldsymbol V}}$ such that $v_i:= f_{V_i}({\mathbf{pa}}_{V_i},{\boldsymbol u}_{V_i})$, where ${\mathbf{PA}}_{V_i} \subseteq {\boldsymbol V}$ and ${\boldsymbol U}_{V_i} \subseteq {\boldsymbol U}$. 
Each SCM ${\cal M}$ induces an observational distribution $\mathbb{P}_{\boldsymbol V}$ over ${\boldsymbol V}$, and a causal graph $G({\cal M})$ over ${\boldsymbol V}$ in which there exists a directed edge from every variable in ${\mathbf{PA}}_{V_i}$ to $V_i$.
An intervention of setting a set of endogenous variables ${\boldsymbol X}$ to constants ${\boldsymbol x}$, denoted by $do({\boldsymbol x})$, replaces the original equations of ${\boldsymbol X}$
 by the constants ${\boldsymbol x}$ and induces a \textit{sub-model}  ${\cal M}_{{\boldsymbol x}}$.
We denote the potential outcome $Y$ under intervention $do({\boldsymbol x})$ by $Y_{{\boldsymbol x}}({\boldsymbol u})$, which is the solution of $Y$ in the sub-model ${\cal M}_{{\boldsymbol x}}$ given ${\boldsymbol U}={\boldsymbol u}$. 


{\bf Probabilities of Causation (PoC).} 
%We show the definitions and an identification theorem of probabilities of causation with binary treatment and outcome.
Let $X$ be a binary treatment taking values $x_0$ and $x_1$, and $Y$ be a binary outcome taking values $y_0$ and $y_1$. PoC are defined as follows:
\begin{definition}[PoC]
\label{def1}
The probability of necessity and sufficiency (PNS), the probability of necessity (PN), and the probability of sufficiency (PS) are defined as follows \citep{Pearl1999}:
    \begin{equation}
    \begin{aligned}
    &\text{PNS}\defeq\mathbb{P}(Y_{x_0}=y_0,Y_{x_1}=y_1),\\
    &\text{PN}\defeq\mathbb{P}(Y_{x_0}=y_0|Y=y_1,X=x_1),\\
   &\text{PS}\defeq\mathbb{P}(Y_{x_1}=y_1|Y=y_0,X=x_0).
        \end{aligned}
    \end{equation}
\end{definition}
\citet{Tian2000} show that these PoC are identified under the following assumptions.
%\yuta{They give two assumptions for identifying PNS, PN, and PS.
\begin{assumption}[Exogeneity]
\label{BEXO}
    $Y_{x_0} \indep X$ and $Y_{x_1} \indep X$.
\end{assumption}
\begin{assumption}[Monotonicity]
\label{BMONO}
    $\mathbb{P}(Y_{x_0}=y_1,Y_{x_1}=y_0)=0$.
\end{assumption}
%\citet{Tian2000} gave the following identification results:
%\begin{theorem}[Identification of PoC]
    %If $X$ is exogenous
    %, i.e., $Y_{x_0} \indep X$ and $Y_{x_1} \indep X$, 
    %$X \indep U$,
     %and $Y$ is monotonic relative to $X$,
     %, i.e., $\mathbb{P}(Y_{x_0}=y_1,Y_{x_1}=y_0)=0$,
     Under Assumptions~\ref{BEXO} and~\ref{BMONO},
     the PoC are identified as follows \citep{Tian2000}:
    \begin{equation}
        \begin{aligned}
        &\text{PNS}=\mathbb{P}(Y=y_1|X=x_1)-\mathbb{P}(Y=y_1|X=x_0),\\
        &\text{PN}=\frac{\mathbb{P}(Y=y_1|X=x_1)-\mathbb{P}(Y=y_1|X=x_0)}{\mathbb{P}(Y=y_1|X=x_1)},\\
        &\text{PS}=\frac{\mathbb{P}(Y=y_1|X=x_1)-\mathbb{P}(Y=y_1|X=x_0)}{\mathbb{P}(Y=y_0|X=x_0)}.
        \end{aligned}
    \end{equation}
%\end{theorem}




%\jin{Move the whole Orders part to the appendix.}\\