\section{Additional Information on Application}
\label{appB}

%\subsection{Additional Information on Application}


In this section, we provide additional information on the application.

\subsection{Details of Dataset}
First, we describe all variables used in the application.
We use the following variables as \textbf{outcomes}.
\begin{enumerate}
%these grades are related with the course subject, Math or Portuguese:
\item G1 - first period grade (numeric: from 0 to 20)
\item G2 - second period grade (numeric: from 0 to 20)
\item G3 - final grade (numeric: from 0 to 20, output target)
\end{enumerate}
We use the following variables as \textbf{treatments}.
\begin{enumerate}
    \item studytime - weekly study time (numeric: 1 - $<$2 hours, 2 - 2 to 5 hours, 3 - 5 to 10 hours, or 4 - $>$10 hours)
    \item paid - extra paid classes within the course subject (Math or Portuguese) (binary: yes or no)
\end{enumerate}
We list the remaining variables as potential \textbf{covariates}.
\begin{enumerate}
\item school - student's school (binary: 'GP' - Gabriel Pereira or 'MS' - Mousinho da Silveira)
\item sex - student's sex (binary: 'F' - female or 'M' - male)
\item age - student's age (numeric: from 15 to 22)
\item address - student's home address type (binary: 'U' - urban or 'R' - rural)
\item famsize - family size (binary: 'LE3' - less or equal to 3 or 'GT3' - greater than 3)
\item Pstatus - parent's cohabitation status (binary: 'T' - living together or 'A' - apart)
\item Medu - mother's education (numeric: 0 - none,  1 - primary education (4th grade), 2 - 5th to 9th grade, 3 - secondary education or 4 - higher education)
\item Fedu - father's education (numeric: 0 - none,  1 - primary education (4th grade), 2 - 5th to 9th grade, 3 - secondary education or 4 - higher education)
\item Mjob - mother's job (nominal: 'teacher', 'health' care related, civil 'services' (e.g. administrative or police), 'at home' or 'other')
\item Fjob - father's job (nominal: 'teacher', 'health' care related, civil 'services' (e.g. administrative or police), 'at home' or 'other')
\item reason - reason to choose this school (nominal: close to 'home', school 'reputation', 'course' preference or 'other')
\item guardian - student's guardian (nominal: 'mother', 'father' or 'other')
\item traveltime - home to school travel time (numeric: 1 - $<$15 min., 2 - 15 to 30 min., 3 - 30 min. to 1 hour, or 4 - $>$1 hour)
\item failures - number of past class failures (numeric: $n$ if $1 \le n < 3$, else 4)
\item schoolsup - extra educational support (binary: yes or no)
\item famsup - family educational support (binary: yes or no)
\item activities - extra-curricular activities (binary: yes or no)
\item nursery - attended nursery school (binary: yes or no)
\item higher - wants to take higher education (binary: yes or no)
\item internet - Internet access at home (binary: yes or no)
\item romantic - with a romantic relationship (binary: yes or no)
\item famrel - quality of family relationships (numeric: from 1 - very bad to 5 - excellent)
\item freetime - free time after school (numeric: from 1 - very low to 5 - very high)
\item goout - going out with friends (numeric: from 1 - very low to 5 - very high)
\item Dalc - workday alcohol consumption (numeric: from 1 - very low to 5 - very high)
\item Walc - weekend alcohol consumption (numeric: from 1 - very low to 5 - very high)
\item health - current health status (numeric: from 1 - very bad to 5 - very good)
\item absences - number of school absences (numeric: from 0 to 93)
\end{enumerate}
We show the attributes of the subject with ID number $1$ in Table~\ref{Atab1}.



\begin{table}[tb]
\renewcommand{\arraystretch}{1.1}
\centering
\caption{Attributes of the subject with ID number $1$.}
\label{Atab1}
\begin{tabular}{lllllllllll}
\hline \hline
school & sex & age & address & famsize & Pstatus & Medu & Fedu & Mjob     & Fjob    & reason \\
\hline
GP     & F   & 18  & U       & GT3     & A       & 4    & 4    & at\_home & teacher & course\\
\hline
\hline
guardian & traveltime & studytime & failures & schoolsup & famsup & paid & activities & nursery & higher & internet \\
\hline
mother   & 2          & 2         & 0        & yes       & no     & no   & no         & yes     & yes    & no      \\
\hline
\hline
romantic & famrel & freetime & goout & Dalc & Walc & health & absences & G1 & G2 & G3 \\
\hline
no       & 4      & 3        & 4     & 1    & 1    & 3      & 6        & 5  & 6  & 6 \\
\hline
\end{tabular}
\end{table}


\subsection{Additional Analyses of Application}
We give three additional analyses of the four applications in the body of the paper.

{\bf Effect of study time only.}
First, we evaluate conditional PNS, PN, and PS, letting ${\boldsymbol y}=(6,6,6)$, ${\boldsymbol x}_0=(2,1)$, ${\boldsymbol x}_1=(4,1)$, and ${\boldsymbol c}_1$ in Def. \ref{def41}.
The estimated values of conditional PNS, PN, and PS are 
\begin{equation}
    \begin{aligned}
       &\text{PNS:} &2.491 \% &(\text{CI}: [0.000\%,7.395\%]),\\
       &\text{PN:} &2.709 \% &(\text{CI}: [0.000\%,8.060\%]),\\
      &\text{PS:}  &25.864 \% &(\text{CI}: [0.000\%,73.544\%]),
    \end{aligned}
\end{equation}
respectively.
Second, we evaluate conditional PNS with evidence $({\boldsymbol y}',{\boldsymbol x}',{\boldsymbol c})$, letting ${\boldsymbol y}=(6,6,6)$, ${\boldsymbol y}'=(6,6,5)$, ${\boldsymbol x}_0=(2,1)$,
${\boldsymbol x}_1=(4,1)$, 
${\boldsymbol x}'=(2,1)$, and ${\boldsymbol c}_1$ in Def. \ref{EV1}.
The estimated value is
\begin{equation}
     \text{PNS:}\ \  0.000 \%\ \ \ \  (\text{CI}: [0.000\%,0.000\%]).
\end{equation}
Third, we evaluate conditional PNS with multi-hypothetical terms, letting ${\boldsymbol y}_1=(5,5,5)$, ${\boldsymbol y}_2=(6,6,6)$, ${\boldsymbol x}_0=(1,1)$, ${\boldsymbol x}_1=(2,1)$, ${\boldsymbol x}_2=(4,1)$, and ${\boldsymbol c}_1$ in Def. \ref{EV2}.
The estimated value is
\begin{equation}
     \text{PNS:}\ \  0.000 \%\ \ \ \  (\text{CI}: [0.000\%,0.000\%]).
\end{equation}
Finally, we evaluate conditional PNS with multi-hypothetical terms and evidence $({\boldsymbol y}',{\boldsymbol x}',{\boldsymbol c})$, letting ${\boldsymbol y}_1=(5,5,5)$, ${\boldsymbol y}_2=(6,6,6)$, ${\boldsymbol y}'=(6,6,5)$, ${\boldsymbol x}_0=(1,1)$, ${\boldsymbol x}_1=(2,1)$,
${\boldsymbol x}_2=(4,1)$, 
${\boldsymbol x}'=(2,1)$, and ${\boldsymbol c}_1$ in Def.~\ref{EV3}.
After excluding the NA results, the estimated value is
\begin{equation}
     \text{PNS:}\ \  42.489 \%\ \ \ \  (\text{CI}: [0.000\%,100.000\%]).
\end{equation}




{\bf Effect of extra paid classes only.}
First, we evaluate conditional PNS, PN, and PS, letting ${\boldsymbol y}=(6,6,6)$, ${\boldsymbol x}_0=(1,1)$, ${\boldsymbol x}_1=(2,2)$, and ${\boldsymbol c}_1$ in Def. \ref{def41}.
The estimated values of conditional PNS, PN, and PS are 
\begin{equation}
    \begin{aligned}
       &\text{PNS:} &7.700 \% &(\text{CI}: [1.072\%,16.614\%]),\\
       &\text{PN:} &8.132\% &(\text{CI}: [1.090\%,18.139\%]),\\
      &\text{PS:}  &65.398 \% &(\text{CI}: [37.015\%,89.795\%]),
    \end{aligned}
\end{equation}
respectively.
Second, we evaluate conditional PNS with evidence $({\boldsymbol y}',{\boldsymbol x}',{\boldsymbol c})$, letting ${\boldsymbol y}=(6,6,6)$, ${\boldsymbol y}'=(6,6,5)$, ${\boldsymbol x}_0=(1,1)$,
${\boldsymbol x}_1=(2,2)$, 
${\boldsymbol x}'=(2,1)$, and ${\boldsymbol c}_1$ in Def. \ref{EV1}.
The estimated value is
\begin{equation}
     \text{PNS:}\ \  0.009 \%\ \ \ \  (\text{CI}: [0.000\%,0.139\%]).
\end{equation}


\begin{comment}
{\bf (1).}
We evaluate conditional PNS, PN and PS letting ${\boldsymbol y}=(6,6,6)$, ${\boldsymbol x}_0=(2,1)$, ${\boldsymbol x}_1=(4,2)$, and ${\boldsymbol c}_1$ in Def. \ref{def41}.
First, we estimate by {\bf logistic regression}, including all variables.
The estimated values of PNS, PN, and PS are
\begin{equation}
    \begin{aligned}
       &\text{PNS:} &20.484 \% &(\text{CI}: [0.000\%,99.716\%]),\\
       &\text{PN:} &76.563 \% &(\text{CI}: [0.000\%,99.999\%]),\\
      &\text{PS:}  &33.618 \% &(\text{CI}: [0.000\%,99.999\%]),
    \end{aligned}
\end{equation}
respectively.
Next, we also estimate by {\bf logistic ridge regression} including all variables to avoid data complexities from multicollinearity.
We choose the optimal regularization parameters by cross-validation.
The estimated values of PNS, PN, and PS are
\begin{equation}
    \begin{aligned}
       &\text{PNS:} &1.273 \% &(\text{CI}: [0.000\%,2.620\%]),\\
       &\text{PN:} &2.620 \% &(\text{CI}: [0.000\%,5.752\%]),\\
      &\text{PS:}  &2.495 \% &(\text{CI}: [0.000\%,4.949\%]),
    \end{aligned}
\end{equation}
respectively.
The estimated values by logistic regression including all variables have large variances, and the estimated values by logistic ridge regression including all variables may have large  regularization biases.



{\bf (2).}
We evaluate conditional PNS with evidence $({\boldsymbol y}',{\boldsymbol x}',{\boldsymbol c})$, letting ${\boldsymbol y}_1=(5,5,5)$, ${\boldsymbol y}_2=(6,6,6)$, ${\boldsymbol y}'=(6,6,5)$, ${\boldsymbol x}_0=(1,1)$, ${\boldsymbol x}_1=(2,1)$,
${\boldsymbol x}_2=(4,2)$, 
${\boldsymbol x}'=(2,1)$, and ${\boldsymbol c}_1$ in Def. \ref{EV1}.
First, we estimate by {\bf logistic regression}, including all variables.
The estimated value of PNS is
\begin{equation}
   \text{PNS:}\ \  17.763 \%\ \ \ \  (\text{CI}: [0.000\%,99.642\%]).
\end{equation}
Next, we also estimate by {\bf logistic ridge regression}, including all variables.
We choose the optimal regularization parameters by cross-validation.
The estimated value of PNS is
\begin{equation}
    \text{PNS:}\ \ 3.107 \%\ \ \ \  (\text{CI}: [0.000\%,20.349\%]).
\end{equation}
The estimated values by logistic regression including all variables have large variances, and the estimated values by logistic ridge regression including all variables may have large  regularization biases.


{\bf (3).}
We evaluate conditional PNS with multi-hypothetical terms, letting ${\boldsymbol y}_1=(5,5,5)$, ${\boldsymbol y}_2=(6,6,6)$, ${\boldsymbol x}_0=(1,1)$, ${\boldsymbol x}_1=(2,1)$, ${\boldsymbol x}_2=(4,2)$, and ${\boldsymbol c}_1$ in Def. \ref{EV2}.
First, we estimate by {\bf logistic regression}, including all variables.
The estimated value of PNS is
\begin{equation}
    \text{PNS:}\ \ 0.000 \%\ \ \ \  (\text{CI}: [0.000\%,0.000\%]).
\end{equation}
Next, we also estimate by {\bf logistic ridge regression}, including all variables.
We choose the optimal regularization parameters by cross-validation.
The estimated value of PNS is
\begin{equation}
    \text{PNS:}\ \ 0.000 \%\ \ \ \  (\text{CI}: [0.000\%,0.000\%]).
\end{equation}
The estimated values by logistic regression and logistic ridge regression including all variables are all 0.


{\bf (4).}
We evaluate conditional PNS with multi-hypothetical terms and evidence $({\boldsymbol y}',{\boldsymbol x}',{\boldsymbol c})$, letting ${\boldsymbol y}_1=(5,5,5)$, ${\boldsymbol y}_2=(6,6,6)$, ${\boldsymbol y}'=(6,6,5)$, ${\boldsymbol x}_0=(1,1)$, ${\boldsymbol x}_1=(2,1)$,
${\boldsymbol x}_2=(4,2)$, 
${\boldsymbol x}'=(2,1)$, and ${\boldsymbol c}_1$ in Def. \ref{EV3}.
First, we estimate by {\bf logistic regression}, including all variables.
The estimated value of PNS is
\begin{equation}
    \text{PNS:}\ \ 0.000 \%\ \ \ \  (\text{CI}: [0.000\%,0.000\%]).
\end{equation}
Next, we also estimate by {\bf logistic ridge regression}, including all variables.
We choose the optimal regularization parameters by cross-validation.
The estimated value of PNS is
\begin{equation}
    \text{PNS:}\ \ 0.000 \%\ \ \ \  (\text{CI}: [0.000\%,0.000\%]).
\end{equation}
The estimated values by logistic regression and logistic ridge regression, including all variables, are all 0.

\end{comment}









\begin{comment}
\subsection{Code}
We release the code used for the numerical experiments in this section.

\begin{lstlisting}[caption=Code,label=fuga]
# Resampling-based estimation of PNS, PN and PS for a single subject.
# Two binomial glmnet models are refitted on each resample and evaluated at
# the subject's observed row and at two modified copies of that row.
library(readr)
library(glmnet)
# Read the semicolon-delimited data file.
Data <- read_delim("student+performance/student/student-mat.csv",delim = ";", escape_double = FALSE, trim_ws = TRUE)

# Convert to a numeric matrix and keep only columns 1, 2, 3, 14 and 18.
# NOTE(review): presumably school, sex, age, studytime and paid, following the
# variable order of the dataset description -- confirm against the CSV header.
Data_m<-data.matrix(Data)
Data_m<-Data_m[,c(1,2,3,14,18)]

# Row index of the subject under study and number of resampling iterations.
ID<-1
Ite<-100
# Observed row of the subject (entries 4 and 5 are left as recorded).
NO1<-Data_m[ID,]
### Situation 0
# Copy of the subject's row with entries 4 and 5 both set to 1.
CNO1_0<-Data_m[ID,]
CNO1_0[4]<-1
CNO1_0[5]<-1
### Situation 2
# Copy of the subject's row with entry 4 set to 4 and entry 5 set to 2.
CNO1_2<-Data_m[ID,]
CNO1_2[4]<-4
CNO1_2[5]<-2


N<-length(Data$G1)
# NOTE(review): as.numeric(N) returns a length-1 vector holding the value N,
# not a length-N vector; numeric(N) was probably intended. The loops below
# assign every index 1..N, so the final vectors are unaffected.
Y_1<-as.numeric(N)
Y_2<-as.numeric(N)


# Y_1[i] is first set to 1 when (G3, G2, G1) exceeds (5, 5, 5), comparing G3
# first, then G2, then G1; otherwise 0.
for(i in 1:length(Data$G1)){
  if(Data$G3[i]>5){
    Y_1[i]<-1
  }else if(Data$G3[i]==5&Data$G2[i]>5){
    Y_1[i]<-1
  }
  else if(Data$G3[i]==5&Data$G2[i]==5&Data$G1[i]>5){
    Y_1[i]<-1
  }else{
    Y_1[i]<-0
  }
}
# Flip the indicator: Y_1 is now 1 when (G3, G2, G1) does NOT exceed (5, 5, 5).
Y_1<-1-Y_1

# Same construction with threshold (6, 6, 6).
for(i in 1:length(Data$G1)){
  if(Data$G3[i]>6){
    Y_2[i]<-1
  }else if(Data$G3[i]==6&Data$G2[i]>6){
    Y_2[i]<-1
  }
  else if(Data$G3[i]==6&Data$G2[i]==6&Data$G1[i]>6){
    Y_2[i]<-1
  }else{
    Y_2[i]<-0
  }
}
# Flip the indicator: Y_2 is now 1 when (G3, G2, G1) does NOT exceed (6, 6, 6).
Y_2<-1-Y_2

# One slot per resampling iteration for each estimated quantity.
PNS1<-numeric(Ite)
PN1<-numeric(Ite)
PS1<-numeric(Ite)
PNS2<-numeric(Ite)

for(boot in 1:Ite){
  
  # Draw N row indices with replacement and build the resampled data set.
  ID_s<-sample(1:N, N, replace = TRUE)
  Y_1s<-Y_1[ID_s]
  Y_2s<-Y_2[ID_s]
  Data_s<-Data_m[ID_s,]
  
# Disabled alternative: penalized fit with lambda chosen by cv.glmnet
# (lambda.1se). Despite the "lasso" names, alpha = 0 selects the ridge penalty.
#  lasso.model.cv_1 <- cv.glmnet(x = Data_s, y = Y_1s, family = "binomial", alpha = 0, standardize = FALSE)
#  lasso.model.cv_2 <- cv.glmnet(x = Data_s, y = Y_2s, family = "binomial", alpha = 0, standardize = FALSE)
#  lasso.model_1 <- glmnet(x = Data_s, y = Y_1s, family = "binomial", lambda = lasso.model.cv_1$lambda.1se, alpha = 0, standardize = FALSE)
#  lasso.model_2 <- glmnet(x = Data_s, y = Y_2s, family = "binomial", lambda = lasso.model.cv_2$lambda.1se, alpha = 0, standardize = FALSE)
  
  
# No ridge
# lambda = 0 switches the penalty off, so these are unpenalized binomial fits.
lasso.model_1 <- glmnet(x = Data_s, y = Y_1s, family = "binomial", lambda =0, alpha = 0, standardize = FALSE)
lasso.model_2 <- glmnet(x = Data_s, y = Y_2s, family = "binomial", lambda =0, alpha = 0, standardize = FALSE)
  
  # Each p_* below is the inverse logit exp(eta)/(1+exp(eta)) of the linear
  # predictor eta = beta %*% row + a0.
  ## Model 1 (response Y_1) evaluated at the observed row NO1
  p_11<-exp(as.numeric(lasso.model_1$beta)%*%NO1+lasso.model_1$a0)/(1+exp(as.numeric(lasso.model_1$beta)%*%NO1+lasso.model_1$a0))
  ## Model 1 (response Y_1) evaluated at CNO1_0 (Situation 0)
  p_10<-exp(as.numeric(lasso.model_1$beta)%*%CNO1_0+lasso.model_1$a0)/(1+exp(as.numeric(lasso.model_1$beta)%*%CNO1_0+lasso.model_1$a0))
  ## Model 1 (response Y_1) evaluated at CNO1_2 (Situation 2); not used below
  p_12<-exp(as.numeric(lasso.model_1$beta)%*%CNO1_2+lasso.model_1$a0)/(1+exp(as.numeric(lasso.model_1$beta)%*%CNO1_2+lasso.model_1$a0))
  
  ## Model 2 (response Y_2) evaluated at the observed row NO1
  p_21<-exp(as.numeric(lasso.model_2$beta)%*%NO1+lasso.model_2$a0)/(1+exp(as.numeric(lasso.model_2$beta)%*%NO1+lasso.model_2$a0))
  ## Model 2 (response Y_2) evaluated at CNO1_0 (Situation 0); not used below
  p_20<-exp(as.numeric(lasso.model_2$beta)%*%CNO1_0+lasso.model_2$a0)/(1+exp(as.numeric(lasso.model_2$beta)%*%CNO1_0+lasso.model_2$a0))
  ## Model 2 (response Y_2) evaluated at CNO1_2 (Situation 2)
  p_22<-exp(as.numeric(lasso.model_2$beta)%*%CNO1_2+lasso.model_2$a0)/(1+exp(as.numeric(lasso.model_2$beta)%*%CNO1_2+lasso.model_2$a0))
  
  #### PNS, PN and PS for threshold y2, contrasting the observed row with Situation 2
  # All three share the numerator max(p_21 - p_22, 0); PN divides it by
  # (1 - p_22) and PS divides it by p_21.
  PNS1[boot]<-max(p_21-p_22,0)
  PN1[boot]<-max(p_21-p_22,0)/(1-p_22)
  PS1[boot]<-max(p_21-p_22,0)/p_21
  
  #### PNS with two thresholds (y1, y2) across Situation 0, the observed row and Situation 2
  PNS2[boot]<-max(min(p_21,p_10)-max(p_22,p_11),0)
  
}


# Summaries over the iterations: mean and the 2.5% / 97.5% quantiles.
# NOTE(review): no na.rm is passed, so an NA/NaN in any iteration propagates
# to mean() -- confirm how NA results were handled for the reported values.
mean(PNS1)
quantile(PNS1,0.025)
quantile(PNS1,0.975)

mean(PN1)
quantile(PN1,0.025)
quantile(PN1,0.975)

mean(PS1)
quantile(PS1,0.025)
quantile(PS1,0.975)

mean(PNS2)
quantile(PNS2,0.025)
quantile(PNS2,0.975)

\end{lstlisting}

\end{comment}