%\subsection{Additional Information of Experiments}

\label{appG}


In this section, we give detailed information about the settings of  the experiments and  additional experimental results.

{We note that the choice of the reference point $z_0$ does not affect the consistency results or rate of convergence, but it may affect the variance of the estimator. In our experiments, we take the minimum value of $Z$ as a standard reference point $z_0$. The choice of the reference point $z_0$ did not affect the standard deviation of the estimators much in our experiments.}


\subsection{Detailed settings of experiments}

We present detailed settings of numerical experiments in the following.
%to demonstrate the performance of the proposed P-CAPCE, sieve CAPCE,  and RKHS CAPCE estimators. \jin{Detailed settings are  in Appendix G.} 
 
%{\bf Baselines.} We compare with the most widely used methods PTSLS (parametric), NTSLS (sieve), and Kernel IV. These methods compute $\mathbb{E}[Y_{x}|{w}]$ which we differentiate to compute CAPCE  $\mathbb{E}[\partial_x Y_{x}|{w}]$.\\
%Additional information shown in Appendix.
%\subsection{Parametric Estimation}
%First, we compare the PTSLS and P-CAPCE estimator when $g_0$ is null in Eq. (\ref{EQ1}).\\
%{\bf SCM Settings.} We consider the following two SCMs:  $W:=U+E_1, X:=Z+W+U+E_2$, and 
%\begin{eqnarray}
%\label{eq-scm}
%\left\{
%\begin{array}{l}
%Y:=10X^2+WX+X+W+50(W^5+W^4+W^3+W^2)U+E_3\ \ \ \hspace*{\fill}\cdots\text{ (A)}\\Y:=\text{exp}(X)\text{exp}(W)+25(W^5+W^4+W^3+W^2)U+E_3\ \ \ \hspace*{\fill}\cdots\text{ (B)}\\
%\end{array}
%\right..
%\end{eqnarray}
%We use setting (A) as a parametric setting and setting (B) as a nonparametric setting. 
% Values of $Z$, $U$, $E_1$, $E_2$, and $E_3$ are   sampled i.i.d. from a uniform distribution $U[-1,1]$.
%True CAPCE  is $20x+w+1$ in setting (A) and $\text{exp}(x)\text{exp}(w)$ in setting (B). %The sample size are $N=1000$ and $N=10000$.

{\bf Setting of P-CAPCE  and PTSLS.} We learn the conditional expectations of basis functions
$\mathbb{E}[Y|Z=z]$, $\mathbb{E}[X|Z=z]$, $\mathbb{E}[WX|Z=z]$ and $\mathbb{E}[X^2|Z=z]$
by the nonlinear model, 
%\begin{eqnarray}
    $b_0+ b_1Z+b_2Z^2$.
%\end{eqnarray}
We used the basis terms $\{1,W,X\}$ for P-CAPCE and $\{1,W,X,WX,X^2\}$ for PTSLS, which match setting (A), and let $z_0=-1$.
%We regularize the matrix $\displaystyle \hat{\bf G}^T \hat{\bf G}$ by adding $0.001 {\bf I}$ for PTSLS estimator and $0.1 {\bf I}$ for P-CAPCE estimator, where ${\bf I}$ is an identity matrix of size $M$.
The regularization value is selected from $\{1,10^{-1},10^{-2},10^{-3}\}$ based on the test error.
%The results of the test errors are shown in Table 1.

{\bf Setting of NTSLS and sieve CAPCE.} We learn the conditional expectations by the nonlinear model, 
%\begin{eqnarray}
    $b_0+ b_1Z+b_2Z^2+b_3Z^3$.
%\end{eqnarray}
We consider the basis terms $h_p(X)h_q(W)$ for $p=0,1,2$ and $q=0,1,2$, where $h_p$ denotes the Hermite polynomials ($h_0(t)=1$, $h_1(t)=t$, $h_2(t)=t^2-1$ and $h_3(t)=t^3-3t$), and let $z_0=-1$.
We set $\kappa=2$ and {$l=1$}, and we calculate $\hat{\Lambda}$ by Monte Carlo integration with $(x,w)$ sampled from the uniform distribution $U(-4,4) \times U(-2,2)$, where $\Omega_X \subseteq [-4,4]$ and $\Omega_W \subseteq [-2,2]$. The regularization value is selected from $\{1,10^{-1},10^{-2},10^{-3}\}$ based on the test error.
%We regularize the matrix $\displaystyle \hat{\bf G}^T \hat{\bf G}$ by adding $10^{-2} \hat{\Lambda}$.
%In addition, we give an experiment using multivariate linear basis function $\{1,W,X\}$, which is a minimal basis function to build CAPCE.
%Results of the test errors are shown in Table 5.
We estimate CAPCE via differentiating estimated $\mathbb{E}[Y_{x}|{W}={w}]$.
%{\bf Setting of sieve NTSLS estimator.} We learn $\mathbb{E}[Y|Z=z], \mathbb{E}[h_p(X)h_q(W)|Z=z]$ for any $p=0,1,2,3$, $q=0,1,2,3$ and $q=0,1$ by the nonlinear model, 
%\begin{eqnarray}
%    $b_0+ b_1Z+b_2Z^2+b_3Z^3$.
%\end{eqnarray}
%where $h_0(t)=1$, $h_1(t)=t$, $h_2(t)=t^2-1$ and $h_3(t)=t^3-3t$.
%Multivariate linear basis function are $\{1,W,X,WX,X^2\}$.
%In this situation, the function $f_Y^2$ is mis-specified.
%Let $\kappa=2$, and we calculate $\hat{\Lambda}$ by Monte Carlo integration using uniform distridution $(x,w)=(U(-4,4),U(-2,2))$.
%Regularize value is determined by test error from $\{1,10^{-1},10^{-2},10^{-3},\ldots\}$.
%We regularize the matrix $\displaystyle \hat{\bf G}^T \hat{\bf G}$ by adding $10^{-3} \hat{\Lambda}$.
%We estimate CAPCE via differentiating estimated $\mathbb{E}[Y_{x}|{W}={w}]$. \jin{Explain why NTSLS uses different settings than S-CAPCE.}
%Results of the test errors are shown in Table 6.\\


{\bf Setting of kernel IV and RKHS CAPCE estimator.} We use the polynomial kernel functions $k_Z(z,z')=(z^Tz'+C_1)^{C_2}$ and $k_{X,{W}}((x,{w}),(x',{w}'))=((x,{w})(x',{w}')^T+C_3)^{C_4}$.
We select the kernel parameters $(C_1,C_2)$ and $(C_3,C_4)$ from $\{1,2,3,4,5\} \times \{1,2,3,4,5\}$, respectively.
%, and determined $(\zeta_1,\zeta_2)=(4,5)$ by test error.
We select the regularization values $\lambda_1$ and $\lambda_2$ from $\{1,10^{-1},10^{-2},10^{-3}\}$, respectively, and $(\lambda_3,\xi)$ is selected from the Cartesian product $\{100,10,1\} \times \{100,10,1\}$. 
%Then, we determine $(\lambda_1,\lambda_2,\lambda_3,\xi)=(0.01,0.01,1,100)$.\\
%{\bf Setting of PTSLS estimator.} We learn $\mathbb{E}[Y|Z=z]$, $\mathbb{E}[W|Z=z]$, $\mathbb{E}[X|Z=z]$, $\mathbb{E}[WX|Z=z]$ and $\mathbb{E}[X^2|Z=z]$ by the nonlinear model, 
%\begin{eqnarray}
%    $b_0+ b_1Z+b_2Z^2$.
%\end{eqnarray}
%We consider the following terms, $\{1,W,X,WX,X^2\}$ to build model of $\mathbb{E}[Y_{x}|{W}={w}]$.
%We regularize the matrix $\displaystyle \hat{\bf G}^T \hat{\bf G}$ by adding $0.1 {\bf I}$.
%Regularize value is determined by test error from $\{1,10^{-1},10^{-2},10^{-3},\ldots\}$.
%We estimate CAPCE via differentiating estimated $\mathbb{E}[Y_{x}|{W}={w}]$. \jin{The settings have a lot of overlap, no need to repeat. Write a single Settings paragraph.} 
%Results of the test errors are shown in Table 3.\\

\begin{comment}
{\bf Results.}
\jin{Show summary results of all estimators in a Table.}
The means of coefficient by $100$ time simulations of PTSLS and P-CAPCE estimators are shown in Table \ref{tab:TAB1}.% \ref{tab:PNUM_EXMP1} and \ref{tab:PNUM_EXMP2}.
The mean of test error of each estimator by $100$ time simulations are shown in Table \ref{tab:TAB2}.
We note that TSLS (PTSLS and NTSLS) and CAPCE estimators (parametric, sieve and RKHS) have different risk functions.
\yuta{The estimator of coefficients by P-CAPCE and PTSLS have large SD when $N=1000$, shown in Appendix.}
The means of coefficients of P-CAPCE estimators are closer to true coefficients than PTSLS; on the other hand, PTSLS is biased largely due to the violation of the separability when $N=10000$.
%, $f_Y(X,{\boldsymbol W},{\boldsymbol H},{\boldsymbol u}_Y)=f_Y^1(X,{\boldsymbol W},{\boldsymbol u}_Y)+f_Y^2({\boldsymbol H},{\boldsymbol u}_Y)$.
We plotted the true and estimated CAPCE curve given $w=1$ in Figure \ref{fig:FIG02}.
We plotted the true CAPCE surface and estimated CAPCE and estimated PTSLS surface of the setting (A) in Figure \ref{fig:FIG2}.
The true surface and estimated surfaces of the sieve NTSLS estimator, sieve CAPCE estimator, and RKHS estimator of the setting (B) are shown in Figure \ref{fig:FIG22}.
The sieve and RKHS CAPCE surface is closer to the true CAPCE surface than NTSLS.

By the experiments' results, we show that our proposed methods (P-CAPCE estimator, sieve CAPCE estimator, and RKHS estimator) are superior to the previous works (PTSLS and sieve NTSLS) in terms of unbiasedness.
In the setting (A), all CAPCE estimators are almost the same MSE; on the other hand, sieve and RKHS CAPCE estimators are superior to P-CAPCE estimator in the setting (B).
The RKHS CAPCE estimator requires much computational time and tuning a lot of regularization parameters.
Sieve CAPCE estimator sometimes requires so many basis functions if the tuple $(X,{\boldsymbol W})$ is high dimensional.

\end{comment}

\begin{comment}
%\subsection{Nonparametric Estimation}
%Next, we compare the sieve NTSLS, sieve and RKHS CAPCE estimator when ${\boldsymbol \beta}$ is null in Eq. (\ref{EQ1}).\\
%{\bf SCM Settings.} We consider the following two SCM:
%\begin{eqnarray}
%\label{eq-scm}
%\left\{
%\begin{array}{l}
%    W:=U+E_1,\ \ \ X:=Z+W+U+E_2\\
%   Y:=\text{exp}(X)\text{exp}%(W)+25(W^5+W^4+W^3+W^2)U+E_3
%\end{array}
%\right..
%\end{eqnarray}
%Each realized the value of $Z$, $U$, $E_1$, $E_2$ and $E_3$ are i.i.d. and sampled from a uniform distribution $U[-1,1]$.
True CAPCE $\mathbb{E}[Y_{x}|{W}={w}]$ is $\text{exp}(x)\text{exp}(w)$, and the sample size are $N=10000$.\\
%{\bf Setting of P-CAPCE estimator and PTSLS estimator.} We learn $\mathbb{E}[Y|Z=z]$, $\mathbb{E}[X|Z=z]$, $\mathbb{E}[WX|Z=z]$ and $\mathbb{E}[X^2|Z=z]$ by the nonlinear model, 
%\begin{eqnarray}
%    $b_0+ b_1Z+b_2Z^2$.
%\end{eqnarray}
%We consider the following basis terms, $\{1,W,X\}$ for P-CAPCE model, $\{1,W,X,WX,X^2\}$ for PTSLS model , and let $z_0=-1$.
%We regularize the matrix $\displaystyle \hat{\bf G}^T \hat{\bf G}$ by adding $0.001 {\bf I}$ for PTSLS estimator and $0.1 {\bf I}$ for P-CAPCE estimator, where ${\bf I}$ is an identity matrix of size $M$.
%Regularize value is determined by test error from $\{1,10^{-1},10^{-2},10^{-3},\ldots\}$.
%The results of the test errors are shown in Table 1.
%We estimate CAPCE via differentiating estimated $\mathbb{E}[Y_{x}|{W}={w}]$.\\
{\bf Setting of sieve CAPCE estimator.} We learn $\mathbb{E}[Y|Z=z], \mathbb{E}[h_p(X)h_q(W)|Z=z]$ for any $p=0,1,2$ and $q=0,1,2$ by the nonlinear model, 
%\begin{eqnarray}
    $b_0+ b_1Z+b_2Z^2+b_3Z^3$,
%\end{eqnarray}
where $h_p$ is Hermite polynomial functions ($h_0(t)=1$, $h_1(t)=t$, $h_2(t)=t^2-1$ and $h_3(t)=t^3-3t$), and let $z_0=-1$.
Let $\kappa=2$, and we calculate $\hat{\Lambda}$ by Monte Carlo integration \citep{Kroese2011} using uniform distridution $(x,w)=(U(-4,4),U(-2,2))$, where $\Omega_X \subseteq [-4,4]$ and $\Omega_X \subseteq [-2,2]$.
Regularize value is determined by test error from $\{1,10^{-1},10^{-2},10^{-3},\ldots\}$.
We regularize the matrix $\displaystyle \hat{\bf G}^T \hat{\bf G}$ by adding $10^{-2} \hat{\Lambda}$.
%In addition, we give an experiment using multivariate linear basis function $\{1,W,X\}$, which is a minimal basis function to build CAPCE.
%Results of the test errors are shown in Table 5.
We estimate CAPCE via differentiating estimated $\mathbb{E}[Y_{x}|{W}={w}]$.\\
%{\bf Setting of sieve NTSLS estimator.} We learn $\mathbb{E}[Y|Z=z], \mathbb{E}[h_p(X)h_q(W)|Z=z]$ for any $p=0,1,2,3$, $q=0,1,2,3$ and $q=0,1$ by the nonlinear model, 
%\begin{eqnarray}
%    $b_0+ b_1Z+b_2Z^2+b_3Z^3$.
%\end{eqnarray}
%where $h_0(t)=1$, $h_1(t)=t$, $h_2(t)=t^2-1$ and $h_3(t)=t^3-3t$.
%Multivariate linear basis function are $\{1,W,X,WX,X^2\}$.
%In this situation, the function $f_Y^2$ is mis-specified.
%Let $\kappa=2$, and we calculate $\hat{\Lambda}$ by Monte Carlo integration using uniform distridution $(x,w)=(U(-4,4),U(-2,2))$.
%Regularize value is determined by test error from $\{1,10^{-1},10^{-2},10^{-3},\ldots\}$.
%We regularize the matrix $\displaystyle \hat{\bf G}^T \hat{\bf G}$ by adding $10^{-3} \hat{\Lambda}$.
%We estimate CAPCE via differentiating estimated $\mathbb{E}[Y_{x}|{W}={w}]$. \jin{Explain why NTSLS uses different settings than S-CAPCE.}
%Results of the test errors are shown in Table 6.\\
{\bf Setting of RKHS CAPCE estimator.} We use polynomial kernel function $k_Z(z,z')=(z^Tz'+\zeta_1)^{\zeta_2}$, and we determined $(\zeta_1,\zeta_2)=(4,5)$.
We select the regularize values $\lambda_1,\lambda_2$ from $\{1,0.1,0.01,\ldots\}$, respectively, and $(\lambda_3,\xi)$ is from cartesian product $\{100,10,1\} \times \{100,10,1\}$ by Algorithm \ref{ALG2}. 
Then, we determine $(\lambda_1,\lambda_2,\lambda_3,\xi)=(0.01,0.01,1,100)$.\\

{\bf Results.} 
The true surface and estimated surfaces of the sieve NTSLS estimator, sieve CAPCE estimator, and RKHS estimator are shown in Figure \ref{fig:FIG22}.
We plotted the surfaces in the range of $-2 \leq x \leq 2$ and $-1 \leq w \leq 1$ since the edge of the domain of all nonparametric estimators is unstable.
The sieve and RKHS CAPCE surfaces are closer to the true CAPCE surface, and the sieve NTSLS surface is largely biased. \jin{Is there a numerical performance measure for function estimation that can be computed, e.g. root mean squared error (RMSE) or variants used in Machine learning for regression performance? Then a summary results table could be presented. }

\end{comment}




\begin{comment}
\begin{table}[H]
\caption{Basic statistics of the test error of the CAPCE estimator over 1000 runs for regularization value ($N=1000$); the bold number is the smallest.}
\centering
\label{tab:TEST1}

\begin{tabular}{l|ccccc}
\hline
$\lambda$  & 1 & 0.1 & 0.01 &0.001 &0.0001\\
\hline \hline
Min.   & 14697     & 9625      & 3645      & 12107     & 624       \\
1st Qu.    & 1142891   & 706462    & 613128    & 957617    & 889920    \\
Median & 2581357   & 1935108   & 1946924   & 1720578   & 2562135   \\
3rd Qu.    & 5944603   & 6159807   & 4679010   & 5361448   & 6646507   \\
Max.   & 30939470  & 26625863  & 22605166  & 29466366  & 19800472  \\
\hline
Mean   & 4690293   & 4402619   & 3888198   & {\bf 3887842}   & 4187281   \\
SD     & 5725131.0 & 5355639.0 & 4880814.0 & 5250446.0 & 4508818.0 \\
\hline
\end{tabular}
\end{table}
\end{comment}


\subsection{Additional information on experimental results in the body of the paper}
%We give additional  information on experiments. 
{\textbf{Results: Parametric setting (A).} The basic statistics of the coefficients estimated by 
PTSLS and P-CAPCE over $100$ simulation runs are shown in Tables~\ref{tab:PNUM_EXMP1} and~\ref{tab:PNUM_EXMP2}. 
These tables supplement  Table 1 in the paper. The true and estimated CAPCE surfaces over $(X, W)$ are shown in Fig.~\ref{fig:FIG2}.}


{\textbf{Results: Nonparametric setting (B).} The true and estimated CAPCE surfaces over $(X, W)$ are shown in Fig.~\ref{fig:FIG22}.}


\begin{table}[H]
\centering
\caption{Basic statistics of the P-CAPCE estimator over 1000 runs when $N=1000$ and $N=10000$ in setting (A).
\vspace{0cm}}
\label{tab:PNUM_EXMP1}
\renewcommand{\arraystretch}{1.1}
\begin{minipage}[c]{0.45\textwidth}
\centering
\begin{tabular}{l|ccc}
\hline
   $N=1000$      & $1$ &$W$ &$X$ \\
   \hline
   True Coeff. & 1 & 1 & 20\\
         \hline \hline
Min.    & -51.515 & -18.715 & -116.480 \\
1st Qu. & -10.044 & 0.160   & -10.809  \\
Median  & -1.849  & 3.035   & 17.691   \\
3rd Qu. & 7.926   & 12.239  & 50.007   \\
Max.    & 40.458  & 109.791 & 213.306  \\
\hline
Mean    & -1.651  & 10.383  & 19.293   \\
SD      & 14.707  & 22.309  & 50.957   \\
\hline
\end{tabular}
\end{minipage}
\hspace{1cm}
\begin{minipage}[c]{0.45\textwidth}
\centering
\begin{tabular}{l|ccc}
\hline
   $N=10000$      & $1$ &$W$ &$X$ \\
   \hline
   True Coeff. & 1 & 1 & 20\\
         \hline \hline
Min.    & -13.466 & -2.302 & -23.863 \\
1st Qu. & -2.324  & -0.157 & 10.908  \\
Median  & 1.138   & 0.543  & 22.075  \\
3rd Qu. & 4.643   & 1.568  & 29.509  \\
Max.    & 14.988  & 11.017 & 59.559  \\
\hline
Mean    & 1.226   & 0.963  & 19.971  \\
SD      & 5.380   & 2.124  & 15.487 \\
\hline
\end{tabular}
\end{minipage}
\end{table}







%\subsection{NTSLS estimator}


\begin{comment}
\begin{table}[H]
\caption{Basic statistics of the test error of the NTSLS over 1000 runs for regularization value ($N=1000$); the bold number is the smallest.}
\centering
\label{tab:TEST2}

\begin{tabular}{l|ccc}
\hline
$\lambda$  & 1 & 0.1 & 0.01 \\
\hline \hline
Min.   & 15606279  & 13623674  & 14019980  \\
1st Qu.    & 20943014  & 20609263  & 21674532  \\
Median & 23919469  & 23994604  & 24633018  \\
3rd Qu.    & 27036646  & 27329930  & 28037611  \\
Max.   & 38088863  & 40235204  & 41456719  \\
\hline
Mean   & 24258777  & {\bf 24218756}  & 25204835  \\
SD     & 4837954.0 & 4749243.0 & 5104092.0 \\
\hline
\end{tabular}
\end{table}
\end{comment}


\begin{table}[H]
\centering
\caption{Basic statistics of the PTSLS estimator over 1000 runs when $N=1000$ and $N=10000$ in setting (A).
\vspace{0cm}}
\label{tab:PNUM_EXMP2}
\renewcommand{\arraystretch}{1.1}
\begin{minipage}[c]{0.45\textwidth}
\centering
\begin{tabular}{l|ccc}
\hline
   $N=1000$      & $1$ &$W$ &$X$ \\
   \hline
   True Coeff. & 1 & 1 & 20\\
         \hline \hline
Min.    & -33.368 & 2.971   & -113.509 \\
1st Qu. & -4.258  & 28.662  & 0.518    \\
Median  & 2.785   & 45.497  & 28.629   \\
3rd Qu. & 7.617   & 62.155  & 61.569   \\
Max.    & 26.799  & 161.738 & 138.283  \\
\hline
Mean    & 1.248   & 50.032  & 27.862   \\
SD      & 11.374  & 29.523  & 46.388    \\
\hline
\end{tabular}
\end{minipage}
\hspace{1cm}
\begin{minipage}[c]{0.45\textwidth}
\centering
\begin{tabular}{l|ccc}
\hline
   $N=10000$      & $1$ &$W$ &$X$\\
   \hline
   True Coeff. & 1 & 1 & 20\\
         \hline \hline
Min.    & -12.117 & 30.794 & -20.407 \\
1st Qu. & -2.336  & 45.907 & 9.404   \\
Median  & 1.704   & 50.716 & 19.347  \\
3rd Qu. & 4.494   & 57.017 & 30.498  \\
Max.    & 8.952   & 78.573 & 54.494  \\
\hline
Mean    & 1.101   & 51.181 & 19.763  \\
SD      & 4.638   & 8.814  & 15.171  \\
\hline
\end{tabular}
\end{minipage}
\end{table}



\begin{comment}
\newpage
\section{Experiment: Additional Information of Nonparametric Settings}




\begin{table}[H]
\caption{Basic statistics of the test error of the sieve CAPCE estimator over 1000 runs for regularization value ($N=1000$); the bold number is the smallest.}
\centering
\label{tab:TESTN1}

\begin{tabular}{l|cccc}
\hline
$\lambda$  & 1 & 0.1 & 0.01 & 0.001 \\
\hline \hline
Min.   & 30749     & 17490     & 11666     & 1162    \\
1st Qu.    & 393222    & 267892    & 163843    & 213469  \\
Median & 868635    & 785864    & 459062    & 653862  \\
3rd Qu.    & 2128704   & 1850865   & 1193130   & 1419073 \\
Max.   & 11915998  & 10501820  & 6207421   & 9983759 \\
\hline
Mean   & 1637283   & 1334405   & {\bf 943600}    & 1255112 \\
SD     & 2209637.0 & 1693960.0 & 1263695.0 & 1732494\\
\hline
\end{tabular}
\end{table}



\begin{table}[H]
\caption{Basic statistics of the test error of the NTSLS over 1000 runs for regularization value ($N=10000$); the bold number is the smallest.}
\centering
\label{tab:TESTN2}

\begin{tabular}{l|ccccc}
\hline
$\lambda$  & 1 & 0.1 & 0.01 & 0.001 & 0.0001\\
\hline \hline
Min.   & 21830    & 20971    & 13734    & 19512    & 24647    \\
1st Qu.   & 742515   & 223184   & 178707   & 140371   & 153036   \\
Median & 1051622  & 431384   & 325818   & 277296   & 239295   \\
3rd Qu.   & 1664026  & 655220   & 468745   & 413653   & 406530   \\
Max.   & 3692342  & 1776898  & 1911188  & 1080841  & 1160372  \\
\hline
Mean   & 1238307  & 496540   & 373658   & {\bf 312570}   & 327906   \\
SD     & 758360.0 & 356171.3 & 297606.8 & 227955.3 & 261267.5 \\
\hline
\end{tabular}
\end{table}





\begin{table}[H]
\caption{Basic statistics of the test error of $\lambda_1$ of the RKHS CAPCE estimator over 10 runs for regularization value ($N=100$); the bold number is the smallest.}
\centering
\label{tab:TESTN1}

\begin{tabular}{l|cccc}
\hline
$\lambda$  & 1 & 0.1 & 0.01 & 0.001 \\
\hline \hline
Min.    & 353   & 363.2 & 334.9 & 345.7 \\
1st Qu. & 374.9 & 372.6 & 353.7 & 366.8 \\
Median  & 386.1 & 384   & 366.5 & 387.3 \\
3rd Qu. & 407.4 & 397.4 & 371.2 & 406.6 \\
Max.    & 432   & 432.6 & 409.5 & 414.9 \\
\hline
Mean    & 392.2 & 387.8 & {\bf 365.8} & 385.6 \\
SD      & 26.5  & 20.3  & 22.0  & 24.1  \\
\hline
\end{tabular}
\end{table}




\begin{table}[H]
\caption{Basic statistics of the test error of $\lambda_2$ of the RKHS CAPCE estimator over 10 runs for regularization value ($N=100$); the bold number is the smallest.}
\centering
\label{tab:TESTN1}

\begin{tabular}{l|cccc}
\hline
$\lambda$  & 1 & 0.1 & 0.01 & 0.001 \\
\hline \hline
Min.    & 893   & 1053  & 1000  & 797.7  \\
1st Qu. & 1261  & 1141  & 1028  & 1220.9 \\
Median  & 1476  & 1306  & 1144  & 1259.5 \\
3rd Qu. & 1581  & 1457  & 1246  & 1475.1 \\
Max.    & 2189  & 1986  & 1545  & 1650.9 \\
\hline
Mean    & 1466  & 1384  & {\bf 1169}  & 1277.4 \\
SD      & 361.5 & 322.8 & 170.2 & 261.3  \\
\hline
\end{tabular}
\end{table}



\begin{table}[H]
\caption{Basic statistics of the test error of $(\xi,\lambda_3)$ of the RKHS CAPCE estimator over 10 runs for regularization value ($N=100$); the bold number is the smallest.}
\centering
\label{tab:TESTN1}

\begin{tabular}{l|ccccccccc}
\hline
$(\xi,\lambda_3)$  & (100,100))& (100,10) & (100,1) & (10,100))& (10,10) & (10,1) & (1,100))& (1,10) & (1,1) \\
\hline \hline
Min.    & 763    & 728.2  & 448.2  & 544.2  & 711.9  & 527.9    & 801.7    & 863.2    & 779.5    \\
1st Qu. & 824.5  & 804.7  & 704.4  & 760.8  & 741.6  & 669.5    & 816      & 919.9    & 822.8    \\
Median  & 900.3  & 949.3  & 887.7  & 881.6  & 925.4  & 820.5    & 886.3    & 1059.9   & 875.3    \\
3rd Qu. & 974.1  & 1080   & 927.3  & 963.8  & 1036.5 & 1099.5   & 942.3    & 1312.3   & 962.5    \\
Max.    & 1575.5 & 1468.7 & 1022.8 & 1345.9 & 1826.6 & 1259.7   & 1132.3   & 1815.6   & 2006.3   \\
\hline
Mean    & 958.8  & 975.2  & {\bf 810.4}  & 887.5  & 998.7  & 871.4    & 903.7    & 1159.9   & 998.1    \\
SD      & 234.1  & 222.7  & 176.4  & 244.5  & 346.4  & 253.3599 & 104.5766 & 321.6026 & 365.5905 \\
\hline
\end{tabular}
\end{table}

\end{comment}


\input{Fig2_1}

\input{Fig2_2}
