\subsection{Proof of Proposition \ref{prop:mu-sigma-def}}
We also refer to \citep[Appendix A]{dai2023quantum} for the proof.

To emphasize that Proposition \ref{prop:mu-sigma-def} holds for any weights and any sequence $x_1, x_2, \cdots$,
we prove the following.
\begin{prop}
    \label{prop:mu-sigma-def}
    Let $n \in \ZZ_{\ge 1}$, $x_1, \dots, x_n \in \cX$, $\omega_1, \dots, \omega_n > 0$,
    $y_1, \dots, y_n \in \RR$.
    Define a self-adjoint operator $\cS: \cH_k \rightarrow \cH_k$ as 
    $\cS = \reg 1 + \sum_{i=1}^{n}\omega_i \phi(x_i)\phi(x_i)^\trn$.
    We put $Y_n = (y_1, \cdots, y_n)^\top \in \RR^n$,
    $\bomega = \diag(\omega_1, \dots, \omega_n)$,
    and define $K \in \RR^{n\times n}$ as $K_{ij} = k(x_i, x_j)$.
    Then for any $x \in \cX$, we have 
    \begin{align*}
       & \phi(x)^\trn \cS^{-1} \sum_{i=1}^{n} \omega_i y_i \phi(x_i) =  k(x)^\trn (\reg I_n + \bomega K)^{-1}\bomega Y_n ,\\
       & \reg\| \phi(x)\|_{\cS^{-1}}^2 = k(x, x) - k(x)^\trn (\reg I_n + \bomega K)^{-1} \bomega k(x).
    \end{align*}
    Here, $k(x) \in \RR^{n}$ is a column vector defined by $(k(x))_i = k(x, x_i)$ for $1 \le i \le n$.
\end{prop}

\begin{proof}
    Let $x \in \cX$.
    % For simplicity, we assume that $x_1, x_2, \dots, x_n, x$ are pairwise distinct 
    % (as we will see shortly the statements of the proposition hold even if this assumption is not satisfied).
    % Define $\cG \subseteq \cH_k$ as the subspace generated by $\phi(x_1), \dots, \phi(x_n)$
    % and $\cG'$ as the subspace generated by $\cG$ and $\phi(x)$.
    % We note that by the assumption and since $k$ is positive definite, 
    % $\cB = \{\phi(x_1), \dots, \phi(x_n)\}$ is a basis of $\cG$ and 
    % $\cB' = \{\phi(x_1), \dots, \phi(x_n), \phi(x)\}$ is a basis of $\cG'$.
    % By definition, we see that $\cS(\cG) = \cG$ and $\cS(\cG') = \cG'$.
    Since for $1\le i \le n$ ,
    \begin{equation*}
        \cS \phi(x_i) = \reg \phi(x_i) + \sum_{j} \omega_jk(x_i, x_j) \phi(x_j) 
        = \sum_{j}( \reg \delta_{ij} + \omega_j k(x_i, x_j))\phi(x_j),
    \end{equation*}
    we have 
    \begin{equation*}
        \left(\cS \phi(x_1), \cdots, \cS \phi(x_n)\right)
            =
        \left( 
        \phi(x_1),\cdots, \phi(x_n)
        \right)
        (\reg I_n + \bomega K).
    \end{equation*}
    % the matrix representation of $\cS|_{\cG}$ with respect to the basis $\cB$ is given as $\reg I_n + \bomega K$.
    Thus, we see that $\cS \sum_{i}a_i \phi(x_i) = \sum_{i} \omega_i y_i \phi(x_i)$,
    where $a \in \RR^{n}$ is given as 
    $(\reg I_n + \bomega K)^{-1} \bomega Y_n $.
    Therefore, we have the first statement of the proposition by the reproducing property.

    Similarly, we have the following equality:
    \begin{equation*}
            \left(\cS \phi(x_1),\  \cdots,\ \cS \phi(x_n),\ \cS \phi(x)\right)
        = 
        \left( \phi(x_1),\ \cdots, \phi(x_n),\ \phi(x) \right)     
        \begin{pmatrix}
            \reg I_n + \bomega K & \bomega k(x)\\
            0 & \reg
        \end{pmatrix}.
    \end{equation*}
    Define $b \in \RR^n$ by $(\reg I_n + \bomega K)^{-1}\bomega k(x)$.
    Then, 
    \begin{align*}
        \left(\cS \phi(x_1),\  \cdots,\ \cS \phi(x_n),\ \cS \phi(x)\right)
        \begin{pmatrix}
            - b \\ 1
        \end{pmatrix}
        &= 
        \left( \phi(x_1),\ \cdots, \phi(x_n),\ \phi(x) \right)     
        \begin{pmatrix}
            \reg I_n + \bomega K & \bomega k(x)\\
            0 & \reg
        \end{pmatrix}
        \begin{pmatrix}
            - b \\ 1
        \end{pmatrix}\\
        &=\reg \phi(x).
    \end{align*}
    Thus, it follows that  
    \begin{equation*}
        \cS \left(\phi(x) - \sum_{i=1}^{n}b_i \phi(x_i) \right) = \reg \phi(x).
    \end{equation*}
    Therefore, we have the following.
    \begin{align*}
        \reg \|\phi(x)\|_{\cS^{-1}} ^2
        = \reg \phi(x)^\trn \cS^{-1}\phi(x)
        = \phi(x)^\trn \left( \phi(x) - \sum_{i=1}^n b_i \phi(x_i)\right)
        = k(x, x) - k(x)^\trn b.
    \end{align*}
    Here, the last equality holds from the reproducing property.
    This completes the proof.
\end{proof}

\subsection{Proof of Proposition \ref{prop:conf-bd}}
% \begin{lem}
%     \label{lem:trace-bd}
%     For $s\in \ZZ_{\ge 1}$, we have the following inequality:
%     \begin{equation*}
%         \Tr \left( \id -\lambda V_{s}^{-1} \right) \le s \log 2.
%     \end{equation*}
% \end{lem}
% \begin{proof}
%     We let $V_s' := \lambda^{-1}V_{s}$. Then, we note that $V_s'$ is positive-definite and 
%     $ V_{s}' \succeq \id$.
%     By \citep[Lemma 12]{hazan2007logarithmic}, for symmetric matrices $A, B$ with $A \succeq B \succeq 0$, 
%     we have the following inequality:
%     \begin{equation*}
%         \Tr (A^{-1}(A - B)) \le \log \det A - \log \det B.
%     \end{equation*}
%     Therefore, it follows that:
%     \begin{equation*}
%         \Tr \left( \id - \lambda V_s^{-1}\right)  = 
%         \Tr \left\{(V_s')^{-1} \left(V_s' - \id \right)\right\}
%         \le \log \det V_s'.
%     \end{equation*}
%     By \eqref{eq:det-v_k-rec} and $V_0 = \lambda \id$, we see that $\log \det V_s' = s \log 2$.
%     This completes the proof.
% \end{proof}
For any $x\in \cX$, we have
\begin{equation*}
    |\mu(x) - \muw_s(x)|= |\phi(x)^\trn \theta^* - \phi(x)^\trn \tthat_s|
    \le \|\phi(x)\|_{V_s^{-1}}
    \left\| \theta^* - \tthat_s \right\|_{V_s}
    = \left\| \theta^* - \tthat_s \right\|_{V_s}\sigmaw_s(x).
\end{equation*}
Thus, Proposition \ref{prop:conf-bd} follows from the following lemma.
\begin{lem}
    \label{lem:theta-conf-bd} 
    Let $\totnst$ be the total number of stages of Algorithm \ref{alg:qmc-kernel-ucb}
    and assume that $\nstin \ge \totnst$.
    Then, with probability at least $1-\delta$, the following inequality holds for any $s = 1,\dots, m$:
    \begin{equation*}
        \left\| 
        \theta^* - \tthat_s 
        \right\|_{V_s} \le \beta_s. 
    \end{equation*}
    Here, $\beta_s =\sqrt{\reg}S + \tradeoff \sqrt{s}$.
\end{lem}
\begin{proof}
    This can be proved similarly to \citep[Lemma 3]{wan2023quantum}.
    However, since a naive application of their proof would lead to 
    a bound involving the dimension of the RKHS $\cH_k$,
    we bound $\left\|\theta^* - \tthat_s \right\|_{V_s}$ as follows.


    Define an event $\cE$ as 
    \begin{equation*}
        \cE = \left\{
        \left| \mu(x_s) - y_s\right| \le \varepsilon_s, \quad 1 \le s \le m
        \right\}.
    \end{equation*}
    Since there are $\totnst$ stages in Algorithm \ref{alg:qmc-kernel-ucb} and $\nstin \ge \totnst$,
    by taking a union bound, 
    \begin{equation*}
        P\left(\cE\right)
        \ge 1 - \frac{\totnst}{\nstin}\delta 
        \ge 1 - \delta.
    \end{equation*}
    In the rest of the proof, we assume that the event $\cE$ holds.
    By the same proof as \citep[Lemma 3]{wan2023quantum}, 
    i.e., by replacing $x_s$ by $\phi(x_s)$ in their proof,
    with probability at least $1 - \delta$, 
    we have 
    \begin{equation}
        \| \theta^* - \tthat_s \|_{V_s}
        \le \reg \|\theta^*\|_{V_s^{-1}}  + 
        \|  \Phi_s^\trn W_s^{1/2} \Gamma_s\|_{V_{s}^{-1}}.
        \label{eq:theta-conf-bd-lem}
        % \sqrt{
        % \Gamma_s^\trn W_s^{1/2} \Phi_s V_s^{-1} \Phi_s^\trn W_s^{1/2} \Gamma_s
        % }.
    \end{equation}
    Here, $\Gamma_s = W_s^{1/2} (\Phi_s \theta^* - Y_s) \in \RR^s$.
    % and $\Phi_s^\trn W_s^{1/2} \Gamma_s = \sum_{i=1}^{s} \epsilon_i^{-1}\gamma_i\phi(x_i)$.
    Then, by Lemma \ref{lem:qmc}, we have $\|\Gamma_s\|_\infty \le \tradeoff$.
    We note that $\Phi_s$ is a linear operator from $\cH_k$ to $\RR^s$ defined by 
    $\cH_k \ni f \mapsto (\phi(x_1)^\trn f, \cdots, \phi(x_s)^\trn f)=(f(x_1), \cdots, f(x_s)) \in \RR^s$.
    Similarly, $\Phi_s^\trn$ is a linear operator from $\RR^s$ to $\cH_k$ defined by
    $(a_i)_{1 \le i \le s} \mapsto \sum_{i=1}^{s}a_i \phi(x_i)$.
    Therefore, we note that $\Phi_s V_s^{-1} \Phi_s^\trn $ is a linear operator from $\RR^s \rightarrow \RR^s$, i.e., a matrix in $\RR^{s \times s}$.
    % Noting that the $i$-th entry of $\Gamma_s$ is given as $\epsilon_i^{-1}(\mu(x_i) - y_i)$,
    Since the trace norm is dual to the spectral norm with respect to the inner product of the space of symmetric matrices defined as
    $(A, B) \mapsto \Tr A B$, we have
    \begin{align*}
        \|  \Phi_s^\trn W_s^{1/2} \Gamma_s\|_{V_{s}^{-1}}^2
        &=\Gamma_s^\trn W_s^{1/2} \Phi_s V_s^{-1} \Phi_s^\trn W_s^{1/2} \Gamma_s \\
        &= \Tr \Gamma_s \Gamma_s^\trn W_s^{1/2} \Phi_s V_s^{-1} \Phi_s^\trn W_s^{1/2} \\
        &\le \Tr \left(\Gamma_s \Gamma_s^\trn\right)
        \sigma_{\mathrm{max}} \left(  W_s^{1/2} \Phi_s V_s^{-1} \Phi_s^\trn W_s^{1/2}\right) \\
        & \le \eta^2 s \ \sigma_{\mathrm{max}} \left(  W_s^{1/2} \Phi_s V_s^{-1} \Phi_s^\trn W_s^{1/2}\right). 
    \end{align*}
    Here, $\sigma_{\mathrm{max}} $ denotes the spectral norm and the last inequality follows from $\|\Gamma_s\|_\infty \le \tradeoff$. 
    We put $\tph_s = W_s^{1/2} \Phi_s$.
    Then, noting that 
    \begin{equation*}
    (\reg I + \tph_s^\trn \tph_s)\tph_s^\trn = \tph_s^\trn (\reg I + \tph_s \tph_s^\trn), 
    \end{equation*}
    we have the following (cf.\ \cite{valko2013finite}): 
    \begin{equation*}
        \tph_s^\trn  (\reg I + \tph_s \tph_s^\trn)^{-1}  =
        (\reg I + \tph_s^\trn \tph_s)^{-1}  \tph_s^\trn . 
    \end{equation*}
    Thus, we have
    \begin{align*}
        \sigma_{\mathrm{max}} \left( W_s^{1/2} \Phi_s V_s^{-1} \Phi_s^\trn W_s^{1/2}\right)   
        = \sigma_{\mathrm{max}}\left( \tph_s \left(\reg I + \tph_s^\trn  \tph_s\right)^{-1}\tph^\trn_s\right)
        = \sigma_{\mathrm{max}}\left( \tph_s  \tph_s^\trn  (\reg I + \tph_s \tph_s^\trn)^{-1}\right)
        \le 1.
    \end{align*}
    Therefore, we see that $\|  \Phi_s^\trn W_s^{1/2} \Gamma_s\|_{V_{s}^{-1}} \le \eta \sqrt{s}$.
    Noting that $\|\theta^*\|_{V_s^{-1}} \le \reg^{-1/2}\|\theta^*\|_{\cH_k}$, we have our assertion by \eqref{eq:theta-conf-bd-lem}.
\end{proof}

\subsection{Proof of Proposition \ref{prop:regret-using-m}}
\begin{proof}
    This can be proved by a standard argument for the analysis of UCB-type algorithms, 
    Lemma \ref{lem:qmc}, and Proposition \ref{prop:conf-bd}. 
    We let $\cE$ be an event on which the inequalities in Proposition \ref{prop:conf-bd} hold
    and assume that $\cE$ holds.
    Let $x^* = \argmax_{x \in \cX} \phi(x)^\trn \theta^*$.
    By definition of $x_s$ and Proposition \ref{prop:conf-bd}, we have 
    \begin{align*}
       \mu(x^*)  - \mu(x_s) 
       &\le \muw_{s-1}(x^*) + \beta_{s-1} \sigmaw_{s-1}(x^*) - \muw_{s-1}(x_s) + \beta_{s-1} \sigmaw_{s-1}(x_s)\\
       &\le 2 \beta_{s-1} \sigmaw_{s-1}(x_s) = 2\beta_{s-1}\epsilon_s.
    \end{align*}
    Thus, by Lemma \ref{lem:qmc}, the regret that the player incurs in the stage $s$ is at most 
    \begin{equation*}
        2\beta_{s-1} \epsilon_s \qmcubc\log(\nstin/\delta) \frac{1}{\tradeoff \epsilon_s} 
        = 2  \qmcubc (\sqrt{\reg}S \tradeoff^{-1} + \sqrt{s-1})\log(\nstin/\delta) 
        \le 2 \qmcubc (\sqrt{\reg}S \tradeoff^{-1} + \sqrt{m})  \log(\nstin/\delta).
    \end{equation*}
    Therefore, with probability at least $1-\delta$, the cumulative regret $R(T)$ is bounded as 
    \begin{equation*}
        R(T) 
            \le 
        2 \qmcubc m(\sqrt{\reg}S \tradeoff^{-1} + \sqrt{m})  \log(\nstin/\delta)
        = O(m (\tradeoff^{-1} + \sqrt{m})  \log(\nstin/\delta)).
    \end{equation*}
\end{proof}



% %TODO: fix this
% \subsection{Proofs in }
% \begin{lem}
%     \label{lem:gamma-ub}
%     \begin{equation}
%     \qinfgain\leq D\log\left(1+\frac{\Bar{k}}{D\reg}\sum_{s=1}^m\frac{1}{\epsilon_s^2}\right)+\frac{\delta_D}{\reg}\sum_{s=1}^m\frac{1}{\epsilon_s^2}
%     \end{equation}
% \end{lem}
% \begin{proof}
%     We define $k_P, k_O: \cX \times \cX \rightarrow \RR$ as 
%     \begin{equation*}
%         k_P(x, x') = \sum_{i=1}^D \lambda_i \psi_i(x) \psi_i(x'), 
%         \quad
%         k_O(x, x') =\sum_{i \in I, i > D} \lambda_i \psi_i(x) \psi_i(x') = k(x, x') - k_P(x, x').
%     \end{equation*}
%     We also define matrices $K, K_P, K_O, K', K_P', K_O' \in \RR^{m \times m}$ by
%     $K = (k(x_i, x_j))_{1\le i, j \le m}, K_P = (k_P(x_i, x_j))_{1\le i, j \le m}$,
%     $K_O = (k_O(x_i, x_j))_{1 \le i, j\le m}$, and 
%     $K' = W^{1/2}KW^{1/2}$, $K_P' = W^{1/2} K_PW^{1/2}$, $K_O' = W^{1/2} K_O W^{1/2}$.
%     Then, we decompose $\qinfgain$ as follows.
%     \begin{align}
%         \qinfgain =& \log \left(\det\left(I_m+\frac{1}{\reg}K'\right)\right) \notag \\
%         =& \log\left(\det\left(I_m+\frac{1}{\reg}\left(K'_P+K'_O\right)\right)\right) \notag \\
%         =& \log\det\left(\left(I_m+\frac{1}{\reg}K'_P\right)\left(I_m+\frac{1}{\reg}\left(I_m+\frac{1}{\reg}K'_P\right)^{-1}K'_O\right)\right) \notag \\
%         =&\log\det\left(I_m+\frac{1}{\reg}K'_p\right)
%         +\log\det\left(I_m+\frac{1}{\reg}\left(I_m+\frac{1}{\reg}K'_P\right)^{-1}K'_O\right)
%         \label{eq:gamma-decomp}
%     \end{align}
%     We first provide an upper bound of the first term.
%     We put $\Psi_D = (\psi_j(x_i))_{1 \le i \le m, 1\le j \le D} \in \RR^{m \times D}$ 
%     and $\Lambda_D = \diag(\lambda_1, \cdots, \lambda_D)$.
%     Then, by definition of $K'_P$, we have
%     \begin{equation*}
%         K'_P = W^{1/2}  \Psi_D \Lambda_D \Psi_D^\trn W^{1/2} .
%     \end{equation*}
%     By the Weinstein-Aronszajn identity, we have
%     \begin{equation*}
%     \det\left(I_D+\frac{1}{\reg}G \right)=\det\left(I_m+\frac{1}{\reg}K'_P\right),
%     \end{equation*}
%     where the matrix $G \in \RR^{D \times D}$ is defined as 
%     \begin{equation*}
%         G =\Lambda_D^{\frac{1}{2}}\Psi_{D}^\trn W \Psi_{D} \Lambda_{D}^{\frac{1}{2}}.
%     \end{equation*}
%     Noting that for any positive definite matrix $P \in \RR^{n \times n}$ ,
%     \begin{equation}
%     \label{eq:log-det-tr}
%     \log \det(P) \leq n \log\frac{\Tr(P)}{n},
%     \end{equation}
%     to bound the first term of \eqref{eq:gamma-decomp}, it is sufficient to bound the trace of $I_D+\frac{1}{\reg}G $.
%     Letting $\bpsi_D(x) \in \RR^{D}$ be a column vector defined as $(\bpsi_D(x))_i = \psi_i(x)$, 
%     we have
%     \begin{align*}
%     \Tr \left(I_{D}+\frac{1}{\reg}G_m\right)=& D+\frac{1}{\reg}\Tr \left( \Lambda_{D}^{\frac{1}{2}}\Psi_{D}^\trn W \Psi_{D} \Lambda_{D}^{\frac{1}{2}}\right) \\
%     =& D+\frac{1}{\reg} \Tr \left(\Lambda_{D}^{\frac{1}{2}} \left[ \sum_{i=1}^m \frac{1}{\epsilon^2_i} \bpsi_D (x_i)\bpsi_{D}^\trn (x_i) \right] \Lambda_{D}^{\frac{1}{2}}\right) \\
%     % =&  D+\frac{1}{\reg} \Tr \left(\sum_{s=1}^m \frac{1}{\epsilon^2_i}\Lambda_D^{\frac{1}{2}} \phi_D (x_i)\phi_D^\intercal (x_i) \Lambda_D^{\frac{1}{2}}\right) \\
%     % =& D+ \frac{1}{\reg} \sum_{s=1}^m \frac{1}{\epsilon^2_i} \Tr \left( \Lambda_D^{\frac{1}{2}} \phi_D (x_i)\phi_D^\intercal (x_i) \Lambda_D^{\frac{1}{2}} \right)\\
%     =& D+ \frac{1}{\reg} \sum_{i=1}^m \frac{1}{\epsilon^2_i}
%     \| \bpsi_D(x_i)\Lambda_D^{\frac{1}{2}} \|_2^{2} \\
%     \leq & D+\frac{\Bar{k}}{\reg}\sum_{s=1}^m\frac{1}{\epsilon_s^2}
%     \end{align*}
%     Here, the last inequality follows from
%     \begin{align*}
%         \| \bpsi_{D}(x)\Lambda_{D}^{\frac{1}{2}} \|_2^2 = \sum_{i=1}^{D} \lambda_i \psi_i^2(x)
%         \leq  \overline{k}.
%     \end{align*}
%     Thus, noting that \eqref{eq:log-det-tr}, we have 
%     \begin{align}
%         \log \det \left(
%             I_m + \frac{1}{\reg} K_P' 
%         \right) \notag &=
%         \log \det \left( 
%             I_D + \frac{1}{\reg}G
%         \right)\\
%         &\le D \log \left( 
%             \frac{\Tr \left(I_D + \frac{1}{\reg}G \right)}{D}
%         \right)
%         = D \log \left(
%             1 + \frac{m\overline{k}}{D\reg}\sum_{i=1}^m \frac{1}{\epsilon_i^2}
%          \right).
%     \end{align}
%     Next, we bound the second term of \eqref{eq:gamma-decomp}.
%     We let $\delta_D=\sum_{i\in I, i > D} \lambda_i\psibar^2$, where $\psibar > 0$ satisfies $\|\psi_i\|_{\infty}\le \psibar$ for all $i$.
%     Then, by definition of $k_o$, we have $k_o(x, x) = \sum_{ i \in I, i > D} \lambda_i \psi_i^2(x)\le \delta_D$.
%     Noting that $I_m + \frac{1}{\reg} K'_P$ is positive definite and its eigenvalues are greater than $1$,
%     we see that 
%     \begin{equation}
%     \Tr\left(\left(I_m+\frac{1}{\reg}K'_P\right)^{-1}K'_O\right)\leq \Tr(K'_O)
%     =\Tr(W^{\frac{1}{2}}K_O W^{\frac{1}{2}})=\sum_{s=1}^{m}\frac{1}{\epsilon_s^2}k_O(x_s,x_s)
%     \leq \delta_D \sum_{s=1}^{m}\frac{1}{\epsilon_s^2}.
%     \label{eq:gamma-second-term-tr-bd}
%     \end{equation}
%     Thus, we can bound the second term as follows.
%     \begin{align*}
%         &\log\det\left(I_m+\frac{1}{\reg}\left(I_m+\frac{1}{\reg}K'_P\right)^{-1}K'_O\right)\\
%         &\le m \log \frac{1}{m}\Tr \left(I_m +  \frac{1}{\reg}\left(I_m+\frac{1}{\reg}K'_P\right)^{-1}K'_O\right)\\
%         & \le m \log \left( 1 + \frac{\delta_D}{m\reg}\sum_{s=1}^{m}\frac{1}{\epsilon_s^2} \right)\\
%         & \le \frac{\delta_D}{\reg} \sum_{s=1}^{m}\frac{1}{\epsilon_s^2}.
%     \end{align*}
%     Here, the first inequality follows from \eqref{eq:log-det-tr}, the second inequality follows from \eqref{eq:gamma-second-term-tr-bd},
%     and the third inequality follows from $\log (1 + x) \le x$ for any $x \in \RR_{\ge 0}$.
%     This completes the proof.
% \end{proof}
\subsection{Proof of Proposition \ref{prop:log-det-ineq}}
\begin{proof}
   As we remarked in Sec. \ref{sec:det_tr_rem},
   we note that there is no difficulty in defining $\log \det (I + \frankop)$ since $\frankop$ is of finite-rank.
   We decompose $\cH_k$ as $\cH_k = \cH_1 \oplus \cH_2$ by the projection $\pi$,
   where $\cH_1 = \Ran \pi$ and $\cH_2 = \Ran (I - \pi)$.
   We define $\frankop_{11}: \cH_1 \rightarrow \cH_1$,
   $\frankop_{22}: \cH_2 \rightarrow \cH_2$,
   and $\frankop_{12}: \cH_2 \rightarrow \cH_1$ by 
   $\frankop_{11} =  \pi\frankop|_{\cH_{1}}$, 
   $\frankop_{22} = (I - \pi) \frankop|_{\cH_{2}}$,
   $\frankop_{12}= \pi \frankop|_{\cH_{2}}$.
   That is, with respect to the decomposition $\cH_1 \oplus \cH_2$,
   $\frankop$ can be represented by a matrix $\begin{pmatrix}
    \frankop_{11} & \frankop_{12}\\
    \frankop_{12}^\trn & \frankop_{22}
   \end{pmatrix}.$
   Since 
   \begin{align*}
    &\begin{pmatrix}
       I & 0\\
       -\frankop_{12}^\trn (I + \frankop_{11})^{-1}& I
    \end{pmatrix}
    \begin{pmatrix}
        I + \frankop_{11} & \frankop_{12}\\
        \frankop_{12}^\trn & I + \frankop_{22}
    \end{pmatrix}
    \begin{pmatrix}
       I & -(I + \frankop_{11}) ^{-1}\frankop_{12}\\
       0 & I
    \end{pmatrix}
    \\
    &= \begin{pmatrix}
        I + \frankop_{11}  & 0\\
        0 & I + \frankop_{22} - \frankop_{12}^\trn (I + \frankop_{11}) ^{-1}\frankop_{12} 
    \end{pmatrix} 
   \end{align*}
   and noting that they are finite-rank operators, we have
   \begin{align*}
    \log \det (I + \frankop) 
    = \log \det (I + \frankop_{11}) + \log \det (I + \frankop_{22} - \frankop_{12}^\trn (I + \frankop_{11}) ^{-1}\frankop_{12} ).
   \end{align*}
   We introduce the following well-known matrix inequalities 
   (for the first inequality, we refer to \citep[Lemma 1]{vakili2021information}).
   For a positive semi-definite matrix $A \in \RR^{n \times n}$, 
   we have 
   \begin{equation*}
    \log \det (I + A) \le n \log (1 + \Tr A/n), \quad\log \det(I + A) \le \Tr A.
   \end{equation*}
   Noting that $\dim \cH_1 = D$ and these matrix inequalities hold for finite rank operators,
   we see that 
   \begin{align*}
    \log \det (I + \frankop)& \le  
    D \log (1 + \Tr \frankop_{11}/D) + \Tr \left(\frankop_{22} - \frankop_{12}^\trn (I + \frankop_{11}) ^{-1}\frankop_{12} \right) \\
 &\le D \log (1 + \Tr \frankop_{11}/D) + \Tr\frankop_{22} .
   \end{align*}
   Here, the second inequality holds since $ \frankop_{12}^\trn (I + \frankop_{11}) ^{-1}\frankop_{12} $
   is positive semi-definite.
   We have our assertion by noting that $\Tr \frankop_{11}  = \Tr \frankop \pi$
   and $\Tr \frankop_{22} = \Tr \frankop (I - \pi)$.
\end{proof}
\subsection{Proof of Proposition \ref{prop:totnst-ub}}
To prove Proposition \ref{prop:totnst-ub}, first, we relate $\sum_{s=1}^{m}\frac{1}{\epsilon_s^2}$ to $\eta T$.
\begin{lem}
    \label{lem:e-t}
    Let $m$ be the total number of stages of Algorithm \ref{alg:qmc-kernel-ucb}.
    We assume that $\nstin \ge e$, where $\nstin$ is a parameter of Algorithm \ref{alg:qmc-kernel-ucb}.
    Then, we have
    \begin{equation*}
        \sum_{s=1}^m \frac{1}{\epsilon_s^2} \le (\eta T)^2.
    \end{equation*}
\end{lem}
\begin{proof}
    Essentially, this was proved in \citep[Lemma 2]{wan2023quantum} and easily follows from Lemma \ref{lem:qmc} and our problem setting.
    Since the number of queries of quantum reward oracles is limited up to $T$, by $\qmcubc > 1$ and Lemma \ref{lem:qmc}, we have
    \begin{align*}
            T \ge \sum_{s=1}^m \frac{\log (\nstin/\delta)}{\eta \epsilon_s}
            \ge 
            \eta^{-1}  \sum_{s=1}^m\frac{1}{ \epsilon_s}
            \ge \eta^{-1} \sqrt{\sum_{s=1}^m\frac{1}{\epsilon_s^2}}.
    \end{align*}
    This completes the proof.
\end{proof}

We can prove the following lemma by Corollary \ref{cor:gamma-bound} and the proof of \citep[Corollary 1]{vakili2021information}.
\begin{lem}
    \label{lem:e-ub}
    Let $m$ be the total number of stages of Algorithm \ref{alg:qmc-kernel-ucb}
    and put $E = \sum_{s=1}^m \frac{1}{\epsilon_s^2}$.
    \begin{enumerate}
        \item Suppose that $k$ has $(C_p, \beta_p)$ polynomial eigendecay with $C_p > 0, \beta_p > 1$.
        Then, there exists a constant $c'_p > 0$ depending only on 
        $C_p, \beta_p, \reg, \overline{k}, \overline{\psi}$ satisfying the following inequality:
        \begin{equation*}
            \qinfgain \le c_p' E^{1/\beta_p}\log^{1-1/\beta_p}(E + 1).
        \end{equation*}
        \item Suppose that $k$ has $(C_{e, 1}, C_{e, 2}, \beta_e)$ exponential eigendecay with $C_{e, 1}, C_{e, 2}, \beta_e > 0$.
        Then, there exists a constant $c_e' > 0$ depending only on 
        $C_{e, 1}, C_{e, 2}, \beta_e, \reg, \overline{k}, \overline{\psi}$ 
        such that 
        \begin{equation*}
            \qinfgain \le c_e' \log^{1 + 1/\beta_e}\left(E + 1\right).
        \end{equation*}
    \end{enumerate} 
\end{lem}
\begin{proof}
    First, suppose that $k$ has $(C_p, \beta_p)$ polynomial eigendecay.
    Then, by proof of \citep[Corollary 1]{vakili2021information}, we have $\delta_D \le C_p D^{1 -\beta_p} \psibar^2$.
    By Corollary \ref{cor:gamma-bound}, we obtain
    \begin{equation*}
        \qinfgain \le D \log \left( 1 + \frac{\kbar}{D \reg} E\right) + \frac{C_p \psibar^2}{\reg}   D^{1-\beta_p}E
        \le D \log \left( 1 + \frac{\kbar}{\reg} E\right) + \frac{C_p \psibar^2}{\reg}   D^{1-\beta_p}E.
    \end{equation*}
    Taking $D = \lceil  E^{1/\beta_p} \log^{-1/\beta_p} \left(1 + \frac{\kbar}{\reg} E\right)\rceil$, 
    we see that $\qinfgain \lesssim E^{1/\beta_p}\log^{1-1/\beta_p}(E + 1)$, 
    where notation $\lesssim$ ignores constants depending only on $C_p, \beta_p, \reg, \overline{k}, \overline{\psi}$.
    Next, suppose that $k$ has $(C_{e, 1}, C_{e, 2}, \beta_e)$ exponential eigendecay.
    Then, by proof of \citep[Corollary 1]{vakili2021information},
    there exists a constant $c''_e > 0$ depending only on $C_{e, 1}, C_{e, 2}, \beta_e, \psibar$ such that 
    $\delta_D \le c''_e \exp\left(-C_{e, 2}' D^{\beta_e}\right)$,
    where $C_{e, 2}' = C_{e, 2}$ if $\beta_e = 1$ and $C_{e, 2}' = C_{e, 2}/2$ if $\beta_e \neq 1$.
    Thus, by Corollary \ref{cor:gamma-bound}, we see that 
    \begin{equation*}
        \qinfgain \le D  \log \left( 1 + \frac{\kbar}{D \reg} E\right)  + \frac{c''_e}{\reg} \exp\left(- C_{e, 2}' D^{\beta_e}\right)E.
    \end{equation*}
    By taking $D = \lceil (\log (E + 1) / C_{e, 2}')^{1/\beta_e} \rceil$, 
    we have $\qinfgain \lesssim \log^{1/\beta_e + 1}(E + 1)$,
    where notation $\lesssim$ hides constants depending only on $C_{e, 1}, C_{e, 2} , \beta_e,  \reg, \overline{k}, \overline{\psi}$.
\end{proof}

% To prove Lemma \ref{lem:gamma-m}, we prove the following elementary lemma. 
% \begin{lem}
%     \label{lem:det-v-vt}
%     Let $f \in \cH_k$ and define a finite-rank operator $A = I_{\cH_k} + f f^\trn$, then
%     we have $\log \det A = \|f\|_{\cH_k}^2$.
% \end{lem}
% \begin{proof}
%     If $f = 0$, then the statement trivially holds. 
%     If $f \neq 0$, then 
% \end{proof}
Similarly to \citep{wan2023quantum}, we relate $\qinfgain$ to $m$.
\begin{lem}
    \label{lem:gamma-m}
    Let $m$ be the total number of stages of Algorithm \ref{alg:qmc-kernel-ucb}
    and $\qinfgain$ be as in \eqref{eq:gamma-def}. Then, we have $\qinfgain = m \log 2$.
\end{lem}
\begin{proof}
    We let $\cG_s$ be a finite dimensional subspace of $\cH_k$ spanned by $\{\phi(x_1), \dots, \phi(x_s)\}$
    and $\pwp_s = \sum_{i=1}^s \epsilon_i^{-2}\phi(x_i)\phi(x_i)^\trn$.
    By Definition \ref{def:det-tr} and its remark, we have 
    \begin{equation*}
        \qinfgain = \log \det (I + \reg^{-1}\pwp_m) = \log \det (I + \reg^{-1}\pwp_m|_{\cG_m}).
    \end{equation*}
    Therefore, the proof can be reduced to the finite dimensional case (i.e., the finite dimensional space $\cG_m$)
    and by \citep[Lemma 3]{wan2023quantum}, we have the following for each $s \ge 1$:
    \begin{equation*}
         \det (I + \reg^{-1}\pwp_s|_{\cG_m}) =2\det (I + \reg^{-1} \pwp_{s-1}|_{\cG_m}).
    \end{equation*}
    Since $\pwp_0 = 0$, we have the assertion of the lemma.
    % and $\cG_s^\perp$ the orthogonal complement of $\cG_s$ in $\cH_k$.
    % In the finite dimensional case, the statement of the lemma is proved in .
    % Since $\cG_m$ is finite dimensional the same proof works.
    % More formally, we can prove the statement of the lemma as follows.
   
    % For $s \in \ZZ_{\ge 1}$, we define a self-adjoint operator $V_s': \cH_k \rightarrow \cH_k$ by 
    % \begin{align*}
    %     V_s' &= \reg^{-1}V_s
    %     = I_{\cH_k} + \reg^{-1}\sum_{i=1}^{s} \epsilon_i^{-2}\phi(x_i)\phi(x_i)^\trn
    %     = I_{\cH_k} + \sum_{i=1}^{s}\epsilon_i'^{-2} \phi(x_i)\phi(x_i)^\trn.
    % \end{align*} 
    % Here $\epsilon_i' = \|x_s\|_{V_{s-1}'^{-1}} = \reg^{1/2}\epsilon_s$.
    % Then, $V_s'$ maps $\cG_s$ onto itself and acts on $\cG_s^\perp$ as the identity operator.
    % For $1 \le i, j \le m$, we let $\cV_{i, j}$ the restriction $V'_{i}|_{\cG_j}$ of $V'_i$ on the space $\cG_j$.
    % Since $\cG_s$ is finite dimensional, we can consider determinant of the linear operator $\cV_{s, s}$.
    % We also note that $\cV_{s, s}$ and $\cV_{s-1, s}$ are self-adjoint, positive operators on $\cG_s$.
    % By definition of $\cV_{s, s}$, we have the following.
    % \begin{align*}
    %     \det \cV_{s, s} &= \det \left(\cV_{s-1, s} + \epsilon_s'^{-2} \phi(x_s) \phi(x_s)^\trn\right)\\
    %     &= \det (\cV_{s-1, s})  \det \left(I_{\cG_s} + \epsilon_s'^{-2} \cV_{s-1, s}^{-1/2} \phi(x_s)\phi(x_s)^\trn \cV_{s-1, s}^{-1/2} \right)\\
    %     &= \det (\cV_{s-1, s}) \left(1 +  \epsilon_s'^{-2}  \|\cV_{s-1, s}^{-1/2} \phi(x_s) \|_{\cH_k}^2 \right)\\
    %     &= \det (\cV_{s-1, s}) \left(1 +  \epsilon_s'^{-2}  \|V_{s-1}'^{-1/2} \phi(x_s) \|_{\cH_k}^2 \right)\\
    %     &= \det (\cV_{s-1, s}) \left(1 +  \epsilon_s'^{-2}  \| \phi(x_s) \|_{V'^{-1}_{s-1}}^2 \right)\\
    %     & = 2 \det (\cV_{s-1, s}).
    % \end{align*}
    % Since $\cV_{s-1, s}$ acts on the orthogonal complement of $\cG_{s-1} \subseteq \cG_{s}$ as the identity operator,
    % we have $\det \cV_{s-1, s} = \det \cV_{s-1, s-1}$.
    % By the recursive equality $\det \cV_{s, s} = 2 \det \cV_{s-1, s-1}$ and $\cV_{0, 0} = I_{\cH_k}$,
    % we obtain $\gamma = \log \det \reg^{-1}V_{m} = m \log 2$.
\end{proof}

\begin{proof}[Proof of Proposition \ref{prop:totnst-ub}]
   If $k$ has an exponential eigendecay and $\eta = 1$,
   then the statement of the proposition follows from Lemma \ref{lem:e-t}, \ref{lem:e-ub}, \ref{lem:gamma-m}.
   Let us suppose $k$ has $\beta_p$ polynomial eigendecay.
   Then, by Lemmas \ref{lem:e-t}, \ref{lem:e-ub}, and \ref{lem:gamma-m}, we have 
   $m \lesssim (\eta T)^{2\beta_p^{-1}}\log^{1 - \beta_p^{-1}}(1 + \eta T)$.
   By Proposition \ref{prop:regret-using-m}, 
   we take $\eta$ so that $\eta^{-1}$ and $(\eta T)^{\beta_p^{-1}}$ have the same order, i.e., $\eta = T^{-1/(1 + \beta_p)}$.
   This completes the proof.
\end{proof}

\subsection{Proof of Theorem \ref{thm:upper-bd}}
\begin{proof}
Theorem \ref{thm:upper-bd} follows from Proposition \ref{prop:regret-using-m} and Proposition \ref{prop:totnst-ub}.
\end{proof}