\newpage
\subsection{Proof for Theorem~\ref{thm:UCBE-FMUCB}}\label{proof:ucbefmucb}
\begin{theorem*}[Last iterate convergence of UCBE-FMUCB with noisy side information]
Suppose the leader uses UCBE with $S_0 = \mO\left( \frac{B}{\varepsilon^3} \log\frac{ABT}{\delta}\right)$ and $\varepsilon = \min\{\Delta_4, \Delta_5, \Delta_6\}$, and the follower uses FMUCB. Let $T_{f,w}$ be the total number of rounds, out of $T$ rounds, in which the follower does not play the best manipulation strategy. Then, with probability at least $1-3\delta$,
\[
T_{f,w} \leq  \mO\left(\frac{ A B }{ \varepsilon^2} \log \frac{ABT}{\delta}\right),
\]
and for $T\geq  \mO\left( \frac{A S_0}{\Delta_3^2}\right)$, $\mathbb{P}\big[a_T \neq a_{fm} \big]\leq \frac{\delta}{T}$.
\end{theorem*}
\bigskip\bigskip

According to the analysis in Appendix~\ref{proof:ucbeucb}, the leader who uses UCBE performs pure exploration on each $a\in\mA$ for $\mO\left(\frac{B}{\varepsilon^3} \log\frac{ ABT}{\delta}\right)$ rounds, where $\varepsilon=\min\{\Delta_4,\Delta_5,\Delta_6\}$. Hence, by the union bound, with probability at least $1-3\delta$,
\begin{equation*}
    T_{f,w}\leq \mO\left(t_1 + AB t_2 +AB t_3\right)=\mO\left(\frac{ A B }{\varepsilon^2} \log \frac{ABT}{\delta}\right).
\end{equation*}
Similar to the proof of Theorem~\ref{thm:ucbe-ucb}, we bound the difference between the cumulative reward the leader receives and the cumulative reward under the best manipulation strategy,
\begin{align*}
&\left|\sum_{t=1}^{n(a)} \left(r_{l,t}(a, b_t)-\mu_l(a, \mF_{fm}(a))\right)\right| \\
\leq & \left|\sum_{t=1}^{n(a)} \left(r_{l,t}\left(a, \mF_{fm}(a)\right) - \mu_l\left(a, \mF_{fm}(a)\right)\right)\mI\left\{b_t = \mF_{fm}(a)\right\}\right| + \sum_{t=1}^{n(a)} \mI\left\{b_t \neq \mF_{fm}(a)\right\}.
\end{align*}
Based on the proof of Theorem~\ref{thm:EXP3-FMUCB} in Appendix~\ref{proof:ucbeucb} and Lemma~\ref{lemma: bound for wbr and wwr}, we have
\begin{equation*}
    \sum_{t=1}^{n(a)} \mI\left\{b_t \neq \mF_{fm}(a)\right\}\leq T_{wwr}(a)+Bt_2 +Bt_3
    =\mO\left(\frac{B}{\varepsilon^2} \log \frac{ABT}{\delta}\right).
\end{equation*}
The remaining steps are analogous to the proof of Theorem~\ref{thm:ucbe-ucb} in Appendix~\ref{proof:ucbeucb}, which completes the proof of Theorem~\ref{thm:UCBE-FMUCB}.