\begin{lemma}
    \label{lemm:ST_equiv_rev} 
    For any $\gamma > \epsilon$, the following implication holds:
    \begin{equation*}
        \frac{\norm{R_2 x}}{\norm{x}} \leq \gamma - \epsilon := \gamma' \quad \Rightarrow \quad \frac{\norm{(I - \hat{\Pi}_1)x}}{\norm{x}} \leq \gamma
    \end{equation*}
%    \guannan{RHS should also be $\gamma'$ according to (30)?}\ziyi{modified.}
\end{lemma}
\begin{proof}
    \begin{align}
        \frac{\norm{(I - \hat{\Pi}_1)x}}{\norm{x}} &= \frac{\norm{(I - \hat{\Pi}_1 + \Pi_1 - \Pi_1)x}}{\norm{x}} \notag
        \\
        &\leq \frac{\norm{(I - \Pi_1) x}}{\norm{x}} + \frac{\norm{\hat{\Pi}_1 - \Pi_1}\norm{x}}{\norm{x}}
        \notag
        \\
        &\leq \frac{\norm{\Pi_2 x}}{\norm{x}} + \epsilon
        \notag
        \\
        &= \frac{\norm{\Pi_2 \Pi_s x}}{\norm{x}} + \epsilon
        \label{eqn:B2.1}
        \\
        &\leq \frac{\norm{\Pi_s x}}{\norm{x}} + \epsilon
        \notag 
        \\
        &\leq \gamma,
    \end{align}
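where \eqref{eqn:B2.1} holds because $E_2$ is orthogonal to $E_1$ and therefore $\Pi_2 \Pi_u = 0$; indeed, $P_2P_2^* Q_1 R_1=0$ by orthogonality of $P_2$ and $Q_1 = P_1$. The last inequality follows from the hypothesis, since $\norm{\Pi_s x} = \norm{Q_2 R_2 x} \leq \norm{R_2 x}$ when the columns of $Q_2$ are orthonormal.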
\end{proof}
%\begin{lemma}
%\label{lemm:ST_equiv}
    %\begin{equation*}
    %    \frac{\norm{(I - \hat{\Pi}_1)x}}{\norm{x}} \leq \gamma \quad \Rightarrow \quad \frac{\norm{R_2 x}}{\norm{x}} \leq \gamma + \epsilon + \frac{\sqrt{2\xi}}{1-\xi} := \gamma'
    %\end{equation*}
%\end{lemma}
%\begin{proof}
    %\begin{align}
        %\frac{\norm{(I - \hat{\Pi}_1)x}}{\norm{x}} &= \frac{\norm{(I - \hat{\Pi}_1 + \Pi_1 - \Pi_1)x}}{\norm{x}} \notag
        %\\
        %\geq & \frac{\norm{(I - \Pi_1) x}}{\norm{x}} - \frac{\norm{\hat{\Pi}_1 - \Pi_1}\norm{x}}{\norm{x}}
        %\notag
        %\\
        %\geq& \frac{\norm{\Pi_2 x}}{\norm{x}} - \epsilon
        %\notag
        %\\
        %=& \frac{\norm{\Pi_2 \Pi_s x}}{\norm{x}} - \epsilon
        %\label{eqn:L5.1}
    %\end{align}
    %\guannan{Justify the last equality above.}\ziyi{better?} The last equality holds because $E_s$ is orthogonal to $E_1$ in the stable-unstable space decomposition.  
    %We can also use
    %\begin{align}
        %\frac{\norm{\Pi_s x}}{\norm{x}} =& \frac{\norm{(\Pi_1 + \Pi_2)\Pi_s x}}{\norm{x}}\notag
        %\\
        %\leq & \frac{\norm{\Pi_1 \Pi_s x}}{\norm{x}} + \frac{\norm{\Pi_2 \Pi_s x}}{\norm{x}}\notag
        %\\
        %= & \frac{\norm{P_1 P_1^* Q_2 R_2 x}}{\norm{x}} + \frac{\norm{\Pi_2 \Pi_s x}}{\norm{x}}\notag
        %\\
        %\leq & \frac{\sqrt{2\xi}}{1-\xi} + \frac{\norm{\Pi_2 \Pi_s x}}{\norm{x}}
        %\label{eqn:L5.2}
    %\end{align}
    %Combining \eqref{eqn:L5.1} and \eqref{eqn:L5.2}, we obtain
    %\begin{equation*}
    %    \frac{\norm{\Pi_s x}}{\norm{x}} \leq \frac{\norm{(I - \hat{\Pi}_1)x}}{\norm{x}} + \frac{\sqrt{2\xi}}{1-\xi} + \epsilon
    %\end{equation*}
    %The Lemma directly follows from the above.
%\end{proof}

In the following propositions, we show that the stopping time $\omega_i$ defined in Algorithm~\ref{alg:LTS0} guarantees a bound on $\norm{x_t}$.

\begin{proposition}
\label{prop:base_portion}
    Under the premise of Theorem~\ref{thm:main}, for any constant $\gamma > \epsilon$, if in the open loop system, 
    \begin{equation*}
        \frac{\norm{(I - \hat{\Pi}_1) x_{t}}}{\norm{x_{t}}} > \gamma,
    \end{equation*}
    then there exists $C_{\gamma} \in \mathbb{R}^+$ such that $\norm{x_{t}} < C_{\gamma}$. 
\end{proposition}

\begin{proof}
 Since $x_{t} = \sum_{j = 0}^{t} A^{t-j}\eta_{j}$, we have
    %\begin{equation*}
        %\frac{\norm{R_1 x_{T}}}{\norm{R_2 x_{T}}} = \frac{\norm{ \sum_{j = 0}^{T} R_1 A^{T-j}\eta_j}}{\norm{ \sum_{j = 0}^{T} R_2 A^{T-j}\eta_j}}
    %\end{equation*}
    \small
    \begin{equation*}
        R x_{t} = \begin{bmatrix}
            R_1 x_{t} \\ R_2 x_{t}
        \end{bmatrix}
        =
        \begin{bmatrix}
            R_1 \sum_{j = 0}^{t} A^{t-j}\eta_j \\ R_2 \sum_{j = 0}^{t} A^{t-j}\eta_j
        \end{bmatrix}
        = 
        \begin{bmatrix}
            \sum_{j = 0}^{t} N_1^{t-j} R_ 1\eta_j \\ \sum_{j = 0}^{t} N_2^{t-j} R_2\eta_j
        \end{bmatrix}
    \end{equation*}
    \normalsize
    Therefore, we have that %\guannan{below, should be $R_2 x_t$?}\ziyi{yes}
    \small
    \begin{align*}
        \norm{R_2 x_t} &\leq \sum_{j=0}^{t} \norm{N_2^j} \norm{R_2} C \leq \sum_{j=0}^{t}\zeta_{\epsilon_4}(N_2)(|\lambda_{k+1}|+\epsilon_4)^j \norm{R_2} C
        \\
        &\leq \frac{\zeta_{\epsilon_4}(N_2) C}{1-\xi} \frac{1}{1 - (|\lambda_{k+1}|+\epsilon_4)},
    \end{align*} 
    \normalsize
    where we used Lemma A.1 of \citet{LTI}. As $\norm{R_2 x_{t}}$ is bounded above by a constant, so is $\norm{\Pi_s x_t} = \norm{Q_2 R_2 x_t}$. 
    
    Since $\frac{\norm{(I - \hat{\Pi}_1) x_{t}}}{\norm{x_{t}}} > \gamma$, the contrapositive of Lemma~\ref{lemm:ST_equiv_rev} gives $\frac{\norm{R_2 x_t}}{\norm{x_t}} > \gamma'$. %\guannan{A bit confused - should be $R_2$? And also, for Lemma B.1 it is $<$} 
    Correspondingly, we have
    \begin{align*}
        \gamma' < \frac{\norm{R_2 x_t}}{\norm{x_t}},
    \end{align*}
    which implies
    \begin{equation}
    \label{eqn:C_gamma}
        \norm{x_t} < \frac{\zeta_{\epsilon_4}(N_2) C}{\gamma'(1-\xi)} \frac{1}{1 - (|\lambda_{k+1}|+\epsilon_4)} := C_{\gamma}.
    \end{equation}
\end{proof}

\begin{proposition}
\label{prop:ST_induction}
    Under the premise of Theorem~\ref{thm:main}, for any constant $\gamma > \epsilon$, consider an initial state $x_i$ such that $\frac{\norm{P_2^* x_i}}{\norm{x_i}} > \gamma$. Moreover, let $x_{i+1} = A x_{i} + Bu + \eta_i$, i.e., we insert control right after the initial state and let the system run in open loop thereafter. If $t \in \mathbb{Z}^+$ is such that
    \begin{equation*}
        \frac{\norm{(I - \hat{\Pi}_1) x_{i+t}}}{\norm{x_{i+t}}} > \gamma,
    \end{equation*}
    then, for all $\alpha < \frac{1}{\norm{B}}$,
    \begin{equation*}
        \norm{x_{i+t}} < \frac{1}{\gamma'} \left(\frac{2\zeta_{\epsilon_4}(N_2)}{1-\xi}\norm{x_i} + C_{\gamma}\right).
    \end{equation*}
\end{proposition}
\begin{proof}
    \begin{align}
        \norm{R_2 x_{i+t}} \leq& \norm{N_2^t R_2 x_i + N_2^{t-1}R_2 B u} + \sum_{j=0}^t \norm{N_2^j} \norm{R_2} C\notag
        \\
        \leq& \frac{\zeta_{\epsilon_4}(N_2)}{1-\xi}(|\lambda_{k+1}|+\epsilon_4)^{t-1}((1 + \alpha\norm{B})\norm{x_i}) + C_{\gamma}\notag
        \\
        \leq& \frac{2\zeta_{\epsilon_4}(N_2)}{1-\xi}(|\lambda_{k+1}|+\epsilon_4)^{t-1}\norm{x_i} + C_{\gamma}.
        \label{eqn:propv4.1}
    \end{align}
    Since $\frac{\norm{(I - \hat{\Pi}_1) x_{i+t}}}{\norm{x_{i+t}}} > \gamma$, by the contrapositive of Lemma~\ref{lemm:ST_equiv_rev}, we have that 
    \begin{align*}
        \gamma' < \frac{\norm{R_2 x_{i+t}}}{\norm{x_{i+t}}}.
    \end{align*}
    Substituting the above into \eqref{eqn:propv4.1} finishes the proof.
\end{proof}

\begin{proposition}
\label{prop:ST_final}
    Under the premise of Theorem~\ref{thm:main}, for any constant $\gamma > \epsilon$ and stopping time $\omega_{i}$ such that:
    \begin{equation*}
        \omega_i = \min \left\{t > t_{i-1} : \frac{\norm{(I - \hat{\Pi}_1) x_{t}}}{\norm{x_{t}}} \leq \gamma \wedge  \norm{x_t} > \frac{C}{\delta}\right\},
    \end{equation*}
    where we assume $t_0 = T$. Then, Algorithm~\ref{alg:LTS0} guarantees that %\guannan{Just $R_2$, not $R_2^*$. It seems most previous places are right, but many recent edits have this additional transpose }\guannan{Why do we care $\frac{\Vert R_2 x_{t_i}\Vert}{\Vert x_{t_i}\Vert}$? I think in eq. (30) we care $\frac{\Vert P_2^* x_{t_i}\Vert}{\Vert x_{t_i}\Vert}$}
    \begin{equation*}
        \frac{\norm{P_2^* x_{t_i}}}{\norm{x_{t_i}}} < \gamma + \epsilon, \qquad \forall i \in \{1,\dots, m\},
    \end{equation*}
    while maintaining %\guannan{We want the below to hold for all times between $t_i$ and $t_{i+1}$?} \ziyi{just a change of notation. Better?}
    \begin{equation*}
        \norm{x_{t_1}} \leq \max\left\{\norm{A}\frac{C}{\delta} + C, \norm{A} C_{\gamma} + C, \norm{x_T}\right\},
    \end{equation*}
    \begin{equation*}
        \norm{x_{t}} < \max\left\{\norm{A}\frac{C}{\delta} + C, \left(\frac{\norm{A}}{\gamma'}\frac{2\zeta_{\epsilon_4}(N_2)}{1-\xi}\right)^i \norm{x_{t_1}} + \sum_{j=1}^{i-1} \left(\frac{\norm{A}}{\gamma'}\frac{2\zeta_{\epsilon_4}(N_2)}{1-\xi}\right)^j \left(\frac{\norm{A}}{\gamma'} C_\gamma + C\right)\right\}, \quad \forall t_i \leq t \leq t_{i+1}.
    \end{equation*}
\end{proposition}
\begin{proof}
    Similar to the steps in proof of Lemma~\ref{lemm:ST_equiv_rev}, we obtain that %\guannan{Provide more details - how to obtain the below?...}\ziyi{better?}\guannan{I actually find the first two equalities are completely redundant?}
    \begin{equation*}
        \frac{\norm{P_2^* x_{t_i}}}{\norm{x_{t_i}}} = \frac{\norm{\Pi_2(\Pi_u + \Pi_s) x_{t_i}}}{\norm{x_{t_i}}} = \frac{\norm{\Pi_2 \Pi_s x_{t_i}}}{\norm{x_{t_i}}} \leq \frac{\norm{\Pi_2 x_{t_i}}}{\norm{x_{t_i}}} = \frac{\norm{(I - \hat\Pi_1+ \hat\Pi_1 - \Pi_1) x_{t_i}}}{\norm{x_{t_i}}} \leq \gamma + \epsilon,
    \end{equation*}
    which shows the first part of the result. 
    
    We now focus on the second part (bounding $\Vert x_t\Vert$). 
    For the base case, we either have $t_1 = T$, and thus $x_{t_1} = x_T$, in which case the stopping-time criterion is already met after Stage 1 of Algorithm~\ref{alg:LTS0}; or, if $t_1 > T$, there are two scenarios depending on which of the two stopping criteria is violated at time $t_1-1$. If $\frac{\norm{(I - \hat{\Pi}_1) x_{t_1 - 1}}}{\norm{x_{t_1 - 1}}} > \gamma$, by Proposition~\ref{prop:base_portion}, we have $\norm{x_{t_1 - 1}} < C_{\gamma}$, where $C_{\gamma}$ is defined in \eqref{eqn:C_gamma}, in which case we have
    \begin{equation}
    \label{eqn:upper_base}
        \norm{x_{t_1}} = \norm{A x_{t_1 - 1} + \eta_{t_1 - 1}} \leq \norm{A} C_{\gamma} + C.
    \end{equation}
    In the second case, $\norm{x_{t_1-1}} \leq \frac{C}{\delta}$, so we have
    \begin{equation*}
    \label{eqn:upper_base2}
        \norm{x_{t_1}} < \norm{A}\frac{C}{\delta} + C.
    \end{equation*}
    Therefore, to sum up the base case, we have
    \begin{equation*}
        \norm{x_{t_1}} \leq \max\left\{\norm{A}\frac{C}{\delta} + C, \norm{A} C_{\gamma} + C, \norm{x_T}\right\}
    \end{equation*}
    
    For the induction case, given $\norm{x_{t_i}}$, there are again two cases depending on which criterion is violated at time $t_{i+1}-1$. If $\norm{x_{t_{i+1}-1}} \leq \frac{C}{\delta}$, we have
    \begin{equation*}
        \norm{x_{t_{i+1}}} < \norm{A}\frac{C}{\delta} + C.
    \end{equation*}
    Otherwise, if $\frac{\norm{(I - \hat{\Pi}_1) x_{t_{i+1}-1}}}{\norm{x_{t_{i+1}-1}}} > \gamma$, by Proposition~\ref{prop:ST_induction}, we obtain that 
    \begin{equation}
        \norm{x_{t_{i+1}-1}} < \frac{1}{\gamma'} \left(\frac{2\zeta_{\epsilon_4}(N_2)}{1-\xi}\norm{x_{t_i}} + C_{\gamma}\right),
    \end{equation}
    where $\gamma'$ is defined in Lemma~\ref{lemm:ST_equiv_rev}.
    
    By the definition of $\omega_i$, the maximum of the above inequalities also holds for all $x_{t}$ such that $t < t_{i+1}$. Therefore, 
    \begin{equation*}
        \norm{x_{t_{i+1}}} < \max\left\{\norm{A}\frac{C}{\delta} + C, \frac{\norm{A}}{\gamma'} \left(\frac{2\zeta_{\epsilon_4}(N_2)}{1-\xi}\norm{x_{t_i}} + C_{\gamma}\right) + C\right\},
    \end{equation*}
    as required. Note that the same bound above also holds for all $t_i<t<t_{i+1}$. Hence we get the desired result after a simple recursive expansion. 
\end{proof}

We are now ready to bound $\norm{\hat{B}_\tau - B_{\tau}}$.
\begin{proposition}
    \label{prop:G6}
    Under the premise of Theorem~\ref{thm:main}, 
    \begin{equation*}
        \norm{\hat{B}_\tau - B_\tau} < C_B \left(|\lambda_1|+\epsilon_1\right)^{\tau-1} \delta,
    \end{equation*}
    where $C_B := (\zeta_{\epsilon_1}^2 (A) (3\tau\norm{A} + \norm{B} + \tau C + 1)+ (\tau+1)C_{\Delta})\frac{\sqrt{m}}{\alpha}$.
\end{proposition}
\begin{proof}
    We have
    \begin{align*}
        \norm{b_i - \hat{b}_i}
        = & \frac{1}{\alpha\norm{x_{t_i}}}\Bigg \lVert P_1^* x_{t_i + \tau} - M_1^\tau P_1^* x_{t_i} - \Delta_{\tau} P_2^* x_{t_i} - \sum_{j = 1}^{\tau-1} (M_1^{\tau-j} P_1^* \eta_{t_i + j} - \Delta_{\tau-j} P_2^* \eta_{t_i + j})
        \\
        & - \left(\hat{P}_1^* x_{t_i+\tau} - \hat{M}_1^\tau \hat{P}_1^* x_{t_i}\right) \Bigg \rVert
        \\
        \leq & \frac{1}{\alpha\norm{x_{t_i}}} \Bigg(\norm{(P_1 - \hat{P}_1)^* \left(A^\tau x_{t_i} + B_\tau u_{t_i}\right)} + \norm{\sum_{j=1}^{\tau-1} M_1^{\tau-j} (P_1 -\hat{P}_1)^* \eta_{t_i + j}} + \norm{M_1^\tau P_1^* x_{t_i} - \hat{M}_1^\tau \hat{P}_1^* x_{t_i}}
        \\
        & + \norm{\Delta_{\tau} P_2^* x_{t_i}} + \sum_{j = 1}^{\tau-1} \norm{M_1^{\tau-j} P_1^* \eta_{t_i + j}} + \sum_{j = 1}^{\tau-1}\norm{\Delta_{\tau-j} P_2^* \eta_{t_i + j}}\Bigg).
    \end{align*}
    Here, the first term is bounded by
    \begin{align*}
        \norm{(P_1 - \hat{P}_1)^* \left(A^\tau x_{t_i} + B_\tau u_{t_i}\right)} 
        \leq & \norm{P_1 - \hat{P}_1} \left(\norm{A^\tau} + \norm{A^{\tau-1}B}\right) \norm{x_{t_i} }
        \\
        \leq & \norm{x_{t_i} } \zeta_{\epsilon_1} (A) \left(|\lambda_1| + \epsilon_1\right)^{\tau - 1} (\norm{A} + \norm{B})\delta,
    \end{align*}
    where in the last inequality we applied Corollary~\ref{coro:52.1} and Gelfand's formula; the second term is bounded by 
    \begin{align*}
        \norm{\sum_{j=1}^{\tau-1} M_1^{\tau-j} (P_1 -\hat{P}_1)^* \eta_{t_i + j}} 
        \leq & \sum_{j=1}^{\tau-1} \zeta_{\epsilon_1} (A) \left(|\lambda_1| + \epsilon_1\right)^{\tau - j} C \delta
        \\
        < & \tau \zeta_{\epsilon_1} (A) \left(|\lambda_1| + \epsilon_1\right)^{\tau - 1} C \delta,
    \end{align*}
    where we used Corollary~\ref{coro:52.1} and Gelfand's formula. 
    
    The third term is bounded above by 
    \begin{align*}
        \norm{M_1^\tau P_1^* x_{t_i} - \hat{M}_1^\tau \hat{P}_1^* x_{t_i}}
        \leq & \left(\norm{M_1^\tau (P_1 - \hat{P}_1)^* } + \norm{(M_1^\tau - \hat{M}_1^\tau) \hat{P}_1^*}\right)\norm{x_{t_i}}
        \\
        < & \big(\zeta_{\epsilon_1} (A) \left(|\lambda_1| + \epsilon_1\right)^{\tau - 1} \norm{A} \delta + 3\tau \norm{A}\zeta_{\epsilon_1} (A) \left(|\lambda_1| + \epsilon_1\right)^{\tau - 1} \delta\big)\norm{x_{t_i}}
        \\
        \leq & \norm{x_{t_i}}\zeta_{\epsilon_1} (A)^2 \left(|\lambda_1| + \epsilon_1\right)^{\tau - 1} (3\tau+1) \norm{A} \delta,
    \end{align*}
    where we applied Gelfand's formula and \Cref{prop:G2}. 
    The fourth term is bounded by
    \begin{align}
        \frac{\norm{\Delta_\tau} \norm{P_2^* x_{t_i}}}{\norm{x_{t_i}}}
        \leq & C_{\Delta}(|\lambda_1| + \epsilon_1)^\tau (\gamma + \epsilon)
        \label{eqn:26}
        \\
        \leq & C_{\Delta}(|\lambda_1| + \epsilon_1)^\tau \delta,
        \label{eqn:28}
    \end{align}
    where in \eqref{eqn:26} we used Proposition G.1 of \citet{LTI} and Proposition~\ref{prop:ST_final}, while for \eqref{eqn:28} we need to pick the stopping time $\omega$ with $\gamma$ satisfying
    \begin{equation}
        \gamma \leq \delta - \epsilon = (\sqrt{2k}-1)\epsilon.
    \end{equation}
    For the second-to-last and the last terms,
    \begin{align}
        \frac{1}{\norm{x_{t_i}}}\sum_{j = 1}^{\tau-1} \norm{M_1^{\tau-j} P_1^* \eta_{t_i + j}} \leq & \frac{1}{\norm{x_{t_i}}}\sum_{j=1}^{\tau-1} \zeta_{\epsilon_1} (A) \left(|\lambda_1| + \epsilon_1\right)^{\tau - j} C \notag
        \\
        < & \frac{1}{\norm{x_{t_i}}}\tau \zeta_{\epsilon_1} (A) \left(|\lambda_1| + \epsilon_1\right)^{\tau - 1} C \notag
        \\
        < & \tau \zeta_{\epsilon_1} (A) \left(|\lambda_1| + \epsilon_1\right)^{\tau - 1} \delta,
        \label{eqn:ST_ms}
    \end{align}
    \begin{align}
        \frac{1}{\norm{x_{t_i}}}\sum_{j = 1}^{\tau-1}\norm{\Delta_{\tau-j} P_2^* \eta_{t_i + j}}
        \leq & \frac{1}{\norm{x_{t_i}}} \tau C_{\Delta}(|\lambda_1| + \epsilon_1)^\tau C
        \notag
        \\
        \leq & \tau C_{\Delta}(|\lambda_1| + \epsilon_1)^\tau \delta,
        \label{eqn:ST_xt}
    \end{align}
    where in \eqref{eqn:ST_ms} and \eqref{eqn:ST_xt}, we need
    \begin{equation}
    \label{eqn:additional_ST}
        \frac{C}{\norm{x_{t_i}}} < \delta.
    \end{equation}
    %\guannan{Reword the below sentence to cite the previous Propositions D.4?}\ziyi{better?}
    We note that \eqref{eqn:additional_ST} holds with high probability since the system runs mostly in open loop. If this inequality is not satisfied, we can keep the system running in open loop until it is. If it is never satisfied, then the system is stable. More formally, as the first stopping time $t_1$ stated in \Cref{prop:ST_final} is never reached, the bound for $\norm{x_{t_1}}$ holds for all $x_t$. 

    Finally, to bound the error of the whole matrix, we simply apply the definition
    \begin{align*}
        \norm{\hat{B}_{\tau} - B_{\tau}} =& \max_{\norm{u}=1}\norm{(\hat{B}_{\tau} - B_{\tau})u} \leq \max_{\norm{u}=1}\sum_{i=1}^m |u_i| \norm{\hat{b}_i - b_i}
        \\
        <& (\zeta_{\epsilon_1}^2 (A) (3\tau\norm{A} + \norm{B} + \tau C + 1)+ (\tau+1)C_{\Delta})\left(|\lambda_1| + \epsilon_1\right)^{\tau - 1} \delta \frac{\sqrt{m}}{\alpha}.
    \end{align*}
\end{proof}
