\section{Lipschitz Property of \texorpdfstring{$H_{x,x}$}{}}\label{sec:lips_H_xx}
In Section~\ref{sub:lips_H_xx:main_res}, we present the main results of the Lipschitz property of $H_{x,x}$. In Section~\ref{sub:lips_H_xx:summary}, we summarize the results from following steps 1-9. In Section~\ref{sub:lips_H_xx:upper_bound}, we compute the upper bound of basic functions for the following proof. In Section~\ref{sub:lips_H_xx:basic_lips}, we compute the Lipschitz Property of basic functions for the following proof. In Section~\ref{sub:lips_H_xx:step1}, we analyze the first step of Lipschitz function $c(x,:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v )$. In Section~\ref{sub:lips_H_xx:step2}, we analyze the second step of Lipschitz function $-\gamma_{j_0}(x) \cdot c(x,:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v )$. In Section~\ref{sub:lips_H_xx:step3}, we analyze the third step of Lipschitz function $- 2 \gamma_{j_0}(x) \cdot   (f(x)_{j_0} \circ v ) f(x)_{j_0}^\top $. In Section~\ref{sub:lips_H_xx:step4}, we analyze the fourth step of Lipschitz function $-c(x,:)_{j_0,i_0} \cdot   (f(x)_{j_0} \circ v ) f(x)_{j_0}^\top $. In Section~\ref{sub:lips_H_xx:step5}, we analyze the fifth step of Lipschitz function $- 2 \gamma_{j_0}(x)  \cdot  f(x)_{j_0} (f(x)_{j_0} \circ v)^\top$. In Section~\ref{sub:lips_H_xx:step6}, we analyze the sixth step of Lipschitz function $ - c(x,:)_{j_0,i_0}) \cdot  f(x)_{j_0} (f(x)_{j_0} \circ v)^\top$. In Section~\ref{sub:lips_H_xx:step7}, we analyze the seventh step of Lipschitz function $ 2 \gamma_{j_0}(x) c(x,:)_{j_0,i_0}  \cdot f(x)_{j_0} f(x)_{j_0}^\top$. In Section~\ref{sub:lips_H_xx:step8}, we analyze the eighth step of Lipschitz function $  \gamma_{j_0}(x)^2  \cdot f(x)_{j_0} f(x)_{j_0}^\top$. 
In Section~\ref{sub:lips_H_xx:step9}, we analyze the nineth step of Lipschitz function $   (f(x)_{j_0} \circ v) \cdot ( f(x)_{j_0} \circ v )^\top$. 


\subsection{Main Result}\label{sub:lips_H_xx:main_res}

In this section, we present the main result of the Lipschitz property.

\begin{lemma}\label{lem:lip_main}
If the following conditions hold
\begin{itemize}
    \item Let $H_{j_0,i_0} = \frac{\d^2 L_{j_0,i_0}}{\d x \d x} : \R^{d^2} \rightarrow \R^{d^2 \times d^2}$
    \item Let $H = \sum_{j_0=1}^n \sum_{i_0=1}^d H_{j_0,i_0}$ (because $L = \sum_{j_0=1}^n \sum_{i_0=1}^d L_{j_0,i_0} $)
    \item Let $\A \in \R^{n^2 \times d^2}$ and $u(x)_{j_0} \in \R^n$ be defined as Definition~\ref{def:u}
    \item Let $\alpha(x)_{j_0} \in \R$ be defined as Definition~\ref{def:alpha}
    \item Let $f(x)_{j_0} \in \R^n$ be defined as Definition~\ref{def:f}
    \item Let $c(x,:)_{j_0,i_0} \in \R$ be defined as Definition~\ref{def:c}
    \item Let $\gamma(x)_{j_0} = \langle f(x)_{j_0}, v \rangle \in \R$
    \item $\| A_1 \|, \| A_2 \| , \| A_3 \| \leq R$, $\| \A_{j_0} \| \leq R$, $\| x \|_2 \leq R$,$| b_{j_0,i_0} | \leq R$, $\| v \|_2 \leq R^2$
    \item Let $R \geq 4$
   
    \item Let $M:=\exp( O( R^2+ \log (nd ) )  )$
\end{itemize}

Then, we have for all $x, \wt{x} \in \R^{d^2}$
\begin{itemize}
\item Part 1. For each $j_0 \in [n]$, $i_0 \in [d]$
\begin{align*}
    \| H_{j_0,i_0}(x) - H_{j_0,i_0}( \wt{x} ) \| \leq M \cdot \| x - \wt{x} \|_2
\end{align*}
\item Part 2.
\begin{align*}
    \| H(x) - H( \wt{x} ) \| \leq M \cdot \| x - \wt{x} \|_2 
\end{align*}
\end{itemize}
\end{lemma}


\begin{proof}

{\bf Proof of Part 1.}
We have 
\begin{align*}
 \| H_{j_0,i_0}(x) - H_{j_0,i_0}(\wt{x}) \| \leq & ~ \sum_{k=1}^9 \| \A_{j_0}^\top \| \cdot \| G_k(x) - G_k(\wt{x}) \| \cdot \| \A_{j_0} \| \\
 \leq & ~ 9 R^2 \cdot n^{1.5} \exp(20R^2) \\
 \leq & ~ n^{1.5} \exp(30R^2)
\end{align*}
where the first step follows from definition of $H_{j_0,i_0}(x)$,  the second step follows from Lemma~\ref{lem:summary_Gi}, and last step follows from simple algebra.

{\bf Proof of Part 2.}

Then, we have 
\begin{align*}
\| H(x) - H(\wt{x}) \| 
\leq & ~ \sum_{j_0=1}^n \sum_{i_0=1}^d \| H_{j_0,i_0}(x) - H_{j_0,i_0}(\wt{x}) \| \\
\leq & ~ nd \cdot n^{1.5} \exp(30R^2)
\end{align*}
where the first step follows from triangle inequality and $H = \sum_{j_0=1}^n \sum_{i_0=1}^d H_{j_0,i_0}$, and the second step follows from {\bf Part 1.}
\end{proof}


\subsection{Summary of Nine Steps}\label{sub:lips_H_xx:summary}

In this section, we provide a summary of the nine-step calculation of Lipschitz for different matrix functions.

\begin{lemma}\label{lem:summary_Gi}
    If the following conditions hold 
    \begin{itemize}
        \item $G_1(x) =  c(x,:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v )$
        \item $G_2(x) = -\gamma_{j_0}(x) \cdot c(x,:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v )$
        \item $G_3(x) =  - 2 \gamma_{j_0}(x) \cdot   (f(x)_{j_0} \circ v ) f(x)_{j_0}^\top  $
        \item $G_4(x) = -c(x,:)_{j_0,i_0} \cdot   (f(x)_{j_0} \circ v ) f(x)_{j_0}^\top  $
        \item $G_5(x) = - 2 \gamma_{j_0}(x)  \cdot  f(x)_{j_0} (f(x)_{j_0} \circ v)^\top$ (The proof of this is identical to $G_3$)
        \item $G_6(x) =  - c(x,:)_{j_0,i_0} \cdot  f(x)_{j_0} (f(x)_{j_0} \circ v)^\top$ (The proof of this is identical to $G_4$)
        \item $G_7(x) =  2 \gamma_{j_0}(x) c(x,:)_{j_0,i_0} \cdot f(x)_{j_0} f(x)_{j_0}^\top$
        \item $G_8(x) = \gamma_{j_0}(x)^2  \cdot f(x)_{j_0} f(x)_{j_0}^\top $
        \item $G_9(x) = (f(x)_{j_0} \circ v) \cdot ( f(x)_{j_0} \circ v )^\top$
    \end{itemize}
    Then, we have
    \begin{align*}
        \max_{k \in [9]} \| G_k(x) - G_k( \wt{x} ) \| \leq n^{1.5} \exp(20R^2).
    \end{align*}
\end{lemma}
\begin{proof}
The proof follows from Lemma~\ref{lem:lipschitz_G1}, Lemma~\ref{lem:lipschitz_G2}, Lemma~\ref{lem:lipschitz_G3}, Lemma~\ref{lem:lipschitz_G4},
Lemma~\ref{lem:lipschitz_G5},
Lemma~\ref{lem:lipschitz_G6},
Lemma~\ref{lem:lipschitz_G7},
Lemma~\ref{lem:lipschitz_G8}, and 
Lemma~\ref{lem:lipschitz_G9}.
\end{proof}

\subsection{A Core Tool: Upper Bound for Several Basic Functions}\label{sub:lips_H_xx:upper_bound}

In this section, we analyze the upper bound of several basic functions.

\begin{lemma}[Lemma 8.9 in \cite{dls23} page 44 and Lemma 6.2 in \cite{gsx23_incontext} page 20]\label{lem:lower_bound_A:beta}
Provided that the subsequent requirements are satisfied
\begin{itemize}
    \item Let $\A \in \R^{n^2 \times d^2}$ satisfy $\max_{j_0 \in [n]}\| \A_{j_0} \| \leq R$
    \item Let $x \in \R^{d^2}$ satisfy that $\| x \|_2 \leq R $
    \item We define $u(x)$ as Definition~\ref{def:u} 
    \item Let $\beta$ be the greatest lower bound of $\langle u(x)_{j_0} , {\bf 1}_n \rangle$
\end{itemize}
Then we have
\begin{align*}
    \beta \geq \exp(-R^2).
\end{align*}
\end{lemma}

\begin{lemma}[Basic Functions Upper Bound]\label{lem:upper_bound}
If the following conditions hold,
\begin{itemize}
    \item Let $u(x)_{j_0} \in \R^n$ be defined as Definition~\ref{def:u}
    \item Let $\alpha(x)_{j_0} \in \R$ be defined as Definition~\ref{def:alpha}
    \item Let $f(x)_{j_0} \in \R^n$ be defined as Definition~\ref{def:f}
    \item Let $c(x,:)_{j_0,i_0} \in \R$ be defined as Definition~\ref{def:c}
    \item Let $\gamma(x)_{j_0} = \langle f(x)_{j_0}, v \rangle \in \R$
     \item Let $\beta$ be the greatest lower bound of $\langle u(x)_{j_0} , {\bf 1}_n \rangle$
    \item $\| A_1 \|, \| A_2 \| , \| A_3 \| \leq R$
    \item $\| \A_{j_0} \| \leq R$
    \item $\| x \|_2 \leq R$
    \item $| b_{j_0,i_0} | \leq R$  
    \item Let $R \geq 4$
    \item $\| v \|_2 \leq R^2$
\end{itemize}
Then we have: for all $x \in \R^{d^2}$ 
\begin{itemize}
    \item Part 1. $\| u(x)_{j_0} \|_2 \leq \sqrt{n} \cdot \exp(R^2)$
    \item Part 2. $| \alpha(x)_{j_0} | \leq n \exp(R^2)$
    \item Part 3. $| \alpha(x)_{j_0} |^{-1} \leq \exp(R^2)$
    \item Part 4. $\| f(x)_{j_0} \|_2 \leq 1$
    \item Part 5. $| \gamma(x)_{j_0} | \leq R^2$
    \item Part 6. $| c(x,:)_{j_0,i_0} | \leq 2R^2$
\end{itemize}
\end{lemma}
\begin{proof}
We present our proof as follows.

{\bf Proof of Part 1.}
We have
\begin{align*}
    \| u(x)_{j_0} \|_2 = & ~ \| \exp (\A_{j_0} x) \|_2 \\
    \leq & ~ \sqrt{n} \cdot \| \exp(\A_{j_0} x) \|_\infty \\ 
     \leq & ~ \sqrt{n} \cdot  \exp( \| \A_{j_0} x\|_2) \\
    \leq & ~ \sqrt{n} \cdot \exp(R^2)
\end{align*}
where the first step follows from Definition~\ref{def:u}, the second step is based on Fact~\ref{fac:vector_norm}, the third step follows from Fact~\ref{fac:vector_norm}, and the fourth step is because of $\| \A_{j_0} \| \leq R$ and $\| x \|_2 \leq R$ (see from the Lemma statement).

{\bf Proof of Part 2.}
We have  
\begin{align*}
    | \alpha(x)_{j_0} | = & ~ | \langle u(x)_{j_0}, {\bf 1}_n \rangle | \\
    \leq & ~ \sqrt{n} \cdot \| u(x)_{j_0} \|_2 \\
    \leq & ~ \sqrt{n} \cdot \sqrt{n} \cdot \exp(R^2) \\
    = & ~ n \exp(R^2) 
\end{align*}
where the first step is due to Definition~\ref{def:alpha}, the second is based on Fact~\ref{fac:vector_norm}, the third step follows from {\bf Part 1}. and the forth step follows from simple algebra.

{\bf Proof of Part 3.}

We have 
\begin{align*}
   | \alpha^{-1}(x)_{j_0} | = & ~ \frac{1}{\langle u(x)_{j_0} , {\bf 1}_n \rangle} \\
    \leq & ~ \frac{1}{\beta} \\
    \leq & ~ \exp(R^2)
\end{align*}
where the first step is because of Definition~\ref{def:alpha}, the second step follows from the definition of $\beta$ and the third step is due to Lemma~\ref{lem:lower_bound_A:beta}.

{\bf Proof of Part 4.}
We have
\begin{align*}
    \| f(x)_{j_0} \|_2 \leq & ~ \| f(x)_{j_0} \|_1 \\
    = & ~ 1
\end{align*}
where the first step follows from Fact~\ref{fac:vector_norm}, the second step is due to Definition~\ref{def:f} 

{ \bf Proof of Part 5.}
We have
\begin{align*}
    | \gamma(x)_{j_0} | = & ~ | \langle f(x)_{j_0}, v \rangle |\\
    \leq & ~\| f(x)_{j_0} \|_2 \cdot \| v \|_2 \\
    \leq & ~ 1 \cdot R^2 \\
    = & ~ R^2 
\end{align*}
where the first step follows from the definition of $\gamma(x)_{j_0}$ (see from the Lemma statement), the second step follows from Cauchy–Schwarz inequality, the third step follows from {\bf Part 2} and the upper bound for the $\ell_2$ norm of $v$ (from the Lemma statement), and the last step follows from simple algebra.

{\bf Proof of Part 6.}
We have
\begin{align*}
    |c(x,:)_{j_0,i_0}| = & ~ |\langle f(x)_{j_0}, v \rangle - b_{j_0,i_0}| \\
    \leq & ~ |\gamma_{j_0}(x) - b_{j_0,i_0}| \\
    \leq & ~ | \gamma_{j_0}(x) | + | b_{j_0,i_0}| \\
    \leq & ~ R^2 + R \\
    \leq & ~ 2R^2
\end{align*}
where the first step is based on Definition~\ref{def:c}, the second step is because of the definition of $\gamma_{j_0}(x)$, the third step follows from triangle inequality, the fourth step is based on {\bf Part 6} and $|b_{j_0,i_0}| \leq R$ (see from the Lemma statement), and the last step follows from $R \geq 1$.
\end{proof}

\subsection{A Core Tool: Lipschitz Property for Several Basic Functions}\label{sub:lips_H_xx:basic_lips}

In this section, we analyze the Lipschitz property of several basic functions.



\begin{lemma}[Basic Functions Lipschitz Property]\label{lem:basic_lips}
If the following conditions hold,
\begin{itemize}
    \item $\| v \|_2 \leq R^2$
    \item $\| \A_{j_0} \| \leq R$ 
     \item Let $\beta$ be the greatest lower bound of $\langle u(x)_{j_0} , {\bf 1}_n \rangle$
    \item Let $\beta^{-1} \leq \exp(R^2)$
    \item Let $R\geq 4$
    \item Let $\|x\|_2 \leq R$ and $\|\wt{x}\|_2 \leq R$.
\end{itemize}
Then, we have: for all $x, \wt{x} \in \R^{d^2}$
\begin{itemize}
    \item Part 1. $\| u(x)_{j_0} - u( \wt{x} )_{j_0}\|_2 \leq  \sqrt{n}  \exp(2 R^2) \cdot \| x - \wt{x} \|_2$
    \item Part 2. $| \alpha(x)^{-1} - \alpha^{-1}( \wt{x} ) | \leq  n  \exp(4 R^2) \cdot \| x - \wt{x} \|_2$
    \item Part 3. $\| f(x)_{j_0} - f(\wt{x})_{j_0} \|_2 \leq    n^{1.5} R \exp(6 R^2)  \cdot \| x - \wt{x} \|_2$
    \item Part 4. $| \gamma(x)_{j_0} - \gamma (\wt{x})_{j_0} | \leq   n^{1.5} \exp(7 R^2) \cdot \| x - \wt{x} \|_2$
    \item Part 5. $| c(x,:)_{j_0,i_0} - c(\wt{x},:)_{j_0,i_0} | \leq   n^{1.5} \exp(7 R^2) \cdot \| x - \wt{x} \|_2$
\end{itemize}
    
\end{lemma}
\begin{proof}

{\bf Proof of Part 1.}

We have
\begin{align*}
\| u(x)_{j_0} - u(\wt{x})_{j_0} \|_2
= & ~ \| \exp( \A_{j_0} x) - \exp( \A_{j_0} \wt{x}) \|_2 \\ 
\leq & ~ \exp(\| \A_{j_0}x \|_2 )  \cdot \| \A_{j_0} (x-\wt{x}) \|_{2} \notag \\
\leq & ~ \sqrt{n} \exp(R^2) \cdot \| \A_{j_0} (x-\wt{x}) \|_2 \notag \\
\leq & ~ \sqrt{n} \exp(R^2)  \cdot \| \A_{j_0} \| \cdot \| x - \wt{x} \|_2 \notag\\
\leq & ~ \sqrt{n} R \exp(R^2) \cdot \|x - \wt{x}\|_2,
% \leq & ~ \sqrt{n} \exp(2 R^2)\cdot \|x - \wt{x}\|_2 
\end{align*}
where the first step is due to Definition~\ref{def:u}, the second step is because of Fact~\ref{fac:vector_norm}, the third step is based on  Fact~\ref{fac:vector_norm}, the fourth step follows from Fact~\ref{fac:matrix_norm}, and fifth step is due to $\|\A_{j_0}\| \leq R$.

% We should have
% \begin{align*}
%     \exp(\| \A_{j_0}x \|_2 )  \cdot \| \A_{j_0} (x-\wt{x}) \|_{2}
%     \leq & ~ \exp(\| \A_{j_0}\| \|x \|_2 )  \cdot \| \A_{j_0} (x-\wt{x}) \|_{2}\\
%     \leq & ~ \exp( R^2 )  \cdot \| \A_{j_0} (x-\wt{x}) \|_{2}\\
% \end{align*}

% }

{\bf Proof of Part 2}

We have
\begin{align*}
    |\alpha(x)^{-1}_{j_0} - \alpha(\wt{x})^{-1}_{j_0}| \leq & ~ \alpha(x)^{-1} \alpha(\wt{x})^{-1} \cdot | \alpha(x) - \alpha(\wt{x})| \\
    \leq & ~ \beta^{-2} \cdot |\alpha(x) - \alpha(\wt{x})| \\
    \leq & ~ \beta^{-2} \cdot |\langle u(x)_{j_0} , {\bf 1}_n \rangle - \langle u(\wt{x})_{j_0}, {\bf 1}_n \rangle  | \\
    \leq & ~ \beta^{-2} \cdot \sqrt{n} \| u(x)_{j_0} - u(\wt{x})_{j_0} \|_2 \\
     \leq & ~  2 \beta^{-2} \cdot n R \exp(R^2)\|x - \wt{x}\|_2 \\
     \leq & ~ n \exp(4R^2) \cdot \|x - \wt{x}\|_2 
\end{align*}
where the first step is due to simple algebra, the second step is due to $\beta \geq \langle u(x)_{j_0}, {\bf 1}_n\rangle$, the third step follows from Definition of $\alpha(x)$ (see Definition~\ref{def:alpha}), the fourth step is based on Fact~\ref{fac:circ_rules} and Fact~\ref{fac:vector_norm}, the fifth step is because of {\bf Part 1}, and the sixth step follows from $R>4$ and $\beta^{-1} \leq \exp(R^2)$.


{\bf Proof of Part 3.}

We have
\begin{align} 
  \| f(x)_{j_0} - f(\wt{x})_{j_0} \|_2 \nonumber = & ~ \| \alpha(x)_{j_0}^{-1} u(x)_{j_0} - \alpha(\wt{x})_{j_0}^{-1} u(\wt{x})_{j_0} \|_2 \nonumber \\
    \leq & ~ \| \alpha(x)_{j_0}^{-1} u(x)_{j_0} - \alpha(\wt{x})_{j_0}^{-1} u(x)_{j_0} \|_2 + \| \alpha(\wt{x})_{j_0}^{-1} u(x)_{j_0} - \alpha(\wt{x})_{j_0}^{-1} u(\wt{x})_{j_0} \|_2 \nonumber \\
    = & ~ |\alpha(x)_{j_0}^{-1} - \alpha(\wt{x})_{j_0}^{-1} | \cdot \| u(x)_{j_0} \|_2 + | \alpha(\wt{x})_{j_0}^{-1} | \cdot \| u(x)_{j_0} -u(\wt{x})_{j_0} \|_2 \notag \\ 
    \leq & ~ n^{1.5} \exp(6R^2) \cdot \| x - \wt{x} \|_2 \notag 
\end{align}
where the first step is due to Definition~\ref{def:f}, the second step is based on triangle inequality, the third step follows from Fact~\ref{fac:vector_norm}, the fourth follows from combination of {\bf Part 1}, {\bf Part 2} and Lemma~\ref{lem:upper_bound}.

{\bf Proof of Part 4.}

We have 
\begin{align*}
    |\gamma_{j_0}(x) - \gamma_{j_0}(\wt{x})|= & ~ | \langle f(x)_{j_0}, v \rangle - \langle f(\wt{x})_{j_0}, v \rangle| \\
    \leq & ~ |\langle f(x)_{j_0} - f(\wt{x})_{j_0},v\rangle| \\
    \leq & ~ \| v \|_2 \cdot \| f(x)_{j_0} - f(\wt{x}) \|_2\\
    \leq & ~ n^{1.5} \exp(7R^2) \cdot \| x - \wt{x} \|_2
\end{align*}
where the first step is based on the definition of $\gamma_{j_0}(x)$, the second is because of Fact~\ref{fac:circ_rules}, the third step is due to Cauchy–Schwarz inequality, and the last step follows from {\bf Part 3}, $\| v \| \leq R^2$ and $R \geq 4$. 

{\bf Proof of Part 5.} 

We have 
\begin{align*}
    | c(x,:)_{j_0,i_0} - c(\wt{x},:)_{j_0,i_0} | = & ~ |\langle f(x)_{j_0}, v \rangle - \langle f(\wt{x})_{j_0}, v \rangle| \\
    \leq & ~  |\gamma_{j_0}(x) - \gamma_{j_0}(\wt{x})| \\
    \leq & ~ n^{1.5} \exp(7 R^2) \cdot \| x - \wt{x} \|_2 
\end{align*}
where the first step follows from Definition~\ref{def:c}, the second step is based on the definition of $\gamma_{j_0}(x)$ and the last step follows from {\bf Part 4}.
\end{proof}

For convenient, we define
\begin{definition}\label{def:R_0}
We define $R_0$ as follows
\begin{align*}
    R_0 := n^{1.5} \exp(10 R^2).
\end{align*}
\end{definition}

\subsection{Calculation: Step 1 Lipschitz for Matrix Function \texorpdfstring{$c(x,:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v )$}{}}\label{sub:lips_H_xx:step1}


In this section, we introduce our calculation of Lipschitz for $c(x,:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v )$.

\begin{lemma}\label{lem:lipschitz_G1}
If the following conditions
\begin{itemize}
    \item Let $G_1(x) = c(x,:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v )$ 
    \item Let $R_0$ be defined as Definition~\ref{def:R_0}
    \item Let $\A \in \R^{n^2 \times d^2}$ and $u(x)_{j_0} \in \R^n$ be defined as Definition~\ref{def:u}
    \item Let $\alpha(x)_{j_0} \in \R$ be defined as Definition~\ref{def:alpha}
    \item Let $f(x)_{j_0} \in \R^n$ be defined as Definition~\ref{def:f}
    \item Let $c(x,:)_{j_0,i_0} \in \R$ be defined as Definition~\ref{def:c}
    \item Let $\gamma(x)_{j_0} = \langle f(x)_{j_0}, v \rangle \in \R$
    \item $\| A_1 \|, \| A_2 \| , \| A_3 \| \leq R$, $\| \A_{j_0} \| \leq R$, $\| x \|_2 \leq R$,$| b_{j_0,i_0} | \leq R$, $\| v \|_2 \leq R^2$
    \item Let $R \geq 4$
\end{itemize}
Then, we have
\begin{align*}
    \|G_1(x) - G_1( \wt{x} ) \| \leq 10R^4 \cdot R_0 \cdot \|x - \wt{x} \|_2 
\end{align*}
\end{lemma}

\begin{proof}
    We define
    \begin{align*}
        G_{1,1} = & ~  c(x,:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v ) -  c(\wt{x},:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v )  \\
        G_{1,2} = & ~ 
         c(\wt{x},:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v ) - c(\wt{x},:)_{j_0,i_0} \cdot \diag( f(\wt{x})_{j_0} \circ v ) 
    \end{align*}
    we have
    \begin{align*}
         \| G_{1,1} \| = & ~ \| c(x,:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v ) -  c(\wt{x},:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v ) \|\\ 
         \leq & ~ | c(x,:)_{j_0,i_0} -  c(\wt{x},:)_{j_0,i_0} | \cdot \| \diag( f(x)_{j_0} \circ v )\| \\
         \leq & ~ R^2 \cdot | c(x,:)_{j_0,i_0} -  c(\wt{x},:)_{j_0,i_0} | \\
         \leq & ~ R^2  R_0 \cdot  \| x - \wt{x} \|_2
    \end{align*}
    where the first step is based on definition~$G_{1,1}$, the second step is due to Fact~\ref{fac:matrix_norm}, the third step follows from Lemma~\ref{lem:upper_bound}, and the fourth step is because of Lemma~\ref{lem:basic_lips}.
    
    Additionally, we have
    \begin{align*}
    \| G_{1,2} \| = & ~ \| c(\wt{x},:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v ) - c(\wt{x},:)_{j_0,i_0} \cdot \diag( f(\wt{x})_{j_0} \circ v ) \|\\
     \leq & ~ | c(\wt{x}, :)_{j_0,i_0} | \cdot \| v \|_2 \cdot \| \diag(f(x)_{j_0}) - \diag (f(\wt{x})_{j_0})\| \\
     \leq & ~ 2 R^4 \cdot \| f(x)_{j_0} - f( \wt{x})_{j_0} \|_2 \\
     \leq & ~  2 R^4 \cdot R_0  \cdot \| x - \wt{x} \|_2
    \end{align*}
    where the first step is because of definition of $G_{1,2}$, the second step is due to Fact~\ref{fac:matrix_norm}, the third step follows from Lemma~\ref{lem:upper_bound}, and the fourth step is because of Lemma~\ref{lem:basic_lips}.

Combining the above two equations, we complete the proof.
\end{proof}

\subsection{Calculation: Step 2 Lipschitz for Matrix Function \texorpdfstring{$-\gamma_{j_0}(x) \cdot c(x,:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v )$}{}}\label{sub:lips_H_xx:step2}

In this section, we introduce our calculation of Lipschitz for $-\gamma_{j_0}(x) \cdot c(x,:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v )$.


\begin{lemma}\label{lem:lipschitz_G2}
If the following conditions hold
\begin{itemize}
    \item Let $G_2(x) = -\gamma_{j_0}(x) \cdot c(x,:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v )$
    \item Let $\alpha(x)_{j_0} \in \R$ be defined as Definition~\ref{def:alpha}
        \item Let $f(x)_{j_0} \in \R^n$ be defined as Definition~\ref{def:f}
        \item Let $c(x,:)_{j_0,i_0} \in \R$ be defined as Definition~\ref{def:c}
        \item Let $\gamma(x)_{j_0} = \langle f(x)_{j_0}, v \rangle \in \R$
        \item Let $R \geq 4$
\end{itemize}
Then, we have
\begin{align*}
    \|G_2(x) - G_2(\wt{x}) \| \leq 10 R^4 \cdot R_0 \|x -\wt{x} \|_2 
\end{align*}
\end{lemma}

\begin{proof}
    We define
    \begin{align*}
        G_{2,1} = & ~ -\gamma_{j_0}(x) \cdot c(x,:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v ) - (-\gamma_{j_0}(\wt{x})) \cdot c(x,:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v )  \\
        G_{2,2} = & ~ 
        -\gamma_{j_0}(\wt{x}) \cdot c(x,:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v ) - (-\gamma_{j_0}(\wt{x})) \cdot c(\wt{x},:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v ) \\ 
       G_{2,3} =  & ~
       -\gamma_{j_0}(\wt{x}) \cdot c(\wt{x},:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v ) - (-\gamma_{j_0}(\wt{x})) \cdot c(\wt{x},:)_{j_0,i_0} \cdot \diag( f(\wt{x})_{j_0} \circ v ) 
    \end{align*}
    We have
    \begin{align*}
        \|G_{2,1}\| = & ~ \|(-\gamma_{j_0}(x)) \cdot c(x,:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v ) - (-\gamma_{j_0}(\wt{x})) \cdot c(x,:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v ) \|  \\
        \leq & ~ | \gamma_{j_0}(x) - \gamma_{j_0}(\wt{x}) | \cdot | c(x,:)_{j_0,i_0} | \cdot \| \diag( f(x)_{j_0} \circ v ) \|\\
        \leq & ~ 2 R^4 \cdot \| \gamma_{j_0}(x) - \gamma_{j_0}(\wt{x})\| \\
        \leq & ~ 2 R^4 \cdot R_0 \cdot \| x - \wt{x} \|_2,
    \end{align*}
     where the first step is because of definition of $G_{2,1}$, the second step is due to Fact~\ref{fac:matrix_norm}, the third step follows from Lemma~\ref{lem:upper_bound}, and the fourth step is because of Lemma~\ref{lem:basic_lips}.
     
    Additionally, we have 
    \begin{align*}
    \| G_{2,2} \| = & ~ 
        \| -\gamma_{j_0}(\wt{x}) \cdot c(x,:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v ) - (-\gamma_{j_0}(\wt{x})) \cdot c(\wt{x},:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v ) \| \\ 
         \leq & ~ \| \gamma_{j_0}(\wt{x}) \cdot \diag(f(\wt{x})_{j_0} \circ v)\| \cdot \|c(x,:)_{j_0,i_0} - c(\wt{x},:)_{j_0,i_0}  \| \\
         \leq & ~ R^4 \cdot |c(x,:)_{j_0,i_0} - c(\wt{x},:)_{j_0,i_0}  | \\
        \leq & ~ R^4 R_0 \cdot  \| x - \wt{x} \|_2
    \end{align*}
     where the first step is because of definition of $G_{2,2}$, the second step is due to Fact~\ref{fac:matrix_norm}, the third step follows from Lemma~\ref{lem:upper_bound}, and the fourth step is because of Lemma~\ref{lem:basic_lips}.

    Additionally, we have
    \begin{align*}
        \| G_{2,3} \|=  & ~
       \|-\gamma_{j_0}(\wt{x}) \cdot c(\wt{x},:)_{j_0,i_0} \cdot \diag( f(x)_{j_0} \circ v ) - (-\gamma_{j_0}(\wt{x})) \cdot c(\wt{x},:)_{j_0,i_0} \cdot \diag( f(\wt{x})_{j_0} \circ v ) \|\\
        \leq & ~ \| \gamma_{j_0}(\wt{x}) \| \cdot \| c(\wt{x},:)_{j_0,i_0} \| \cdot \| c(x,:)_{j_0,i_0} - c(\wt{x},:)_{j_0,i_0} \| \\
        \leq & ~ 2R^4 \cdot R_0 \cdot \| x - \wt{x} \|_2
    \end{align*}
     where the first step is because of definition of $G_{2,3}$, the second step is due to Fact~\ref{fac:matrix_norm}, the third step follows from Lemma~\ref{lem:upper_bound} and Lemma~\ref{lem:basic_lips}.
     
    Combining all the above equations finish the proof.
\end{proof}


\subsection{Calculation: Step 3  
 Lipschitz for Matrix Function \texorpdfstring{$ - 2 \gamma_{j_0}(x) \cdot   (f(x)_{j_0} \circ v ) f(x)_{j_0}^\top $}{}}\label{sub:lips_H_xx:step3}

In this section, we introduce our calculation of Lipschitz for $- 2 \gamma_{j_0}(x) \cdot   (f(x)_{j_0} \circ v ) f(x)_{j_0}^\top$.


 
\begin{lemma}\label{lem:lipschitz_G3}
    If the following conditions hold
    \begin{itemize}
        \item Let $G_3(x) = - 2 \gamma_{j_0}(x) \cdot   (f(x)_{j_0} \circ v ) f(x)_{j_0}^\top$.
        \item  Let $R_0$ be defined in Definition~\ref{def:R_0}.
         \item Let $\alpha(x)_{j_0} \in \R$ be defined as Definition~\ref{def:alpha}
        \item Let $f(x)_{j_0} \in \R^n$ be defined as Definition~\ref{def:f}
        \item Let $c(x,:)_{j_0,i_0} \in \R$ be defined as Definition~\ref{def:c}
        \item Let $\gamma(x)_{j_0} = \langle f(x)_{j_0}, v \rangle \in \R$
        \item $\| A_1 \|, \| A_2 \| , \| A_3 \| \leq R$, $\| \A_{j_0} \| \leq R$, $\| x \|_2 \leq R$,$| b_{j_0,i_0} | \leq R$, $\| v \|_2 \leq R^2$
        \item Let $R \geq 4$
    \end{itemize}
    
\end{lemma}

Then, we have
\begin{align*}
    \|G_3(x) - G_3(\wt{x}) \| \leq 10 R^4 \cdot R_0 \|x -\wt{x} \|_2
\end{align*}
\begin{proof}
    We define
    \begin{align*}
        G_{3,1} = & ~ - 2 \gamma_{j_0}(x) \cdot   (f(x)_{j_0} \circ v ) f(x)_{j_0}^\top - (- 2 \gamma_{j_0}(\wt{x}) \cdot   (f(x)_{j_0} \circ v ) f(x)_{j_0}^\top) \\
        G_{3,2} = & ~ - 2 \gamma_{j_0}(\wt{x}) \cdot   (f(x)_{j_0} \circ v ) f(x)_{j_0}^\top - (- 2 \gamma_{j_0}(\wt{x}) \cdot   (f(\wt{x})_{j_0} \circ v ) f(x)_{j_0}^\top) \\
        G_{3,3} = & ~ - 2 \gamma_{j_0}(\wt{x}) \cdot   (f(\wt{x})_{j_0} \circ v ) f(x)_{j_0}^\top - (- 2 \gamma_{j_0}(\wt{x}) \cdot   (f(\wt{x})_{j_0} \circ v ) f(\wt{x})_{j_0}^\top)
    \end{align*}

For $G_{3,1}$, we have
\begin{align*}
    \| G_{3,1} \| 
    \leq & ~ 2 \cdot | \gamma(x)_{j_0} - \gamma( \wt{x} )_{j_0} | \cdot \| f(x)_{j_0} \circ v \|_2 \cdot \| f(x)_{j_0} \|_2 \\
    \leq & ~ 2 R_0 \cdot R^2 \| x - \wt{x} \|_2
\end{align*}
where the first step is based on Fact~\ref{fac:matrix_norm} and the second step is due to Lemma~\ref{lem:upper_bound} and Lemma~\ref{lem:basic_lips}.

Similarly, we have
\begin{align*}
    \| G_{3,2} \| \leq 2 R_0 \cdot R^4 \| x - \wt{x} \|_2
\end{align*}
and
\begin{align*}
    \| G_{3,3} \| \leq 2R_0 \cdot R^4 \| x - \wt{x} \|_2
\end{align*}


\end{proof}

 \subsection{Calculation: Step 4  
 Lipschitz for Matrix Function \texorpdfstring{$ -c(x,:)_{j_0,i_0} \cdot   (f(x)_{j_0} \circ v ) f(x)_{j_0}^\top$}{}}\label{sub:lips_H_xx:step4}

In this section, we introduce our calculation of Lipschitz for $-c(x,:)_{j_0,i_0} \cdot   (f(x)_{j_0} \circ v ) f(x)_{j_0}^\top$.



 
\begin{lemma}\label{lem:lipschitz_G4}
If the following conditions hold
\begin{itemize}
     \item Let $\alpha(x)_{j_0} \in \R$ be defined as Definition~\ref{def:alpha}
    \item Let $f(x)_{j_0} \in \R^n$ be defined as Definition~\ref{def:f}
    \item Let $c(x,:)_{j_0,i_0} \in \R$ be defined as Definition~\ref{def:c}
    \item Let $\gamma(x)_{j_0} = \langle f(x)_{j_0}, v \rangle \in \R$
    \item $\| A_1 \|, \| A_2 \| , \| A_3 \| \leq R$, $\| \A_{j_0} \| \leq R$, $\| x \|_2 \leq R$,$| b_{j_0,i_0} | \leq R$, $\| v \|_2 \leq R^2$
    \item Let $R \geq 4$
    \item Let $G_{4}(x) = -c(x,:)_{j_0,i_0} \cdot   (f(x)_{j_0} \circ v ) f(x)_{j_0}^\top$
\end{itemize}
    Then, we have 
    \begin{align*}
        \|G_4(x) - G_4(\wt{x}) \| \leq 10 R^4 \cdot R_0 \|x -\wt{x} \|_2
    \end{align*}
\end{lemma}

\begin{proof}
    We define
    \begin{align*}
        G_{4,1} = & ~ 
        -c(x,:)_{j_0,i_0} \cdot   (f(x)_{j_0} \circ v ) f(x)_{j_0}^\top - (-c(\wt{x},:)_{j_0,i_0} \cdot   (f(x)_{j_0} \circ v ) f(x)_{j_0}^\top)\\
        G_{4,2} = & ~ 
        -c(\wt{x},:)_{j_0,i_0} \cdot   (f(x)_{j_0} \circ v ) f(x)_{j_0}^\top - (-c(\wt{x},:)_{j_0,i_0} \cdot   (f(\wt{x})_{j_0} \circ v ) f(x)_{j_0}^\top) \\
        G_{4,3} = & ~ -c(\wt{x},:)_{j_0,i_0} \cdot   (f(\wt{x})_{j_0} \circ v ) f(x)_{j_0}^\top - (-c(\wt{x},:)_{j_0,i_0} \cdot   (f(\wt{x})_{j_0} \circ v ) f(\wt{x})_{j_0}^\top)
    \end{align*}

For $G_{4,1}$, we have
\begin{align*}
    \| G_{4,1} \| \leq R^2 \cdot R_0 \cdot \| x - \wt{x} \|_2
\end{align*}
For $G_{4,2}$, we have
\begin{align*}
    \| G_{4,2} \| \leq 2 R^4 \cdot R_0 \cdot \| x - \wt{x} \|_2
\end{align*}
For $G_{4,3}$, we have
\begin{align*}
    \| G_{4,3} \| \leq 2 R^4 \cdot R_0 \cdot \| x - \wt{x} \|_2
\end{align*}
\end{proof}

  \subsection{Calculation: Step 5  
 Lipschitz for Matrix Function \texorpdfstring{$ - 2 \gamma_{j_0}(x)  \cdot  f(x)_{j_0} (f(x)_{j_0} \circ v)^\top$}{}}\label{sub:lips_H_xx:step5}

In this section, we introduce our calculation of Lipschitz for $- 2 \gamma_{j_0}(x)  \cdot  f(x)_{j_0} (f(x)_{j_0} \circ v)^\top$.


 
\begin{lemma}\label{lem:lipschitz_G5}
If the following conditions hold
\begin{itemize}
    \item Let $R_0$ be defined as Definition~\ref{def:R_0}
     \item Let $\alpha(x)_{j_0} \in \R$ be defined as Definition~\ref{def:alpha}
    \item Let $f(x)_{j_0} \in \R^n$ be defined as Definition~\ref{def:f}
    \item Let $c(x,:)_{j_0,i_0} \in \R$ be defined as Definition~\ref{def:c}
    \item Let $\gamma(x)_{j_0} = \langle f(x)_{j_0}, v \rangle \in \R$
    \item $\| A_1 \|, \| A_2 \| , \| A_3 \| \leq R$, $\| \A_{j_0} \| \leq R$, $\| x \|_2 \leq R$,$| b_{j_0,i_0} | \leq R$, $\| v \|_2 \leq R^2$
    \item Let $R \geq 4$
    \item Let $G_{5}(x) = - 2 \gamma_{j_0}(x)  \cdot  f(x)_{j_0} (f(x)_{j_0} \circ v)^\top$
\end{itemize}
    Then, we have
    \begin{align*}
        \|G_5(x) - G_5(\wt{x}) \| \leq 10R^4 \cdot R_0 \|x -\wt{x} \|_2
    \end{align*}
\end{lemma}
\begin{proof}
    This proof is similar to the proof of Lemma~\ref{lem:lipschitz_G3}, so we omit it here.
\end{proof}

  \subsection{Calculation: Step 6  
 Lipschitz for Matrix Function \texorpdfstring{$ - c(x,:)_{j_0,i_0} \cdot  f(x)_{j_0} (f(x)_{j_0} \circ v)^\top$}{}}\label{sub:lips_H_xx:step6}

In this section, we introduce our calculation of Lipschitz for $ - c(x,:)_{j_0,i_0} \cdot  f(x)_{j_0} (f(x)_{j_0} \circ v)^\top$.


 
\begin{lemma}\label{lem:lipschitz_G6}
If the following conditions hold
\begin{itemize}
     \item Let $\alpha(x)_{j_0} \in \R$ be defined as Definition~\ref{def:alpha}
    \item Let $f(x)_{j_0} \in \R^n$ be defined as Definition~\ref{def:f}
    \item Let $c(x,:)_{j_0,i_0} \in \R$ be defined as Definition~\ref{def:c}
    \item Let $\gamma(x)_{j_0} = \langle f(x)_{j_0}, v \rangle \in \R$
    \item $\| A_1 \|, \| A_2 \| , \| A_3 \| \leq R$, $\| \A_{j_0} \| \leq R$, $\| x \|_2 \leq R$,$| b_{j_0,i_0} | \leq R$, $\| v \|_2 \leq R^2$
    \item Let $R \geq 4$
    \item Let $G_{6}(x) = - c(x,:)_{j_0,i_0} \cdot  f(x)_{j_0} (f(x)_{j_0} \circ v)^\top$
\end{itemize}
    

    Then, we have
    \begin{align*}
        \|G_5(x) - G_5(\wt{x}) \| \leq 10 R^4 \cdot R_0  \|x -\wt{x} \|_2
    \end{align*}
\end{lemma}
\begin{proof}
    This proof is similar to the proof of Lemma~\ref{lem:lipschitz_G4}, so we omit it here.
\end{proof}


   \subsection{Calculation: Step 7  
 Lipschitz for Matrix Function \texorpdfstring{$ 2 \gamma_{j_0}(x) c(x,:)_{j_0,i_0}  \cdot f(x)_{j_0} f(x)_{j_0}^\top$}{}}\label{sub:lips_H_xx:step7}

In this section, we introduce our calculation of Lipschitz for $2 \gamma_{j_0}(x) c(x,:)_{j_0,i_0}  \cdot f(x)_{j_0} f(x)_{j_0}^\top$.

 
 \begin{lemma}\label{lem:lipschitz_G7}
 If the following conditions hold
 \begin{itemize}
     \item Let $\alpha(x)_{j_0} \in \R$ be defined as Definition~\ref{def:alpha}
    \item Let $f(x)_{j_0} \in \R^n$ be defined as Definition~\ref{def:f}
    \item Let $c(x,:)_{j_0,i_0} \in \R$ be defined as Definition~\ref{def:c}
    \item Let $\gamma(x)_{j_0} = \langle f(x)_{j_0}, v \rangle \in \R$
    \item $\| A_1 \|, \| A_2 \| , \| A_3 \| \leq R$, $\| \A_{j_0} \| \leq R$, $\| x \|_2 \leq R$,$| b_{j_0,i_0} | \leq R$, $\| v \|_2 \leq R^2$
    \item Let $R \geq 4$
    \item  Let $G_{7}(x) = 2 \gamma_{j_0}(x) c(x,:)_{j_0,i_0}  \cdot f(x)_{j_0} f(x)_{j_0}^\top$
 \end{itemize}
   

     Then, we have 
     \begin{align*}
         \|G_7(x) - G_7(\wt{x}) \| \leq 10 R^4 R_0 \|x -\wt{x} \|_2
     \end{align*}
 \end{lemma}
 \begin{proof}
     We define
     \begin{align*}
         G_{7,1} = & ~ 2 \gamma_{j_0}(x) c(x,:)_{j_0,i_0}  \cdot f(x)_{j_0} f(x)_{j_0}^\top - 2 \gamma_{j_0}(\wt{x}) c(x,:)_{j_0,i_0}  \cdot f(x)_{j_0} f(x)_{j_0}^\top \\
        G_{7,2} = & ~ 2 \gamma_{j_0}(\wt{x}) c(x,:)_{j_0,i_0}  \cdot f(x)_{j_0} f(x)_{j_0}^\top - 2 \gamma_{j_0}(\wt{x}) c(\wt{x},:)_{j_0,i_0}  \cdot f(x)_{j_0} f(x)_{j_0}^\top \\
        G_{7,3} = & ~ 2 \gamma_{j_0}(\wt{x}) c(\wt{x},:)_{j_0,i_0}  \cdot f(x)_{j_0} f(x)_{j_0}^\top - 2 \gamma_{j_0}(\wt{x}) c(\wt{x},:)_{j_0,i_0}  \cdot f(\wt{x})_{j_0} f(x)_{j_0}^\top \\
        G_{7,4} = & ~ 2 \gamma_{j_0}(\wt{x}) c(\wt{x},:)_{j_0,i_0}  \cdot f(\wt{x})_{j_0} f(x)_{j_0}^\top - 2 \gamma_{j_0}(\wt{x}) c(\wt{x},:)_{j_0,i_0}  \cdot f(\wt{x})_{j_0} f(\wt{x})_{j_0}^\top 
     \end{align*}
    For $G_{7,1}$, we have
    \begin{align*}
        \| G_{7,1} \| =  & ~ \|2 \gamma_{j_0}(x) c(x,:)_{j_0,i_0}  \cdot f(x)_{j_0} f(x)_{j_0}^\top - 2 \gamma_{j_0}(\wt{x}) c(x,:)_{j_0,i_0}  \cdot f(x)_{j_0} f(x)_{j_0}^\top \|\\
        \leq & ~ 2|\gamma_{j_0}(x) - \gamma_{j_0}(\wt{x})| \| c(x,:)_{j_0,i_0}  \cdot f(x)_{j_0} f(x)_{j_0}^\top \| \\
        \leq & ~2 R_0 \cdot|c(x,:)_{j_0,i_0} | \cdot \|f(x)_{j_0} \| \cdot \| f(x)_{j_0}^\top \| \| x - \wt{x} \|_2 \\
        \leq & ~ 2 R_0 \cdot 2R^2 \cdot \| x - \wt{x} \|_2
    \end{align*}
    where the first step is due to the definition of $G_{7,1}$, the second step is because of Fact~\ref{fac:matrix_norm}, the third step is based on {\bf Part 4} of Lemma~\ref{lem:basic_lips} and Fact~\ref{fac:matrix_norm}, and the last step comes from {\bf Part 4 and Part 6} of Lemma~\ref{lem:upper_bound}.
    
    Similarly, for $G_{7,2}$, we have
    \begin{align*}
        \| G_{7,2} \| \leq 2 R_0 \cdot R^2 \cdot \| x - \wt{x} \|_2
    \end{align*}
    
   For $G_{7,3}$, we have
    \begin{align*}
        \| G_{7,3} \| \leq 2 R_0 \cdot 2R^4 \cdot \| x - \wt{x} \|_2
    \end{align*}
    
    For $G_{7,4}$, we have
    \begin{align*}
        \| G_{7,4} \| \leq 2 R_0 \cdot 2R^4 \cdot \| x - \wt{x} \|_2
    \end{align*}
 \end{proof}



\subsection{Calculation: Step 8  
 Lipschitz for Matrix Function \texorpdfstring{$ \gamma_{j_0}(x)^2  \cdot f(x)_{j_0} f(x)_{j_0}^\top$}{}}\label{sub:lips_H_xx:step8}

In this section, we introduce our calculation of Lipschitz for $\gamma_{j_0}(x)^2  \cdot f(x)_{j_0} f(x)_{j_0}^\top$.




\begin{lemma}\label{lem:lipschitz_G8}
 If the following conditions hold
 \begin{itemize}
     \item Let $\alpha(x)_{j_0} \in \R$ be defined as Definition~\ref{def:alpha}
    \item Let $f(x)_{j_0} \in \R^n$ be defined as Definition~\ref{def:f}
    \item Let $c(x,:)_{j_0,i_0} \in \R$ be defined as Definition~\ref{def:c}
    \item Let $\gamma(x)_{j_0} = \langle f(x)_{j_0}, v \rangle \in \R$
    \item $\| A_1 \|, \| A_2 \| , \| A_3 \| \leq R$, $\| \A_{j_0} \| \leq R$, $\| x \|_2 \leq R$,$| b_{j_0,i_0} | \leq R$, $\| v \|_2 \leq R^2$
    \item Let $R \geq 4$
    \item Let $G_{8,1} =\gamma_{j_0}(x)^2  \cdot f(x)_{j_0} f(x)_{j_0}^\top $
 \end{itemize}
 

    Then, we have 
    \begin{align*}
         \|G_8(x) - G_8(\wt{x}) \| \leq 10 R^4 R_0 \|x -\wt{x} \|_2
    \end{align*}
\end{lemma}
\begin{proof}
    We define
    \begin{align*}
        G_{8,1} = & ~ \gamma_{j_0}(x) \gamma_{j_0}(x)  \cdot f(x)_{j_0} f(x)_{j_0}^\top - \gamma_{j_0}(\wt{x}) \gamma_{j_0}(x) \cdot f(x)_{j_0} f(x)_{j_0}^\top \\
         G_{8,2} = & ~ \gamma_{j_0}(\wt{x}) \gamma_{j_0}(x)  \cdot f(x)_{j_0} f(x)_{j_0}^\top - \gamma_{j_0}(\wt{x})^2  \cdot f(x)_{j_0} f(x)_{j_0}^\top \\
        G_{8,3} = & ~ \gamma_{j_0}(\wt{x})^2  \cdot f(x)_{j_0} f(x)_{j_0}^\top - \gamma_{j_0}(\wt{x})^2  \cdot f(\wt{x})_{j_0} f(x)_{j_0}^\top \\
        G_{8,4} = & ~ \gamma_{j_0}(\wt{x})^2  \cdot f(\wt{x})_{j_0} f(x)_{j_0}^\top - \gamma_{j_0}(\wt{x})^2  \cdot f(\wt{x})_{j_0} f(\wt{x})_{j_0}^\top 
    \end{align*}
    We can show that
    \begin{align*}
        \max_{i\in [4] }\| G_{8,i} \| \leq R^4 \cdot R_0 \cdot \| x - \wt{x} \|_2
    \end{align*}
\end{proof}
 
\subsection{Calculation: Step 9  
 Lipschitz for Matrix Function \texorpdfstring{$ (f(x)_{j_0} \circ v) \cdot ( f(x)_{j_0} \circ v )^\top$}{}}\label{sub:lips_H_xx:step9}

In this section, we introduce our calculation of Lipschitz for $(f(x)_{j_0} \circ v) \cdot ( f(x)_{j_0} \circ v )^\top$.




 
\begin{lemma}\label{lem:lipschitz_G9}
 If the following conditions hold
 \begin{itemize}
     \item Let $\alpha(x)_{j_0} \in \R$ be defined as Definition~\ref{def:alpha}
    \item Let $f(x)_{j_0} \in \R^n$ be defined as Definition~\ref{def:f}
    \item Let $c(x,:)_{j_0,i_0} \in \R$ be defined as Definition~\ref{def:c}
    \item Let $\gamma(x)_{j_0} = \langle f(x)_{j_0}, v \rangle \in \R$
    \item $\| A_1 \|, \| A_2 \| , \| A_3 \| \leq R$, $\| \A_{j_0} \| \leq R$, $\| x \|_2 \leq R$,$| b_{j_0,i_0} | \leq R$, $\| v \|_2 \leq R^2$
    \item Let $R \geq 4$
    \item  Let $G_{9}(x) = (f(x)_{j_0} \circ v) \cdot ( f(x)_{j_0} \circ v )^\top$
 \end{itemize}
  

    Then, we have 
    \begin{align*}
        \|G_9(x) - G_9(\wt{x}) \| \leq 10 R^4 R_0 \|x -\wt{x} \|_2
    \end{align*}
\end{lemma}
\begin{proof}
    We define 
    \begin{align*}
        G_{9,1} = & ~ (f(x)_{j_0} \circ v) \cdot ( f(x)_{j_0} \circ v )^\top  - (f(\wt{x})_{j_0} \circ v) \cdot ( f(x)_{j_0} \circ v )^\top \\
        G_{9,2} = & ~ (f(\wt{x})_{j_0} \circ v) \cdot ( f(x)_{j_0} \circ v )^\top  - (f(\wt{x})_{j_0} \circ v) \cdot ( f(\wt{x})_{j_0} \circ v )^\top
    \end{align*}
    We can show that
    \begin{align*}
        \max_{i \in [2]} \| G_{9,i} \| \leq R^4 \cdot R_0 \cdot \| x - \wt{x} \|_2
    \end{align*}
\end{proof}