\paragraph{Roadmap.}


Section~\ref{app:preli} presents the basic definitions and lemmas. 
Section~\ref{app:technical} presents the technical claims for the proof of our main result. 
Section~\ref{app:data} consists of four subsections: Initialize part, Update part, Query part, and LSH part of our data structure. Each subsection presents the corresponding algorithm and the proof of its running time. 
We provide a proof sketch for correctness in Section~\ref{sec:correctness}.  
Section~\ref{app:correctness} presents the detailed proof of the correctness of our data structure. 
Section~\ref{app:adversary} presents how to change our algorithm into an adaptive algorithm. 
Section~\ref{sec:technical} presents the technical claims of this paper. 
% Section~\ref{app:lipschitz} presents the Lipschitz property of the kernel function. 
Section~\ref{app:discussion} presents a more elaborate discussion of our work.
 

\section{Preliminaries}\label{app:preli}


The goal of this section is to introduce some basic definitions (Section~\ref{app:preli:definition}) and lemmas (Section~\ref{app:preli:lemma}) that will be used to prove the main result.

\subsection{Definitions}\label{app:preli:definition}


We start by recalling the definition of geometric weight level.
\begin{definition}[Restatement of Definition~\ref{def:level}, Geometric Weight Levels]\label{def:level_re}
Fix $R \in\mathbb{N}_+$ and $q\in\R^d$. 
We define
\begin{align*}
    w_i:=f(x_i,q)
\end{align*}

For any fixed $r \in[R]:=\{1,2,\cdots,R\}$, we define  
\begin{align*}
    L_{r}:=\{x_{i}\in X ~|~ w_{i}\in(2^{-r},2^{-r+1}]\}
\end{align*}

We define the corresponding distance levels as
\begin{align*}
    z_r:=\max_{z \,:\, f(z)\in(2^{-r},2^{-r+1}]} z,
\end{align*}
where $f(z):=f(x,q)$ for $z=\|x-q\|_2$.  

In addition, we define $L_{R+1}:=X\setminus \bigcup_{ r \in [R] } L_{r}$.
\end{definition}

We restate the definition and some properties of Locality Sensitive Hashing.

\begin{definition}[Restatement of Definition~\ref{def:LSH_family}, Locality Sensitive Hashing]\label{def:LSH_family_re}
A family $\mathcal{H}$ is called $(p_\mathrm{near},p_\mathrm{far},z,c)$-sensitive, where $p_\mathrm{near},p_\mathrm{far}\in [0,1]$, $z \in\mathbb{R}$, and $c\geq 1$, if for any $x,q\in\mathbb{R}^d$:
\begin{itemize}
    \item $\Pr_{h\sim\mathcal{H}}[h(x)=h(q)~|~\| x-q\|_2\leq z]\geq p_\mathrm{near}$
    \item $\Pr_{h\sim\mathcal{H}}[h(x)=h(q)~|~\| x-q\|_2\geq cz]\leq p_{\mathrm{far}}$
\end{itemize}

\end{definition}

\subsection{Lemmas}\label{app:preli:lemma}

\begin{lemma}[Lemma 3.2 in page 6  
of \cite{ai06}]\label{lem:p_app}
Let $(a, b) \in \R^d \times \R^d$. For any fixed $z > 0$, there is
a hash family $\mathcal{H}$ such that, if $p_\mathrm{near}:=p_1(z):=\Pr_{h\sim\mathcal{H}}[h(a)=h(b)~|~\| a-b\|_2\leq z]$ and $p_\mathrm{far}:=p_2(z,c):=\Pr_{h\sim\mathcal{H}}[h(a)=h(b)~|~\| a-b\|_2\geq cz]$, 
% \Junze{The above 2 places: $\| a-b\|$ should be $\| a-b\|_2$}\Junze{Done.}
then
\begin{align*}
    \rho :=\frac{\log {1}/{p_\mathrm{near}}}{\log {1}/{p_\mathrm{far}}}\leq \frac{1}{c^2}+O(\frac{\log t}{t^\frac{1}{2}})
\end{align*}
for any $c\geq 1, t > 0$, where $p_\mathrm{near}\geq e^{-O(\sqrt{t})}$ and it requires $dt^{O(t)}$ time to evaluate.

\end{lemma}

\begin{remark}\label{rmk:p_near_app}
We find an upper bound for our definition of $\rho$ and evaluation time for hashing. For the rest of the paper, we set $t=\log^{\frac{2}{3}}n$. Thus we obtain $n^{o(1)}$ evaluation time and $\rho = \frac{1}{c^2}+o(1)$. Since $c=O(\log^\frac{1}{7}n)$, we have\footnote{The three $o(1)$ terms in this remark can be $\frac{\log \log^\frac{2}{3}n}{\log ^\frac{1}{3}n}, \frac{\log \log^\frac{2}{3}n}{\log ^\frac{1}{3}n}, \frac{\log \log^\frac{2}{3}n}{\log ^\frac{1}{21}n}$ respectively.}
\begin{align*}
    \frac{1}{\frac{1}{c^2}+O(\frac{\log t}{t^\frac{1}{2}})}=c^2(1-o(1)).
\end{align*}
\end{remark}

In the next lemma, we show the existence of an LSH family that can separate the near points and the far points from the query with high probability.

\begin{lemma}[probability bound for separating points in different level sets, formal version of Lemma~\ref{lem:LSH}]\label{lem:LSH_formal}
 

Given kernel function $f$, we have corresponding weight level sets $L_r$'s and distance levels $z_r$'s (Definition~\ref{def:level}). Given query $q\in\R^d$ and integer $i\in [R+1]$, $r\in[R]$ satisfying $i>r$, let $x\in L_r$, $x^\prime \in L_i, c_{i,r}:=\min\{\frac{z_{i-1}}{z_r},\log^{1/7}n\}$. We set up an Andoni-Indyk LSH family $\mathcal{H}$ (Definition~\ref{def:LSH_family}) with near distance $z_r$. 

We define
\begin{align*}
    p_{\mathrm{near},r}&~:=\Pr_{h\sim\mathcal{H}}[h(x)=h(q)~|~\| x-q\|_2\leq z_r]\\
    p_{\mathrm{far},r}&~:=\Pr_{h\sim\mathcal{H}}[h(x)=h(q)~|~\| x-q\|_2\geq c_{i,r}z_r]
\end{align*}

Then the following inequalities hold for any integer $k \in \mathbb{N}_+$:
\begin{enumerate}
    \item $\Pr_{h^*\sim \mathcal{H}^k}[~h^*(x)=h^*(q)~]\geq p_{\mathrm{near},r}^k$
    \item $\Pr_{h^*\sim \mathcal{H}^k}[~h^*(x^\prime)=h^*(q)~]\leq p_{\mathrm{near},r}^{kc_{i,r}^2(1-o(1))}$
\end{enumerate}
 
\end{lemma}
\begin{proof}
Since $x\in L_r$, by Definition~\ref{def:level}, we have
\begin{align}\label{eq:p_r_j}
    \|x-q\|_2\leq z_r
\end{align}
For $x^\prime \in L_i$, since we assume that $f$ is a decaying radial kernel, we have
\begin{align}\label{eq:p_prime_r_j}
    \|x^\prime-q\|_2\geq z_{i-1}\geq c_{i,r}z_r
\end{align}

where the first step follows from Definition~\ref{def:level}, and the last step follows from $c_{i,r} \leq \frac{z_{i-1}}{z_r}$, which holds by the definition of $c_{i,r}$. 

By Lemma~\ref{lem:p} and Eq.~\eqref{eq:p_r_j}, Eq.~\eqref{eq:p_prime_r_j}, we have
\begin{enumerate}
    \item $\Pr_{h\sim \mathcal{H}}[h(x)=h(q)]\geq p_{\mathrm{near},r}$
    \item $\Pr_{h\sim \mathcal{H}}[h(x^\prime)=h(q)]\leq p_{\mathrm{far},r}$
\end{enumerate}

By Remark~\ref{rmk:p_near}, we have
\begin{align}\label{eq:p_far_leq_p_near}
    p_{\mathrm{far},r}\leq p_{\mathrm{near},r}^{c_{i,r}^2(1-o(1))}
\end{align}

Then for any integer $k\geq 1$, we have
\begin{align*}
    \Pr_{h^*\sim \mathcal{H}^k}[h^*(x)=h^*(q)]&~\geq~p_{\mathrm{near},r}^k\\
\Pr_{h^*\sim \mathcal{H}^k}[h^*(x^\prime)=h^*(q)]&~\leq~p_{\mathrm{far},r}^{k}
\end{align*}

By Eq.~\eqref{eq:p_far_leq_p_near}, we obtain the final result
\begin{enumerate}
    \item $\Pr_{h^*\sim \mathcal{H}^k}[h^*(x)=h^*(q)]\geq p_{\mathrm{near},r}^k$
    \item $\Pr_{h^*\sim \mathcal{H}^k}[h^*(x^\prime)=h^*(q)]\leq p_{\mathrm{near},r}^{kc_{i,r}^2(1-o(1))}$
\end{enumerate}

Thus, we complete the proof.
\end{proof}

 


