
\section{Adversary}\label{app:adversary}

In this section, we provide the detailed proofs for the lemmas in Section~\ref{sec:adversary}.

{\bf Starting Point} In Section~\ref{sec:correctness}, we have already obtained a query algorithm with constant success probability for a fixed query point.

\begin{lemma}[Starting with constant probability, restatement of Lemma~\ref{lem:single_estimator}]\label{lem:single_estimator_app}
Given $\epsilon \in (0,0.1)$, a query point $q \in \R^d$ and a set of data points $X = \{ x_{i}\}_{i=1}^{n} \subset \R^d$, let  $f_{\mathsf{KDE}}^*(q) := \frac{1}{|X|} \sum_{x \in X} f(x,q)$ be
an estimator $\mathcal{D}$ can answer the query which satisfies:
\begin{align*}
(1-\epsilon) \cdot f_{\mathsf{KDE}}^*(q) \leq \mathcal{D}.\textsc{query}(q, \epsilon) \leq (1 + \epsilon)\cdot f_{\mathsf{KDE}}^*(q)
\end{align*}
with probability $0.9$.
\begin{align*}
\end{align*}
\end{lemma}

\begin{proof}
By Lemma~\ref{lem:unbias_query_formal} and Lemma~\ref{lem:variance_query_formal}, our \textsc{Query} procedure can provide an estimator that answers kernel density estimation correctly with constant probability. 
\end{proof}


\paragraph{Boost the constant probability to high probability.}

Next, we begin to boost the success probability by repeating the query procedure and taking the median output.

\begin{lemma}[Boost the constant probability to high probability, restatement of Lemma~\ref{lem:fixed_points}]\label{lem:fixed_points_app}
Let $\delta_1 \in (0,0.1)$ denote the failure probability. Let $\epsilon \in (0,0.1)$ denote the accuracy parameter.
Given $L = O( \log(1/\delta_1) )$  estimators $\{\mathcal{D}_j\}_{j=1}^{L}$. For each fixed query point $q \in \R^d$, the median of queries from $L$ estimators satisfies that:
\begin{align*}
    (1-\epsilon) \cdot f_{\mathsf{KDE}}^*(q) \leq & ~  \mathrm{Median}(\{\mathcal{D}_j.\textsc{query}(q, \epsilon)\}_{j=1}^{L})
    \\
    \leq & ~ (1 + \epsilon)\cdot f_{\mathsf{KDE}}^*(q)
\end{align*}
with probability $1 - \delta_1$.
\end{lemma}

\begin{proof}
From Lemma~\ref{lem:single_estimator} we know each estimator $\mathcal{D}_j$ can answer the query that satisfies:
\begin{align*}
(1-\epsilon) \cdot f_{\mathsf{KDE}}^*(q) \leq \mathcal{D}.\textsc{query}(q, \epsilon) \leq (1 + \epsilon)\cdot f_{\mathsf{KDE}}^*(q)
\end{align*}
with probability $0.9$.

From the chernoff bound we know the median of $L =O( \log(1/\delta_1))$ queries from $\{\mathcal{D}_j\}_{j=1}^{L}$ satisfies:
\begin{align*}
    (1-\epsilon) \cdot f_{\mathsf{KDE}}^*(q) \leq & ~ \mathrm{Median}(\{\mathcal{D}_j.\textsc{query}(q, \epsilon)\}_{j=1}^{L}) 
    \\
    \leq & ~ (1 + \epsilon)\cdot f_{\mathsf{KDE}}^*(q)
\end{align*}
with probability $1 - \delta_1$.

Therefore, we complete the proof.
\end{proof}



\paragraph{From each fixed point to all the net points.}

So far, the success probability of our algorithm is still for a fix point. We will introduce $\epsilon$-net on a unit ball and show the high success probability for all the net points. 

\begin{fact}\label{fac:number_of_net_points_app}
Let $N$ denote the $\epsilon_0$-net of $\{ x \in \R^d ~|~ \| x \|_2 \leq 1 \}$. We use $|N|$ to denote the number of points in $N$. Then $|N|\leq (10/\epsilon_0)^d$.
\end{fact}

This fact shows that we can bound the size of an $\epsilon$-net with an inverse of $\epsilon$. We use this fact to conclude the number of repetitions we need to obtain the correctness of \textsc{Query} on all net points.


\begin{lemma}[From each fixed points to all the net points, restatement of Lemma~\ref{lem:net_points}]\label{lem:net_points_app}
Let $N$ denote the $\epsilon_0$-net of $\{ x \in \R^d ~|~ \| x \|_2 \leq 1 \}$. We use $|N|$ to denote the number of points in $N$. Given $L = \log(|N|/\delta)$  estimators $\{\mathcal{D}_j\}_{j=1}^{L}$. 

With probability $1 - \delta$, we have: for all $q \in N$, the median of queries from $L$ estimators satisfies that:
\begin{align*}
   (1-\epsilon) \cdot f_{\mathsf{KDE}}^*(q) \leq & ~ \mathrm{Median}(\{\mathcal{D}_j.\textsc{query}(q, \epsilon)\}_{j=1}^{L})
   \\
   & ~ \leq (1 + \epsilon)\cdot f_{\mathsf{KDE}}^*(q).
\end{align*}
\end{lemma}

\begin{proof}
There are $|N|$ points on the $d$ dimension $\epsilon$-net when $\| q\|_2 \leq 1$. From Lemma~\ref{lem:fixed_points_app} we know that for each query point $q$ on $N$, we have :
\begin{align*}
    (1-\epsilon) \cdot f_{\mathsf{KDE}}^*(q) \leq & ~ \mathrm{Median}(\{\mathcal{D}_j.\textsc{query}(q, \epsilon)\}_{j=1}^{L}) 
    \\
    \leq & ~ (1 + \epsilon)\cdot f_{\mathsf{KDE}}^*(q)
\end{align*}
with probability $1 - \delta/|N|$.

By union bound all $|N|$ points on $N$, we have:
\begin{align*}
    \forall \| q\|_2 \leq 1 , ~~~  (1-\epsilon) \cdot f_{\mathsf{KDE}}^*(q) \leq & ~ \mathrm{Median}(\{\mathcal{D}_j.\textsc{query}(q, \epsilon)\}_{j=1}^{L}) 
    \\
    \leq & ~ (1 + \epsilon)\cdot f_{\mathsf{KDE}}^*(q)
\end{align*}
with probability $1 - \delta$.
\end{proof}

\paragraph{From net points to all points.}
With Lemma~\ref{lem:net_points_app}, we are ready to extend the correctness for net points to the whole unit ball. We demonstrate that all query points  
$\| q \|_2 \leq 1$ can be answered approximately with high probability in the following lemma.

\begin{lemma}[From net points to all points, restatement of Lemma \ref{lem:from_net_points_to_all_points}
]
Let $\epsilon \in (0,0.1)$. Let ${\cal L} \geq 1$. Let $\delta \in (0,0.1)$. Let $\tau \in [0,1]$. 
Given $L = O(\log(( \mathcal{L}/\epsilon \tau )^d/\delta))$  estimators $\{\mathcal{D}_j\}_{j=1}^{L}$, with probability $1 - \delta$, for all query points $\|p\|_2 \leq 1$,  we have the median of queries from $L$ estimators satisfies that:
\begin{align*}
    \forall \| p\|_2 \leq 1, ~~~ (1-\epsilon) \cdot f_{\mathsf{KDE}}^*(p) \leq & ~ \mathrm{Median}(\{\mathcal{D}_j.\textsc{query}(q, \epsilon)\}_{j=1}^{L})
    \\
    \leq & ~ (1 + \epsilon)\cdot  f_{\mathsf{KDE}}^*(p).
\end{align*}
where $q$ is the closest net point of $p$.

\end{lemma}

\begin{proof}

We define an event $\xi$ to be the following,
\begin{align*}
    \forall q \in N, ~~~ (1-\epsilon) \cdot f_{\mathsf{KDE}}^*(q) \leq & ~ \mathrm{Median}(\{\mathcal{D}_j.\textsc{query}(q, \epsilon)\}_{j=1}^{L}) 
    \\
    \leq & ~ (1 + \epsilon)\cdot f_{\mathsf{KDE}}^*(q)
\end{align*}

Using Lemma~\ref{lem:net_points_app} with $L= \log(|N|/\delta)$, we know that 
\begin{align*}
    \Pr[~\text{~event~} \xi \text{~holds~} ] \geq 1 - \delta
\end{align*}

Using Fact~\ref{fac:number_of_net_points_app}, we know that
\begin{align*}
    L
    = & ~ \log(|N|/\delta ) \\
    = & ~ \log( ( 10 /\epsilon_0 )^d / \delta )\\ 
    = & ~ \log((10 \mathcal{L}/\epsilon \tau )^d/\delta)
\end{align*}
where the last step follows from $\epsilon_0 = \epsilon \tau / \mathcal{L}$. 

We condition the above event $E$ to be held. (Then the remaining proof does not depend on any randomness, for each and for all becomes the same.)

For each point $p \notin N$, there exists a $q \in N$ such that
\begin{align}\label{eq:diff_p_q_app}
    \| p - q \|_2 \leq \epsilon_0
\end{align}
For each $p$, we know
\begin{align*}
    & ~ |\mathrm{Median}_j\mathcal{D}_j.\textsc{query}(q, \epsilon) - f_{\mathsf{KDE}}^*(p) | \\
    \leq & ~ |\mathrm{Median}_j\mathcal{D}_j.\textsc{query}(q, \epsilon)-f_{\mathsf{KDE}}^*(q)|+|f_{\mathsf{KDE}}^*(q)-f_{\mathsf{KDE}}^*(p)|\\
    \leq & ~  \epsilon f_{\mathsf{KDE}}^*(q)+\mathcal{L}\cdot \| p - q \|_2 \\
    \leq & ~ \epsilon(f_{\mathsf{KDE}}^*(p)+\mathcal{L}\epsilon_0) + \mathcal{L} \cdot \epsilon_0 \\
    \leq & ~ \epsilon (f_{\mathsf{KDE}}^*(p)+2\tau) 
\end{align*}
where the first step follows from Lipschitz, the second step follows from Eq.~\eqref{eq:diff_p_q_app}, the third step follows from $\epsilon_0 \leq \epsilon \tau / \mathcal{L}$.

 
Using $ \forall j \in [L]: \mathcal{D}_j.\textsc{query}(p, \epsilon) \geq \tau$, we have 
\begin{align*}
    (1-3\epsilon) \cdot f_{\mathsf{KDE}}^*(p)  \leq & ~ \mathrm{Median}(\{\mathcal{D}_j.\textsc{query}(q, \epsilon)\}_{j=1}^{L})
    \\
    \leq & ~ (1 +3 \epsilon)\cdot f_{\mathsf{KDE}}^*(p) .
\end{align*}
Rescaling the $\epsilon$ completes the proof.
\end{proof}

Thus, we obtain an algorithm that could respond to adversary queries robustly.





