\newpage\section{Follower's pessimistic manipulation}\label{proof:pessimistic tie-breaking rule}
We denote $\mQ(\mF) = \argmax_{a\in\mA}\mu_l(a,\mathcal{F}(a))$. Because several actions in $\mA$ may attain the same largest value of $\mu_l(a,\mathcal{F}(a))$, the set $\mQ(\mF)$ may contain more than one element. From the follower's perspective, in the pessimistic case the leader breaks the tie by playing $a^\prime = \argmin_{a\in \mQ(\mF)} \mu_f(a,\mathcal{F}(a))$. Assuming pessimistic tie-breaking is more reasonable when the leader uses a no-regret learning algorithm, since such a leader may not stably play a single action in $\mQ(\mF)$. It is therefore important for the follower to choose a manipulation strategy that maximizes its own long-run reward while taking the leader's tendency into account. When the follower assumes that the leader breaks ties pessimistically, the follower's optimization problem is
% \hp{can we add annotations}
\begin{equation}\label{eq: opt1}
\begin{aligned}
\max_{\mathcal{F}}  \min_{(a^\prime,b^\prime)\in \mA\times \mB} \quad & \mu_f(a^\prime,b^\prime) \\
\text{s.t.} \quad & a^\prime \in \argmax_{a\in \mA} \mu_l(a,\mF(a)) \\
\quad & b^\prime = \mF(a^\prime).
\end{aligned}
\end{equation}

We present Algorithm~\ref{alg:FM for opt1} for solving the optimization problem~\eqref{eq: opt1}; it is similar to Algorithm~\ref{alg:FMS}.

\begin{algorithm}[h!]
\caption{Follower's best manipulation towards a pessimistic leader}
\label{alg:FM for opt1}
\renewcommand{\algorithmicrequire}{\textbf{Input:}}
\renewcommand{\algorithmicensure}{\textbf{Output:}}
\begin{algorithmic}[1]
\REQUIRE Candidate set $\mathcal{K}=\mathcal{A} \times \mathcal{B}$, $\mathbf{H}=\{\}$, $\mu_l(\cdot,\cdot)$,  $\mu_f(\cdot,\cdot)$
% \WHILE{$\max_{a\neq a^\prime} \mu_l(a,\mathcal{F}(a))>\mu_l(a^\prime,b^\prime)$}
 \STATE Candidate manipulation pair $(a^\prime,b^\prime)=\argmax_{(a,b)\in\mathcal{K}}\mu_f(a,b)$
 \IF{$\mu_f(a_p,b_p)< \mu_f(a^\prime,b^\prime)$}
 \STATE $\mathcal{F}=\{\mathcal{F}(a^\prime)=b^\prime\}\cup\{\mathcal{F}(a)=\argmin_{b\in\mathcal{B}}\mu_l(a,b): a\neq a^\prime\}$
 \STATE Let $\mathbf{Q} = \{(a,\mathcal{F}(a)) : a\in\argmax_{\tilde{a}\in\mathcal{A}} \mu_l(\tilde{a},\mathcal{F}(\tilde{a}))\}$
 \IF{$(a^\prime,b^\prime) \in \mathbf{Q}$}
 \STATE Denote the current $\mF$ as $\mF_{a_p,b_p}$, update $\mathbf{H}\leftarrow\mathbf{H}\cup \argmin_{(a,b)\in \mathbf{Q}} \mu_f(a,b)$, and set $(a_p,b_p)=\argmax_{(a,b)\in \mathbf{H}} \mu_f(a,b)$
 \ENDIF
 \STATE Eliminate $(a^\prime,b^\prime)$ from the candidate set: $\mathcal{K}\leftarrow \mathcal{K} \setminus \{(a^\prime,b^\prime)\}$ and return to Line 1
 \ELSE
 \STATE $\mathcal{F}_{opt}=\mF_{a_p,b_p}$
 \ENDIF
\ENSURE The response function $\mathcal{F}_{opt}$
\end{algorithmic}
\end{algorithm}
