%\documentclass{uai2023} % for initial submission
\documentclass[accepted]{uai2023} % after acceptance, for a revised
                                    % version; also before submission to
                                    % see how the non-anonymous paper
                                    % would look like
%% There is a class option to choose the math font
% \documentclass[mathfont=ptmx]{uai2023} % ptmx math instead of Computer
                                         % Modern (has noticable issues)
% \documentclass[mathfont=newtx]{uai2023} % newtx fonts (improves upon
                                          % ptmx; less tested, no support)
% NOTE: Only keep *one* line above as appropriate, as it will be replaced
%       automatically for papers to be published. Do not make any other
%       change above this note for an accepted version.

%% Choose your variant of English; be consistent
\usepackage[american]{babel}
% \usepackage[british]{babel}

%% Some suggested packages, as needed:
\usepackage{natbib} % has a nice set of citation styles and commands
    \bibliographystyle{plainnat}
    \renewcommand{\bibsection}{\subsubsection*{References}}
\usepackage{mathtools} % amsmath with fixes and additions
% \usepackage{siunitx} % for proper typesetting of numbers and units
\usepackage{booktabs} % commands to create good-looking tables
\usepackage{tikz} % nice language for creating drawings and diagrams

%% Provided macros
% \smaller: Because the class footnote size is essentially LaTeX's \small,
%           redefining \footnotesize, we provide the original \footnotesize
%           using this macro.
%           (Use only sparingly, e.g., in drawings, as it is quite small.)
\usepackage{amssymb}
\usepackage{bm}
\usetikzlibrary{quantikz}
\usepackage[ruled,linesnumbered]{algorithm2e}
\usepackage{algorithmic}
\usepackage[switch]{lineno}
\usepackage{accents}
\usepackage{amsthm}
%\usepackage{tikz}
%\usetikzlibrary{calc,positioning}

%% Self-defined macros
%\newcommand{\swap}[3][-]{#3#1#2} % just an example
\newtheorem{theorem}{Theorem}
\newtheorem{lemma}{Lemma}
\newtheorem{techlemma}{Technical Lemma}
\newtheorem{corollary}{Corollary}
\newtheorem{proposition}{Proposition}
\newtheorem{example}{Example}

\renewcommand{\topfraction}{0.9}
\renewcommand{\floatpagefraction}{0.9}
\renewcommand{\textfraction}{0.1}

\newcommand{\BibTeX}{\rm B\kern-.05em{\sc i\kern-.025em b}\kern-.08em\TeX}
\newcommand{\zero}{|0\rangle}
\newcommand{\one}{|1\rangle}
\newcommand{\x}{|x\rangle}
\newcommand{\hn}{\accentset{\circ}{n}}
\newcommand{\hist}{\text{\rm \textbf{hist}}}
\newcommand{\hhist}{\widehat{\hist}}
\newcommand{\thist}{\overline{\hist}}
\newcommand{\calV}{\mathcal{V}}
\newcommand{\calG}{\mathcal{G}}
\newcommand{\calH}{\mathcal{H}}
\newcommand{\MOV}{\text{\rm MoV}}
\newcommand{\NMOV}{\text{\rm NMoV}_{\text{Q}}}
\newcommand{\NMOVC}{\text{\rm NMoV}_{\text{C}}}
\newcommand{\llceil}{\left\lceil}
\newcommand{\rrceil}{\right\rceil}
\newcommand{\lnorm}{\left|\left|}
\newcommand{\rnorm}{\right|\right|}
\newcommand{\qps}{\rm QPS}
\newcommand{\tone}{s}
\newcommand{\score}{\text{Score}}
\newcommand{\vv}{\boldsymbol{V}}
\newcommand{\SM}{\rm SM}
\newcommand{\NSM}{\rm NSM}
\newcommand{\prc}{\Pr\left[\text{\rm correct}\right]}
\newcommand{\nwi}{n_{\text{\rm win}}}
\newcommand{\nlo}{n_{\text{\rm lose}}}
\newcommand{\cp}{{\text{\rm Cap}}}

\newcommand\lirong[1]{{\color{red} \footnote{\color{red}Lirong: #1}} }
\newcommand\qishen[1]{{\color{blue} \footnote{\color{blue}Qishen: #1}} }
\newcommand\ao[1]{{\color{cyan}Ao: #1} }

\title{Accelerating Voting by Quantum Computation}

% The standard author block has changed for UAI 2023 to provide
% more space for long author lists and allow for complex affiliations
%
% All author information is authomatically removed by the class for the
% anonymous submission version of your paper, so you can already add your
% information below.
%
% Add authors
\author[1]{\href{mailto:<aoliu.cs@gmail.com>?Subject=Your UAI 2023 paper}{Ao Liu}{}}
\author[1]{Qishen Han}
\author[1]{Lirong Xia}
\author[2]{Nengkun Yu}
% Add affiliations after the authors
\affil[1]{%
    Department of Computer Science\\
    Rensselaer Polytechnic Institute\\
    Troy, NY, USA
}
\affil[2]{%
    Department of Computer Science\\
    Stony Brook University\\
    Stony Brook, NY, USA
}
  
\begin{document}

\maketitle

\begin{abstract}
Studying the computational complexity and designing fast algorithms for determining winners under voting rules are classical and fundamental questions in computational social choice. In this paper, we accelerate voting by leveraging quantum computation: we propose a quantum-accelerated voting algorithm that can be applied to any anonymous voting rule. We  show that our algorithm can be quadratically faster than any classical algorithm (based on sampling with replacement) under a wide range of common voting rules, including positional scoring rules, Copeland, and single transferable voting (STV). Precisely, our quantum-accelerated voting algorithm outputs the correct winner with high probability in  $\Theta\left(\frac{n}{\MOV}\right)$ time, where $n$ is the number of votes and $\MOV$ is {\em margin of victory}, the smallest number of voters to change the winner. In contrast, any classical voting algorithm based on sampling with replacement requires  $\Omega\left(\frac{n^2}{\MOV^2}\right)$ time under a large class of voting rules. Our theoretical results are supported by experiments under plurality, Borda, Copeland, and STV. 

% In this paper, we propose a quantum algorithm for majority voting. We prove that the runtime of quantum majority voting could be quadratically smaller than its classical algorithms, which is supported by our experimental studies.
%Voting has been largely applied in complex systems to make high-frequency and large-scale decisions. These scenarios create requirements for fast voting algorithms where small errors are acceptable. Existing voting algorithms are usually at least in linear time and cannot satisfy the fast computing requirements. \lirong{I suggest removing this paragraph.}
\end{abstract}

%\linenumbers

\section{Introduction}
Driven by the critical public need  of revolutionalizing modern democratic systems~\citep{mancini2015time,brill2018interactive}, voting has been   widely applied in many collective decision-making scenarios beyond political elections. Examples include search engines~\citep{dwork2001rank}, crowdsourcing~\citep{mao2013better}, database management~\citep{Belardinelli_2019}, and blockchain governance~\citep{grossi2022social}, just to name a few. In such large-scale, high-frequency collective decision-making scenarios, it is desirable that the winner is computed as soon as possible, ideally in sub-linear time in the number of votes, and perhaps at a (small) cost of its correctness. In fact, the study of computational complexity and algorithmic aspects of voting rules has been a key topic of {\em computational social choice}~\citep{brandt2016handbook}. 


% In recent years, the classical methodology of voting has been increasingly applied in high-frequency decision-making in the AI domain~\citep{Xia2019:Learning}. 
% % Voting is a widely used methodology to make collective decisions in a wide range of applications~\citep{Xia2019:Learning}\qishen{bad ref: change to voting into more scenarios.}.
% Voting has been discovered to be a powerful tool in many complex systems, 
% such as search engine~\citep{dwork2001rank}, crowdsourcing~\citep{mao2013better}, computer vision~\citep{Zhang2011CUDA},  and blockchain governance~\citep{Abramowitz2021:Democratic,grossi2022social}, just to name a few. These applications of voting in large-scale and high-frequency scenarios create an urgent requirement for fast voting, i.e. computing the winner in a short amount of time. Although many voting rules, such as plurality and single transferable vote (STV), can be computed in polynomial time, this is still too slow in large-scale systems like databases. As many such scenarios are low-stakes,  randomized algorithms, and small ``errors'' are acceptable. 

% \begin{example}
% \label{ex:motive}
% An application of voting is database management. For example, a database is created from multiple sources, and a voting algorithm is applied to aggregate the information and ensure the consistency of the new database~\citep{Belardinelli_2019}. For a large database, such aggregating procedure contains thousands of votes, each incorporating a mass of information, and a linear voting scheme would still be too time-costly. On the other hand, the database is able to tolerate a certain level of inconsistency through its self-examination protocol. Can we design a fast-voting algorithm for the database while preserving high accuracy? 
% \end{example}

One natural approach is to randomly sample a subset of votes (with or without replacement) and compute the winner of the sampled votes. The idea can be dated back to Venetian elections in the 13th century~\citep{walsh2012lot} and has recently attracted much attention from the computational social choice community~\citep{Bhattacharyya2021sample,Flanigan2020sortition,flanigan2021fair}. However, the performance of a sampling algorithm is restricted by the number of samples needed to guarantee a certain level of correctness, which determines its runtime. Specifically, the runtime of a sampling algorithm would be quadratically related to the number of votes (see Table~\ref{tab:summary1}). Is there a faster algorithm, for example, sub-linear to the number of votes, that still preserves a high probability of correctness? %\lirong{mention the bound in previous work, otherwise people do not know what is the baseline we compare to.}

Quantum computation appears to be a promising approach, as it has successfully accelerated many computational tasks such as  search~\citep{10.1145/237814.237866}, optimization~\citep{hogg2000quantum}, and machine learning~\citep{PhysRevA.94.022308,AJAGEKAR2020107119,AJAGEKAR2021117628}. However, we are not aware of previous work on accelerating voting using quantum computation. Thus, the following problem remains open. 
\begin{center}
    \textbf{Can voting be accelerated by quantum computation?}
\end{center}

% \lirong{say that by ``accelated'', we want to design sublinear algorithm.}
We address this question with YES both theoretically and experimentally. We accelerate voting by designing a sub-linear quantum-accelerated voting algorithm where a small probability of ``errors'' is allowed, which outperforms the classical sampling-based voting algorithms.
Our contributions are three-fold. First, we propose the quantum-accelerated voting algorithm (Algorithm~\ref{alg:quantum_multi}). Our algorithm leverages the widely-used techniques of quantum counting~\citep{Brassard1998counting} to generate the histogram of the votes. The simple architecture guarantees that our algorithm will be easy to implement in the future. Second, we theoretically prove that our algorithm is quadratically faster than any classical sampling-based algorithm for many common voting rules, including positional scoring rule, STV, Copeland, and maximin (see Table~\ref{tab:summary1}). Third, we experimentally verify our theoretical results under the plurality, Borda, Copeland, and STV (Section~\ref{sec:exp}). In Section~\ref{sec:heuristic}, we provide heuristics that may further improve the performance of quantum-accelerated voting. 

\begin{table}[htp]
    \centering
    %\resizebox{.7\textwidth}{!}{
    \begin{tabular}{cccc}
    \toprule
         & Runtime & Space Requirement\\ \hline
        {Quantum} (Thm.~\ref{thm:gsr}) &  {$\Theta\left(\frac{n}{\MOV}\right)$} & {$\Theta\left(\log(\frac{n}{\MOV})\right)$}\\
        Classical (Thm.~\ref{thm:classical}) & $\Omega\left(\frac{n^2}{\MOV^2}\right)$ & $\Omega\left(\log(\frac{n^2}{\MOV^2})\right)$\\
    \bottomrule
    \end{tabular}%}
    \caption{Summary for the theoretical results, where $n$ is the number of votes, and $\MOV$ is the margin of victory. All results in the table assume a constant error rate (\emph{e.g.,} $1\%$).}\label{tab:summary1}
\end{table}

Our quantum-accelerated voting algorithm accelerates voting most significantly in the case where the margin of victory is sub-linear in $n$, \emph{e.g.,}  $\MOV = \Theta(n^c)$ with $c \in (0, 1)$. In this case, $\MOV$ is relatively small compared with $n$, and a $\Theta (\frac{n}{\MOV})$ acceleration from classical to quantum algorithm is significant. The ratio $\frac{n}{\MOV} = \Theta ( n^{1 -c})$ implies that the algorithm is sub-linear. See Section~\ref{sec:compare} for detailed discussions. %a detailed explanation of when quantum computation accelerates.

% \lirong{IMPORTNAT: add more discussions about our alg. Under which conditions is it good? Think about it, the current version of the paper never explicitly address the question. We still don't know if the alg is sub linear time.}
 
\noindent\textbf{Related works and discussions. } To the best of our knowledge, our work is the first to use quantum computation to accelerate voting. \citet{vaccaro2007quantum}introduced the idea of quantum  computation to voting. The quantum voting algorithm in \citet{vaccaro2007quantum} provides security guarantees (against colluding attacks~\citep{lian2009handbook}). \citet{xue2017simple} improved the result in~\citet{vaccaro2007quantum} by proposing a simpler voting protocol but with stronger security guarantees. \citet{khabiboulline2021efficient} focuses on achieving anonymity without losing security guarantees. However, all approaches above require $\Omega(n)$ quantum communication cost and thus take $\Omega(n)$ time.%\lirong{modified. is it correct?}

There is a large literature on efficient (classical) algorithms for the winner determination problem. \citet{Wang2019PUT} purposed fast algorithms to compute winners in ranked pairs and STV under parallel-universes tiebreaking~\citep{conitzer2009preference}, which is known to be NP-complete. Various papers have shown that the winner of Dodgson rule, while is NP-hard to compute in the worst case~\citep{bartholdi1989voting}, can be efficiently computed with high probability when the ranking is generated $i.i.d.$~\citep{mccabe2008approximability, homan2009guarantees} and under semi-random models~\citep{xia2022beyond}. This line of work focuses on designing algorithms for NP-hard winner determination problems, while our paper focuses on further accelerating voting whose winner determination problem is in P. %Most of these works focus on providing efficient algorithms for the NP-hard winner determination problem, instead of fast voting. 

\section{Preliminaries}\label{sec:prelim}
\textbf{VOTING.}\\
In voting, $n > 1$ voters cast their votes on $m > 1$ candidates. The candidates are denoted as $c_1,\cdots,c_m$. A vote represents a voter's preference towards the candidates, which is a full-ranking (linear order) over candidates. Since there are $m!$ types of full rankings for $m$ candidates, a vote can be represented as an $m!$-dimensional unit vector. That means if the vote is the $j$-th type, the $j$-th dimension of the vector is $1$, and all other dimensions are $0$'s. The vote of the $i$-th voter is denoted as $\vv_i = \left(V_{i,1},\cdots,V_{i,m!}\right)$. For example, if the $i$-th vote is the $j$-th type, we have that $\vv_{i,j} = 1$ and $V_{i,j'} = 0$ for all $j'\neq j$. A profile $P$ is a collection of $n$ voters' rankings. A voting rule $r$ is a mapping from the profile $P$ to the winner(s) among $m$ candidates. 

A histogram $\hist$ is an $m!$ dimension vector that records the number of each type of ranking in the profile. We use $r(\hist)$ to denote the winner under an anonymous voting rule $r$ and a profile with histogram $\hist$. In this paper, we assume that the voting rule $r$ satisfies {\em anonymity} and {\em canceling out}~\citep{ao2020private}. An anonymous voting rule selects the winner only based on the histogram of the profile and does not depend on the identity of the voter. A voting rule satisfies canceling out if the winner does not change after adding one copy of each ranking to the profile. Most common voting rules satisfy both anonymity and canceling-out, such as plurality, Borda, Copeland, and STV.

\noindent\textbf{Plurality.} The candidate ranked top in the most number of votes is chosen as the winner. 

\noindent\textbf{Borda.} Firstly, the rule calculates the Borda score of each candidate. A candidate ranked $i$-th in a vote gains a score of $(m-i)$ from that vote. For example, the Borda scores for the vote $[c_1 \succ c_2 \succ c_3 \succ c_4]$ are $\{c_1:3,\, c_2:2,\, c_3:1,\, c_4:0\}$. The Borda score of a candidate is the sum of scores it gains from each vote. Then, the candidate with the largest Borda score is chosen as the winner. %For Borda, we also set the number of candidates $m = 2$ (Figure~\ref{fig:bor_m_2} in Appendix~\ref{app:exp}) and $m=4$ (Figure~\ref{fig:bor_m_4} in Appendix~\ref{app:exp}).

\textbf{Copeland. } Copeland compares each pair of candidates, where the winner gets $1$ point, and the loser gets $0$ point. If two candidates are tied, both get $0.5$ points. After finishing all pairwise comparisons, the candidate receiving the most points is chosen as the winner.

\textbf{Single transferable vote (STV). } STV is an $(m-1)$-round voting rule. In each round, the candidate receiving the least number of top-ranked votes is eliminated. When all $(m-1)$ rounds are finished, the remaining candidate is chosen as the winner.

\textbf{Margin of victory.} \emph{Margin of victory} (MoV) is the smallest number $k$ such that there exist a set of $k$ voters who can change the winner by voting differently.\\


\textbf{QUANTUM COMPUTATION. }\\
%For the quantum computation, we introduce the technique of {\em quantum counting}~\citep{Brassard1998counting}, which is applied in our quantum-accelerated voting algorithm. An introduction to quantum computing and implementation can be found in Appendix~\ref{apx:basic}. 
\noindent\textbf{Quantum counting algorithm\footnote{This paper adopts the same notation system as~\citet{nielsen2002quantum}, which is a textbook about quantum computation.}~\citep{Brassard1998counting}}. Quantum counting is one of the key parts of our proposed quantum-accelerated voting algorithm. It counts the number of solutions to a search problem. Given a binary function $f: \{0,1, \cdots, 2^t -1\} \to \{0, 1\}$, the quantum counting circuit for $f$ computes the number of $x \in \{0,1, \cdots, 2^t -1\}$ such that $f(x) = 1$. A quantum counting circuit uses $t$ quantum bits to encode the function and $\tone$ quantum bits to calculate and record the output. More specifically, supposing $n_1$ is the number of $x$ such that $f(x) = 1$. The quantum counting circuit with $t + \tone$ quantum bits outputs a binary decimal $\hat{\varphi} = 0.b_1b_2\cdots b_s$, which estimates $\varphi = \arcsin\left(\sqrt{n_1\cdot 2^{-t}}\right)/\pi$. For example, binary decimal $0.011$ represents $(2^{-2} + 2^{-3}) = 3/8$. %An introduction to quantum computing and implementation can be found in Appendix~\ref{apx:basic}. 
In the next lemma, we present three useful properties of quantum counting. 

\begin{lemma}[Properties of quantum counting]\label{lem:q_count_biased}
The quantum counting algorithm has the following three properties\\
1 (Tail bound, Inequality (5.34) in \citep{nielsen2002quantum}). For any $\delta > 2^{-\tone}$,
\begin{equation}\nonumber
\Pr[|\hat{\varphi} - \varphi| \geq 2^{-s} + \delta] \leq \frac{1}{2(\delta\cdot 2^{\tone}-1)}.
\end{equation}
2. Its runtime is $\Theta(2^\tone)$.\\
3. Its space requirement is $(t+\tone)$ quantum bits (qubits).
\end{lemma}

%The number of quantum bits $\tone$ affects both the precision and the runtime of the quantum counting algorithm. 
The first property in Lemma~\ref{lem:q_count_biased} says that a larger $\tone$ provides a stronger theoretical guarantee on the accuracy of quantum counting. However, a larger $\tone$ also corresponds to longer runtime. The detailed implementation of quantum counting and the reasoning behind why it accelerates can be found in Appendix~A.%~\ref{apx:quantum}. 

\noindent\textbf{Applying quantum counting to voting.}
We apply the quantum counting algorithm to estimate the histogram of a profile. For any $j\in\{1,\cdots,m!\}$, we estimate the $j$-th type of votes by setting the following binary function:
\begin{equation}\label{equ:fj}
f_j(x) = \left\{
\begin{array}{ll}
1 &  
\begin{array}{ll}\text{if candidate } x\text{'s vote}\\
\text{is of the } j \text{-th type}
\end{array}\\
& \\
0 & \text{otherwise} 
\end{array}\right..
\end{equation}
The number of $x$'s with  $f_j(x) = 1$ is  the number of votes of $j$-th type, \emph{i.e.},  $\hist_j$. The histogram of the votes is generated by enumerating all the $j$'s. We assume that the information in $\hist_j$ is stored in quantum RAM, which means the information can be efficiently encoded into quantum circuits ~\citep{giovannetti2008arch,giovannetti2008quantum,park2019circuit}.

\section{Quantum-Accelerated Voting Algorithm}
\label{sec:proto}

\noindent\textbf{Formal definition of quantum-accelerated voting. } We formally define quantum-accelerated voting in Algorithm~\ref{alg:quantum_multi}. In classical voting, votes are usually sent to an ``aggregator'', who is responsible for aggregating the votes and announcing the winner. Our quantum-accelerated voting follows a similar procedure, where the ``aggregator'' uses an algorithm accelerated by quantum computation. Basically, Algorithm~\ref{alg:quantum_multi} repeats the quantum counting algorithm by $K$ rounds. In each round, quantum counting estimates the histogram of the profile $\hist$ and applies the voting rule to the estimated histogram $\hhist$ to compute an estimated winner $c^{(k)} = r(\hhist)$. Then, the classical plurality voting rule is used to aggregate the estimated winners of $K$ rounds, \emph{i.e.} $c^{(1)},\cdots,c^{(K)}$. That is: the ``aggregator'' announces the candidate who is the estimated winner of the most rounds as the (final) winner. A tie-breaking rule (\emph{e.g.,} random tie-breaking) is applied when there are multiple candidates with the most rounds as the estimated winner. In Section~\ref{sec:theo_quantum}, we will show that Algorthm~\ref{alg:quantum_multi} (a combination of quantum and classical algorithms) has a better runtime than the quantum algorithm only. %Next, we will introduce each step of Algorithm~\ref{alg:quantum_multi} in detail.


\begin{algorithm}[htp]
\caption{Quantum-Accelerated Voting Algorithm}\label{alg:quantum_multi}
\begin{algorithmic}[1]
\STATE {\bfseries Inputs:} $n$ voters' votes $\vv_0, \cdots, \vv_{n-1}$, a voting rule $r$, number of iteration $K$, and the number of qubits $\tone \geq 2$
\STATE {\bfseries Initialization:} Construct the binary functions $f_1, f_2, \cdots, f_{m!}$ based on $\vv_0, \cdots, \vv_{n-1}$
\FOR{$k\in\{1,\cdots,K\}$}
\STATE Initialize an $m!$-dimensional vector $\hhist$
\FOR{$j\in\{1,\cdots,m!\}$}
\STATE Construct and apply quantum counting circuit for $f_j$ with $\tone$ qubits. Denote the output of the quantum counting circuit as $0.b_1\cdots b_{\tone}$.
\STATE {Set the $j$-th component of $\hhist$ as $2^t\cdot \sin^2\left(\pi\cdot 0.b_1\cdots b_{\tone}\right)$}
\ENDFOR
\STATE Set $c^{(k)} = r(\hhist)$ as the winner of the $k$-th round
\ENDFOR 
%\STATE Aggregate $c^{(1)},\cdots,c^{(K)}$ using (classical) plurality
\STATE {\bfseries Output} the (classical) plurality winner of $c^{(1)},\cdots,c^{(K)}$. %aggregation result as the winner
\end{algorithmic}
\end{algorithm}


\noindent\textbf{Construct binary functions.} 
We construct a binary function $f_j$ to store the information about the $j$-th type of vote. $f_j(x)=1$ if and only if the $x$-th voter casts the $j$-th type of vote. Formally, $f_j:\{0,1,\cdots, 2^t -1\} \to \{0, 1\}$ is defined according to Equation (\ref{equ:fj}),  
where $t = \lceil \log n \rceil$ is the number of bits to encode $n$, and the voters are numbered from $0$ to $(n-1)$. For $x \in \left\{ n, \cdots,  2^{t}-1\right\}$, we just set $f_j(x) = 0$ for padding. Then, the number of $x$ such that $f_j(x) = 1$ is exactly the number of votes of the $j$-th type, \emph{i.e.} $\hist_j$. 

\noindent\textbf{Count the histogram.}
For each type $j$, a quantum counting circuit is constructed and used to estimate $\hist_j$. The output of the counting circuit is $\hat{\varphi} = 0.b_1b_2\cdots b_{\tone}$, which estimates $\varphi = \arcsin\left(\sqrt{\hist_j\cdot 2^{-t}}\right)/\pi$. Therefore, $\hhist_j = 2^t\cdot \sin^2\left(\pi\cdot 0.b_1\cdots b_{\tone}\right)$ estimates $\hist_j$. By enumerating all types $j$, we get $\hhist$, which estimates the histogram $\hist$.

\noindent\textbf{Decide the winner.} The quantum counting procedure (and the voting rule) runs for $K$ rounds. Each round's estimated winner is computed according to the estimated histogram $\hhist$. Finally, the quantum-accelerated voting algorithm outputs the candidate that wins in the most number of rounds.

\section{Theoretical Analysis of Quantum-Accelerated Voting}
\label{sec:theo_quantum}
%In Section~\ref{sec:proto}, we proposed our quantum-accelerated voting algorithm (Algorithm~\ref{alg:quantum_multi}). 
In this section, we  provide theoretical guarantees about Algorithm~\ref{alg:quantum_multi}'s $\prc$ \footnote{Throughout this paper, we use $\prc$ to represent the probability (for an algorithm) to output the correct winner. Formally, $\prc \triangleq \Pr[\text{the algorithm's output} = r(P)]$, where $P$ is the voting profile and $r$ is the voting rule.}, runtime, and space requirements. %Theorem~\ref{thm:gsr} shows the theoretical bounds of Algorithm~\ref{alg:quantum_multi}. The bounds depend on three factors: the number of votes $n$, the margin of victory $\MOV$, and the error probability $\varepsilon$.
In our analysis, the number of candidates $m$ is fixed.  Figure~\ref{fig:thm_chain} illustrates a roadmap of the results in this section. %shows how the theorems are logically related. 


\begin{figure}[ht]
    \centering
    \includegraphics[width = 0.48\textwidth]{thm_chain.pdf}
    \caption{The logical chain of the theorems, lemmas, and propositions about Algorithm~\ref{alg:quantum_multi}. For example, the arrow from Theorem~\ref{lem:gsr_K=1} to Theorem~\ref{thm:gsr} represents that Theorem~\ref{thm:gsr} is proved based on Theorem~\ref{lem:gsr_K=1}.}
    \label{fig:thm_chain}
\end{figure}

In Theorem~\ref{lem:gsr_K=1}, we show the theoretical guarantee of Algorithm~\ref{alg:quantum_multi} when $K=1$. Note that when $K = 1$, the outer for loop in Algorithm~\ref{alg:quantum_multi} only runs for one round, which means the classical plurality voting rule directly outputs $c^{(1)}$. In other words, Algorithm~\ref{alg:quantum_multi} only contains quantum counting (and the voting rule $r$) when $K=1$. To simplify notations, we define a function $\sigma(\cdot)$ as follows.
{\small
\begin{equation}\nonumber
\begin{split}
\sigma(\varepsilon) &= 2+ \llceil t+ \log\Big(\frac{m!}{2\varepsilon}+2\Big) +\log \big(\pi\cdot(m!)\big) - \log(\MOV) \rrceil\\
&= \Theta\left(\log\big(\frac{n}{\varepsilon\cdot\MOV}\big)\right). 
\end{split}
\end{equation}
}
Throughout this paper, the logarithm function $\log(\cdot)$ represents $\log_2(\cdot)$ and $\ln(\cdot)$ represents $\log_e(\cdot)$.


\begin{theorem}[Theoretical guarantee of Algorithm~\ref{alg:quantum_multi} when $K=1$]
\label{lem:gsr_K=1}
For any given $\varepsilon\in (0,1) $, Algorithm~\ref{alg:quantum_multi} with $K=1$ and $\tone = \sigma(\varepsilon)$ has the following three properties. \\
1. Its $\prc \geq 1-\varepsilon$.\\
2. Its runtime is $\Theta\left(\frac{n}{\varepsilon \cdot \MOV}\right)$.\\
3. Its space requirement is  $\Theta\left(\log(\frac{n}{\varepsilon\cdot\MOV})\right)$.
% For arbitrary constant $\varepsilon\in (0,1) $, quantum voting (Algorithm~\ref{alg:quantum_multi}) has the following three properties when $K=1$ and $\tone = \max\{2,\, M+1\}$ with $M=$
% $$\llceil t + \log \left(\frac{\pi\left(\frac{m!}{2\varepsilon}+2\right)(m!)((m!+1)n + (m!)\MOV)}{n\cdot \MOV}\right)\rrceil.$$\\
% 1. It outputs the correct voting outcome with at least $1-\varepsilon$ probability.\\
% 2. Its runtime is $\Theta\left(\frac{n}{\varepsilon \cdot \MOV}\right)$.\\
% 3. Its space requirement is  $\Theta\left(\log(\frac{n}{\varepsilon\cdot\MOV})\right)$.
\end{theorem}
For readability, we will present the proof of Theorem~\ref{lem:gsr_K=1} after the proof of Theorem~\ref{thm:gsr}. In Theorem~\ref{thm:gsr}, we will present the theoretical guarantee of Algorithm~\ref{alg:quantum_multi} when parameter $K$ is set properly. Under this setting, Algorithm~\ref{alg:quantum_multi} contains both quantum and classical aggregation methods. Comparing Theorem~\ref{lem:gsr_K=1} with Theorem~\ref{thm:gsr}, we know the (classical) plurality voting can reduce the $(1/\epsilon)$ term in runtime to $\log(1/\epsilon)$.


\begin{theorem}[Theoretical guarantee of Algorithm~\ref{alg:quantum_multi}]\label{thm:gsr}
For any given $\varepsilon\in (0,1) $, Algorithm~\ref{alg:quantum_multi} with $K=\lfloor24\ln(1/\varepsilon)\rfloor+1$ and $\tone = \sigma(1/4) = \Theta\big(\log(n/\MOV)\big)$ has the following three properties.\\
% $K=24\ln(1/\varepsilon)$ and $\tone = \max\{2,\, M+1\}$ with $M=$
% $$\llceil t + \log \left(\frac{\pi(2(m!)+2)(m!)((m!+1)n + (m!)\MOV)}{n\cdot \MOV}\right)\rrceil.$$\\
1. Its $\prc \geq 1-\varepsilon$.\\
2. Its runtime is $\Theta\left(\frac{n\log(1/\varepsilon)}{\MOV}\right)$.\\
3. Its space requirement is  $\Theta\left(\log(\frac{n\log(1/\varepsilon)}{\MOV})\right)$.
\end{theorem}
\begin{proof}
%Theorem~\ref{thm:gsr} holds by applying Theorem~\ref{lem:gsr_K=1} with $\varepsilon = \frac14$. 
Setting $\tone = \sigma(1/4)$, we know that Algorithm~\ref{alg:quantum_multi} outputs the correct winner in each round with at least $p = \frac34$ probability according to Theorem~\ref{lem:gsr_K=1}. By Chernoff bound,%By Chernoff bound, the probability that the correct winner is chosen for more than $K/2$ rounds (which guarantees to be the most rounds without ties) is
\begin{equation}\nonumber%\label{equ:chernoff}
\begin{split}
    \prc & \geq \Pr[r(P)\text{ wins in more than  } K/2 \text{ rounds}]\\
    & > 1 - \exp\left(-\Big(1-\frac{1}{2p}\Big)^2\cdot K \cdot \frac{p}{2}\right).
\end{split}
\end{equation}
Thus, $\prc \geq 1-\varepsilon$ holds when
\begin{equation}\nonumber
K > \frac{2p\cdot\ln(1/\varepsilon)}{(p-1/2)^2} = 24\ln(1/\varepsilon).
\end{equation}
Then, Theorem~\ref{thm:gsr} follows by the monotonicity of Chernoff bound towards $K$.
\end{proof}

Now, we have presented the two main theorems about Algorithm~\ref{alg:quantum_multi} and are ready to show the full proof of Theorem~\ref{lem:gsr_K=1}.

\begin{proof}[Proof~of~Theorem~\ref{lem:gsr_K=1}]
    Theorem~\ref{lem:gsr_K=1} follows by setting $s=\sigma(\varepsilon)$ for the following lemma, which bounds $\prc$, runtime, and space complexity of quantum-accelerated voting for different settings on the numbers of qubits $\tone$.
    \begin{lemma}\label{thm:hist_same} 
        For any $\tone \ge 2$, quantum-accelerated voting (Algorithm~\ref{alg:quantum_multi}) with $K=1$ has the following three properties.\\
        1. Its $\prc\geq1 - \frac{m!}{2(\delta\cdot 2^{\tone} - 1)}$ for any $ \delta \in (2^{-\tone}, \frac{\MOV}{2^{t+1}\pi\cdot(m!)} -2^{-\tone})$\\
        2. Its runtime is $\Theta(2^{\tone})$\\
        3. Its space requirement is $\Theta(\log(n) + \tone)$. \\
        Note that Property 1 holds only when the feasible region of $\delta$ is non-empty, which sets a constraint for $\tone$.
    \end{lemma}
    




\begin{proof}%[Proof~of~Lemma~\ref{thm:hist_same}]
\noindent\textbf{Runtime and space requirement.} The runtime and the space requirement properties come from the corresponding properties of quantum counting (see Lemma~\ref{lem:q_count_biased}). As the anonymous rule $r$ computes the winner based on an $m!$ dimension histogram, its runtime and space requirement will only depend on the number of candidates $m$, which is $\Theta(1)$ in our analysis. Thus, when $K=1$, Algorithm~\ref{alg:classical_multi} has the following two properties.
\begin{equation}\nonumber
\begin{split}
\text{runtime}
=\;& \underbrace{\Theta(1)}_{\text{the voting rule }r} + \underbrace{\Theta(2^{\tone})}_{\text{quantum counting}} = \Theta(2^{\tone}).
\end{split}
\end{equation}
\begin{equation}\nonumber
\begin{split}
\text{space requirement} =\;&\underbrace{\Theta(1)}_{\text{the voting rule }r} + \underbrace{t+\tone}_{\text{quantum counting}}\\
=\;& \Theta(1)+\lfloor\log(n)\rfloor+s\\
=\;& \Theta(\log(n) + \tone).
\end{split}
\end{equation}

\noindent\textbf{$\bm{\Pr[\text{\textbf{correct}}]}$.} To simplify the notation, let $\thist_j$ be the histogram by adding (or removing) the same fraction of each ranking to $\hhist$ so that the sum of the histogram is $n$: for all dimension $j$,  $\thist_j =\hhist_j +  (||\hist||_1 - ||\hhist||_1)/(m!)$ (recall that $||\hist||_1 = n$). By the assumption of canceling-out (see the second paragraph in Section~\ref{sec:prelim} for its definition), we know that $r(\thist) = r(\hhist)$.

% \textcolor{red}{Ao: Can Qishen also modify the following paragraph according to the new versions of propositions?}

The proof of the $\prc$ property is obtained by the following two propositions. Proposition~\ref{prop:hist_bounded} guarantees that the $\ell_1$-norm between $\hist$ and $\thist$ is bounded by $\MOV$ with at least $1 - \frac{m!}{2(\delta\cdot 2^{\tone} - 1)}$ probability. Proposition~\ref{prop:MOV} guarantees that any histogram in the neighborhood of $\hist$ with $\ell_1$-norm smaller than $2\MOV$ shares the same winner with $\hist$. Therefore, with at least $1 - \frac{m!}{2(\delta\cdot 2^{\tone} - 1)}$ probability, $\thist$ (and therefore $\hhist$) leads to the correct winner. 

% \textcolor{red}{Ao: Can Qishen modify Proposition 1? We need a proposition about the $\ell_1$-norm distance between two histograms.}

The next proposition shows that $\thist_j$ is close to $\hist_j$ with high probability. %Therefore, it is sufficient to show that the difference between $\hist_j$ and $\thist_j$ is bounded.

% In the following lemma, let $\thist_j$ be the normalize $\hhist$ such that the sum of the histogram is $n$: for all dimension $j$,  $\thist_j = \frac{\hhist_j}{\lnorm\hhist\rnorm_1}\cdot n$.

\begin{proposition}
    \label{prop:hist_bounded}
    For all $ \delta \in (2^{-\tone}, \frac{\MOV }{2^{t+1}\pi\cdot(m!)} -2^{-\tone})$, the probability that
    $\lnorm\hist-\thist\rnorm_1 < \MOV$
    is at least $1 - \frac{m!}{2(\delta\cdot 2^{\tone} - 1)}$.  
\end{proposition}

% \begin{lemma}
%     \label{prop:hist_bounded}
%     For all $ \delta \in (2^{-\tone}, \frac{\MOV \cdot n}{2^t\pi(m!)((m!+1)n + (m!)\cdot \MOV)} -2^{-\tone})$, the probability that $|\thist_j - \hist_j| < \frac{\MOV}{m!}$ for all dimension $j$ is at least $1 - \frac{m!}{2(\delta\cdot 2^{\tone} - 1)}$.  
% \end{lemma}

\begin{proof}
    This proof fixes an arbitrary pair of $\tone$ and $\delta$ satisfying the condition. We prove a stronger result that the probability that for all dimension $j$, $|\thist_j - \hist_j| < \frac{\MOV}{m!}$ is at least $1 - \frac{m!}{2(\delta\cdot 2^{\tone} - 1)}$. When the stronger result holds, 
    \begin{equation}\nonumber
    \begin{split}
        \lnorm\hist-\thist\rnorm_1 \le &\ \sum_{j=1}^{m!}|\hist_j - \thist_j| < m!\cdot\frac{\MOV}{m!} = \MOV. 
    \end{split}
    \end{equation}
    Therefore, the probability that for all dimension $j$, $|\thist_j - \hist_j| < \frac{\MOV}{m!}$ is at least $1 - \frac{m!}{2(\delta\cdot 2^{\tone} - 1)}$ directly implies that the probability that
    $\lnorm\hist-\thist\rnorm_1 < \MOV$
    is at least $1 - \frac{m!}{2(\delta\cdot 2^{\tone} - 1)}$.
    % To show that $\lnorm\hist-\thist\rnorm_1 < \MOV$, it is suffice to show that $|\thist_j - \hist_j| < \frac{\MOV}{m!}$ for all dimension $j$ for any dimension $j$.    
    
    By applying the union bound on Lemma~\ref{lem:q_count_biased} for all dimensions $j$, we know that for all dimension $j$, the probability that $|\hat{\varphi}_j - \varphi_j| < 2^{-\tone} + \delta$ is at least $1 - \frac{m!}{2(\delta\cdot 2^{\tone} - 1)}$. Then we show that $|\hat{\varphi}_j - \varphi_j| < 2^{-\tone} + \delta$ for all dimension $j$ implies $|\thist_j - \hist_j| < \frac{\MOV}{m!}$ for all $j$. 

    Suppose $|\hat{\varphi}_j - \varphi_j| < 2^{-\tone} + \delta$ holds for all dimension $j$.  Let $h(x) = 2^t\sin^2(\pi x)$. We have $h(\hat{\varphi}_j) = \hhist_j$ and $h({\varphi}_j) = \hist_j$. Note that $\frac{dh(x)}{dx} = 2^t\pi\sin(2\pi x) \le 2^t\pi$ holds for arbitrary $x$. Therefore,  
    \begin{equation}\nonumber
    |\hhist_j - \hist_j| \le 2^t\pi |\hat{\varphi}_j - \varphi_j| < 2^t\pi\cdot(\delta + 2^{-s}).
    \end{equation}

    Let $d = 2^t\pi\cdot(\delta + 2^{-s})$. 
    By summing over all dimensions $j$, we have \begin{equation}\nonumber
        \left|||\hhist ||_1- \lnorm\hist \rnorm_1\right| \le \sum_{j=1} ^{m!} |\hhist_j - \hist_j| < (m!)d.
    \end{equation}
    Given the bound of difference between $\hhist$ and $\hist$, we show that since $\thist$ is the modified $\hhist$, the difference between $\thist$ and $\hist$ is also bounded. Now we consider the difference between $\thist_j$ and $\hist_j$ for any dimension $j$. 

    For the upper bound, we have $\hhist_j < \hist_j + d$ and $(||\hist||_1 - ||\hhist||_1) < (m!)d$. Therefore, 
    \begin{equation}\nonumber
        \begin{split}
            \thist_j = &\; \hhist_j + (||\hist||_1 - ||\hhist||_1)/(m!)\\
            < & \; \hist_j + 2d. 
        \end{split}
    \end{equation}
    % \begin{align*}
    %     \thist_j =\; &  \frac{\hhist_j\cdot n}{\lnorm \hhist\rnorm_1}\\
    %     < \;& \frac{(\hist_j + d)\cdot n}{n - (m!)d}\\
    %     = \;& \hist_j + \frac{nd + (m!)d\cdot \hist_j}{n - (m!)d}.
    % \end{align*}
    % Note that $0\le \hist_j \le n$. Therefore, 
    % \begin{align*}
    %     \thist_j <& \hhist_j + \frac{n(m!+1)d}{n - (m!)d}.
    % \end{align*}
    Similarly, for the lower bound, we have $\hhist_j > \hist_j - d$. Therefore, $\thist_j > \hist_j - 2d.$
    % \begin{align*}
    %     \thist_j = \;&  \frac{\hhist_j\cdot n}{\lnorm\hhist\rnorm_1}\\
    %     > \;& \frac{(\hist - d)\cdot n}{n + (m!)d}\\
    %     = \;& \hhist_j - \frac{nd + (m!)d\cdot \hist_j}{n + (m!)d}\\
    %     \ge \;& \hhist_j - \frac{n(m!+1)d}{n + (m!)d}.
    % \end{align*}

    Therefore, for all dimension $j$, $|\thist_j - \hist_j | < 2d$. The condition that $ \delta < \frac{\MOV}{2^{t+1}\pi\cdot(m!)} -2^{-\tone}$ guarantees that $2d = 2^{t+1}\pi\cdot(\delta + 2^{-\tone}) < \frac{\MOV}{m!}$. Therefore, for all dimension $j$, $|\hist_j - \thist_j| <  \frac{\MOV}{m!}$, which finishes our proof. 
    % Therefore, for all dimension $j$, $|\hist_j - \thist_j| < \frac{n(m!+1)d}{n - (m!)d}$.
    % The condition that $ \delta < \frac{\MOV \cdot n}{2^t\pi(m!)((m!+1)n + (m!)\cdot \MOV)} -2^{-\tone}$ guarantees that $\frac{n(m!+1)d}{n - (m!)d} < \frac{\MOV}{m!}$. Therefore, for all dimension $j$, $|\hist_j - \thist_j| <  \frac{\MOV}{m!}$, which finishes our proof.   
\end{proof}


%\textcolor{red}{Ao: Can Qishen modify Proposition 2? It's better to replace $\hhist$ with $\thist$.}

\begin{proposition}\label{prop:MOV}
    For any histogram $\thist$ such that $\lnorm\hist\rnorm_1 = \lnorm\thist\rnorm_1$ and $\lnorm\hist-\thist\rnorm_1 < 2\MOV$, $r(\hist) = r(\thist)$.
\end{proposition}

\begin{proof}
    We consider the voting rule $r$ that allows voters to vote fractionally. That is, each voter has a total weight of 1 and can assign the weight arbitrarily to every ranking. Accordingly, $\MOV$ is the smallest amount of weight of votes to change the winner. 
    
    Suppose the statement is not true, and there exists a $\thist$ such that $\lnorm\hist-\thist\rnorm_1 < 2\MOV$ and  $r(\hist) \neq r(\thist)$. Let $J_1$ be the set of dimension $j$ such that $\thist_j > \hist _j$, and $J_2$ be the set of $j$ such that $\thist_j < \hist _j$. Since $\lnorm \hist\rnorm_1 = \lnorm \thist\rnorm_1 = n$, there exists a way of transforming $\thist$ to $\hist$ by accumulating all the excess weights of the dimensions in  $J_1$ and assigning it to the dimensions in $J_2$. The changes in the weight \begin{equation}\nonumber
    \sum_{j\in J_1} |\thist_j - \hist _j| = \sum_{j\in J_2} |\thist_j - \hist _j|\ge \MOV
    \end{equation}
    by the definition of $\MOV$. However, this contradicts the assumption that 
    \begin{equation}\nonumber
    \lnorm\hist-\thist\rnorm_1 = \sum_{j\in (J_1\cup J_2)} |\thist_j - \hist _j| < 2\MOV.
    \end{equation}
    Therefore, for any histogram $\thist$ such that $\lnorm\hist-\thist\rnorm_1 < 2\MOV$, $r(\hist) = r(\thist)$.
\end{proof}
Then, the $\prc$ property of Lemma~\ref{thm:hist_same} follows by combining Proposition~\ref{prop:hist_bounded} and Proposition~\ref{prop:MOV}.
\end{proof}
    According to Lemma~\ref{thm:hist_same}, Algorithm~\ref{alg:quantum_multi}'s $\prc \geq 1 - \frac{m!}{2(\delta\cdot 2^{\tone} - 1)}$. In order to achieve $\prc$ of $1 - \varepsilon$, constraint $\delta \ge 2^{-\tone}(\frac{m!}{2\varepsilon}+1)$ needs to be satisfied. Combining the constraint and the feasible region in Lemma~\ref{thm:hist_same}, we know that $\delta\in\left[2^{-\tone}(\frac{m!}{2\varepsilon}+1), \; \frac{\MOV }{2^{t+1}\pi\cdot(m!)} -2^{-\tone}\right)$, which must not be empty, \emph{i.e.}
    % \begin{equation*}
    %     2^{-\tone}(\frac{m!}{2\varepsilon}+1)  < \frac{\MOV \cdot n}{2^t\pi(m!)((m!+1)n + (m!)\cdot \MOV)} -2^{-\tone}. 
    % \end{equation*}
    \begin{equation}\label{equ:delta}
        2^{-\tone}\left(\frac{m!}{2\varepsilon}+1\right)  <  \frac{\MOV }{2^{t+1}\pi\cdot(m!)} -2^{-\tone}.
    \end{equation}
    It's not hard to verify that $\tone = \sigma(\varepsilon)$ satisfies the constraint in (\ref{equ:delta}). Then, Theorem~\ref{thm:gsr} follows by setting $\delta = 2^{-\tone}(\frac{m!}{2\varepsilon}+1)$ and $\tone = \sigma(\varepsilon)$ for Lemma~\ref{thm:hist_same}.  
\end{proof}

\section{Compare Quantum and Classical Voting}
\label{sec:compare}
This section compares quantum-accelerated voting with (the best performance of) classical voting algorithms. The classical algorithm is designed according to the idea of sampling (either with or without replacement). At the high level, it uses the randomly sampled votes to estimate the winner. We analyze the runtime and space requirements for classical sampling algorithms and compare them with those of our quantum-accelerated voting algorithm. 

\noindent\textbf{When does quantum (may) accelerate voting?}
Firstly, we provide an intuitive explanation of when quantum would accelerate voting the most. 
We first think about the cases where classical algorithms (\emph{e.g.}, randomly sampling a subset of votes and using the subset to predict the winner) do not need to be improved or cannot be improved. When the margin of victory $\MOV = \Theta(n)$, classical algorithms are already very fast according to the Chernoff bound, which says the classical algorithms' error rate can be exponentially small in terms of runtime~\citep{Bhattacharyya2021sample}. Another case is when $\MOV$ is very small (\emph{e.g.}, $\MOV = \Theta(1)$) where classical algorithms' performance is close to the optimal. In this case, any algorithm has to look into each vote to decide the winner. Since the complexity of counting every vote is $\Theta(n)$, there is not a lot of space for the classical algorithms to be improved.  
%In order to improve readability, we let ``tie'' ($\MOV \leq 1$) be a special case of $\MOV = \Theta(1)$. 

Between these two extremes is the case where quantum accelerates voting most significantly, for example,  when the margin of victory $\MOV = \Theta(n^{c})$, where $c\in(0,1)$ is a constant. In this case, the classical voting would be as slow as $\Omega(\frac{n^2}{\MOV^2})$ for a fixed error rate $\epsilon$. %, and the acceleration of $\Theta(\frac{n}{\MOV})$ from quantum-accelerated voting is significant. 
On the other hand, the runtime of the quantum-accelerated voting, $\Theta(\frac{n}{\MOV})$, is quadratically faster. This comparison is also shown in our experiment of $m=2$ and $\MOV = 1024$ for plurality (the middle column in Figure~\ref{fig:plu_m_2}), where the number of voters $n\approx 10^6$ and $\MOV = \sqrt{n}$, \emph{i.e.} the winner gets $\sim$$0.2\%$ more votes than the loser. 



Theorem~\ref{thm:classical} establishes a theoretical ``complexity lower bound'' %\lirong{IMPORTANT: should it be ``lower bound''} 
of any classical voting algorithms (based on sampling with replacement) for many common voting rules. Consequently,  sampling-based algorithm with replacement is  at least quadratically slower than quantum-accelerated voting. Here, an algorithm being `` sampling-based'' means the sampling method is the only method for the algorithm to get information about the voting profile $P$. We say one voting rule reduces to majority voting for two candidates if the voting rule always has the same winner as majority (using whatever tie-breaking method) when $m=2$. Most commonly used voting rules reduce to majority for two candidates (\emph{e.g.,} any positional scoring rules, STV, Copeland, and maximin, just to name a few). %We note Theorem~\ref{thm:classical} also covers the algorithms using a non-fixed number of samples (\emph{e.g.,} stopping the sampling process based on a non-deterministic rule).\lirong{This sentence might be confusing, so, maybe remove it?} %Theorem~\ref{thm:with_without} in Appendix~\ref{app:with_witout} shows that sampling without replacement has the same asymptotic manner as sampling with replacement.

% \textcolor{red}{Ao: Can Qishen help with the following things?
% \begin{enumerate}
%     \item Generalize the below lemma as a theorem for $m\geq 2$.
%     \item Add a discussion to compare the above theorem with the literature results (see the example below.)
%     \item Add and prove a statement that sampling with replacement is similar to sampling without replacement under suitable conditions.
%     \item Update this chapter and the introduction according to our new changes.
% \end{enumerate}
% }

\begin{theorem}
    \label{thm:classical}
    Given any fixed $m \ge 2$, for any $\varepsilon\in (0, 0.5]$, any fast voting algorithm based on sampling with replacement for the voting rule such that reduces to majority voting for two candidates %\lirong{define this somehwere?} 
    requires at least $\Omega\left(\frac{n^2\cdot\left(\frac{1}{2}-\varepsilon\right)^2}{\MOV^2}\right)$ (expected) runtime and at least $\Omega\left(\log\big(\frac{n^2\cdot\left(\frac{1}{2}-\varepsilon\right)^2}{\MOV^2}\big)\right)$ (expected) space to achieve $\prc\geq 1-\varepsilon$ in the worst case. %\lirong{IMPORTANT: I think the theorem assumes fixed $m$ but variable $\epsilon$, in the sense that the constant in $\Omega(\dot)$ only depends on $m$ but not $\epsilon$. Am I right?}
\end{theorem}

% \ao{what is Cordorcetified rules? It would be better to give examples here because I don't even know what this represents.}

When $\varepsilon$ is a constant, the bound in Theorem~\ref{thm:classical} becomes $\Omega\left(\frac{n^2}{\MOV^2}\right)$, which is tight according to \citet{Bhattacharyya2021sample}. We note Theorem~\ref{thm:classical} is more general than the bounds in \citet{Bar-Yossef2001:sampling} (require a lower bound for $\varepsilon$) and \citet{Canetti1995sample} (only holds for small-scale samplings). %\lirong{general than which bounds in the literature? It is a bound for a special algorithm.}

Appendix~B.2 %\ref{app:with_witout}
shows that sampling without replacement has the same asymptotic manner as sampling with replacement when the number of samples $T = o(\sqrt{n})$, which is the setting of fast majority voting in many application scenarios.



% Throughout this paper, we assume that the margin of victory $\MOV = \Theta(n^{c})$, where $c\in(0,1)$ is a constant. For example, in one of the settings in our experimental verification\qishen{Ref?}, the number of voters $n\approx 10^6$ and $\MOV = \sqrt{n}$. In this example, the winner only got $\sim$$0.2\%$ more votes than the loser.\\




\begin{proof}[Proof of Theorem~\ref{thm:classical}]
    \textbf{Step 1. } A lower bound of runtime and space requirement for any fast majority voting algorithm for two candidates (Lemma~\ref{lem:classical_m2}).

    % The idea of this proof is to show that distinguishing the winner in such a voting rule is at least as difficult as distinguishing the winner in a majority vote. 
    \begin{lemma}\label{lem:classical_m2}
    For any $\varepsilon\in(0,0.5]$, any fast (2-candidate) majority voting algorithm based on sampling with replacement requires at least $\Omega\left(\frac{n^2\cdot\left(\frac{1}{2}-\varepsilon\right)^2}{\MOV^2}\right)$ (expected) runtime and at least $\Omega\left(\log\big(\frac{n^2\cdot\left(\frac{1}{2}-\varepsilon\right)^2}{\MOV^2}\big)\right)$ (expected) space to achieve $\prc\geq 1-\varepsilon$.
    \end{lemma}
    The proof of Lemma~\ref{lem:classical_m2} can be found in Appendix~B.1%\ref{app:proof}
    . Note that the $\varepsilon$ part of the bound in Lemma~\ref{lem:classical_m2} is not tight when $\varepsilon$ is close to $0$. This is because our bound is given by the information limit, which cannot be reached when reconstructing a limited number of bits. In particular, our problem only reconstructs 1-bit information (which candidate wins out of the two candidates).
    
    \textbf{Step 2.}  The lower bound for the fast voting algorithm for $m>2$ candidates cannot be smaller than the lower bound for the two-candidate case. 
    
    Suppose Theorem~\ref{thm:classical} is not true, and there exists a fast voting algorithm $A$ for voting rule $r$ such that for any profile $P$, $A$ has a runtime of $o\left(\frac{n^2\cdot\left(\frac{1}{2}-\varepsilon\right)^2}{\MOV^2}\right)$ and achieves $\Pr[A(P) \text{ is correct}] \ge 1 - \varepsilon$ (the reasoning for space complexity will be similar). And suppose $A$ takes a profile $P$ of $m$ candidates $a, b, c_3,\cdots, c_m$ as the input and sample votes from $P$ with replacement. We show that there exists a fast algorithm for majority voting $A'$ with the same runtime and accuracy. Let $P'$ be a voting profile for two candidates $a$ and $b$, and let $n_a$ and $n_b$ be the number of votes for $a$ and for $b$ respectively. We construct algorithm $A'$ as follows: 

    $A'$ is almost the same as $A$ except for the different input and sampling. $A'$ takes a profile $P'$ of two candidates $a$ and $b$ as the input. Whenever there needs a sample, $A$ samples a vote from $P'$. If the voter votes for $a$, then $A'$ convert it to $a \succ b \succ c_3\succ \cdots \succ c_m$; and if it votes for $b$, then $A'$ convert it to $b \succ a \succ c_3\succ \cdots \succ c_m$.
    If the winner calculated is neither $a$ nor $b$, $A'$ will set $a$ to the winner. 
    Except for the sampling, $A'$ running on $P'$ is equivalent to $A$ running on the following profile $P$ and set the same winner as $A$ does: there are $n_a$ votes of $a \succ b \succ c_3\succ \cdots \succ c_m$ and $n_b$ votes of $b \succ a \succ c_3\succ \cdots \succ c_m$.
    % \begin{algorithm}[htp]
    % \caption{Fast majority voting algorithm $A'$}\label{alg:oracle}
    % \begin{algorithmic}[1]
    % \STATE {\bfseries Inputs:} Profile $P'$. 
    % \STATE Construct profile $P$ for $m$ candidates based on $P'$.
    % \begin{itemize}
    %     \item The candidates are $a, b, c_3, \cdots, c_m$. 
    %     \item There are $n_a$ votes of $a \succ b \succ c_3\succ \cdots \succ c_m$ and $n_b$ votes of $b \succ a \succ c_3\succ \cdots \succ c_m$.
    % \end{itemize}
    % \STATE Run algorithm $A$ on $P$.  
    % \STATE If $A(P) = a$, set $a$ as the winner. Otherwise, set $b$ as the winner.  
    % \end{algorithmic}
    % \end{algorithm}

    If $a$ is the winner in $P'$, then $n_a \ge n_b$, and the margin of victory for the majority vote is $\MOV' = \frac12(n_a - n_b)$. Then it is not hard to verify that when $r$ is one of the rules mentioned in the statement, $a$ is also the winner in $P$, and the margin of victory in $P$ is $\MOV = \MOV'$. Therefore, $A$ set the winner as $A$ with probability at least $1 - \varepsilon$ under runtime $o\left(\frac{n^2\cdot\left(\frac{1}{2}-\varepsilon\right)^2}{\MOV^2}\right)$. Then $A'$, with the same operation to $A$, will also set the winner as $A$ with probability at least $1 - \varepsilon$ under the same runtime. Similarly, if $b$ is the winner, $A'$ can output the correct winner with probability at least $1 - \varepsilon$ under the same runtime. Therefore, $A'$ is a fast majority voting algorithm based on sampling with a replacement that can achieve $\Pr[\text{correct}] \ge 1 - \varepsilon$ under runtime $o\left(\frac{n^2\cdot\left(\frac{1}{2}-\varepsilon\right)^2}{\MOV^2}\right)$, which contradicts with Lemma~\ref{lem:classical_m2}. 
    % Consider a set of voting profiles such that for each profile $P$ in the set: for some pair of candidate $(a, b)$,
    % \begin{enumerate}
    %     \item there are $(\lfloor n/2\rfloor + \MOV)$ votes of $a\succ b\succ X$, and
    %     \item there are $(\lceil n/2\rceil - \MOV)$ votes of $b\succ a\succ X$,
    % \end{enumerate}
    % where $X$ denotes all other candidates with arbitrary order. It's not hard to verify that the margin of victory of any such profile $P$ is $\MOV$ in scoring rule, Copeland, maximin, and STV.
\end{proof}

% \ao{Can Qishen use our notation system?}

% When $n\to \infty$, $H(n, \hist_j, T)$ also converges to $\mathcal{N}(\hist_j, \hist_j \cdot (1-\hist_j/n))$. Therefore, the samples with replacement and without replacement will converge as $n\to \infty$. 


\begin{figure*}[ht]
    \centering
    \includegraphics[width = 0.98\textwidth]{fig_m_2.pdf}
    \caption{Compare quantum-accelerated voting (blue circles) with classical fast voting (red squares) for plurality, Borda, Copeland, and STV when $m=2$. The horizontal axis can be seen as the logarithm of the algorithms' runtime.}
    \label{fig:plu_m_2}
\end{figure*}


\section{Experimental Results}
\label{sec:exp}
%\lirong{maybe say a few words about the simulation environment for quantum computation?}
\noindent\textbf{Basic settings. } We numerically compare the proposed quantum-accelerated voting (Algorithm~\ref{alg:quantum_multi}) with a fast classical voting based on sampling with replacement (Algorithm~\ref{alg:classical_multi}). We set the number of samples $T$ in Algorithm~\ref{alg:classical_multi} to be $K\cdot 2^s$, where $s$ and $K$ are the parameters of Algorithm~\ref{alg:quantum_multi}. By doing this, the runtime of both algorithms is $\Theta(K\cdot 2^s)$.  We set the number of voters $n = 2^{20} \approx 10^6$, which is at a similar order of magnitude as the number of voters in a typical state of the United States. For example, the number of registered voters in New Hampshire is 1,009,004 $\approx$ $10^6$~\citep{nh2020}. We compare Algorithm~\ref{alg:quantum_multi} and Algorithm~\ref{alg:classical_multi} on four widely-used voting rules, which are two scoring rules (plurality and Borda), a pairwise rule (Copeland), and an elimination-based rule (STV). The formal definitions of the four rules can be found in Section~\ref{sec:prelim}. Note that all four rules  are covered by Theorem~\ref{thm:classical}. The implementation details can be found in Appendix~C.1.%\ref{app:detail_exp}. %In Figure~\ref{fig:plu_m_2}. we set $\MOV = \sqrt{n} = 2^{10} \approx 10^3$. Or equivalently, one candidate got $2^{19}+2^{10} = 525,312$ votes while the other candidate got $2^{19}-2^{10} = 523,264$ votes. Figure~\ref{fig:plu_m_4} sets $\MOV = 2\sqrt{n} = 2^{11} \approx 2\times 10^3$ \\


%\vspace{-0.8em}
\begin{algorithm}[htp]
\caption{Fast Classical Voting Algorithm}\label{alg:classical_multi}
\begin{algorithmic}[1]
\STATE {\bfseries Inputs:} $n$ voters' votes $\vv_0, \cdots, \vv_{n-1}$, a voting rule $r$, number of samples $T$
\STATE Sample $T$ votes uniformly at random with replacement
\STATE Build the histogram $\hhist$ of the sampled votes. 
\STATE {\bfseries Output} $r(\hhist)$ as the winner. 
\end{algorithmic}
\end{algorithm}
%\vspace{-1em}

%For quantum majority voting, we directly calculate the probability of outputting the correct winner $\Pr[\text{correct}]$ through equation (5.26) in~\citet{nielsen2002quantum}, which is the output distribution of quantum counting algorithm. The classical majority algorithm's $\Pr[\text{correct}]$ is calculated from the distribution of $T_1$ (the number of sampled votes for the first candidate, follows binomial distribution). Our experiment also plots a lower bound for quantum majority voting (Inequality (\ref{equ:quantum_k_1}) for $K=1$ and Inequality (\ref{equ:quantum_k_large}) for $K > 1$) and an asymptotic bound for classical majority voting (Inequality (\ref{equ:classic_lower1})). As mentioned above, none of our experimental results rely on random sampling. Thus, the curves in Figure~\ref{fig:plu_m_2} and Figure~\ref{fig:plu_m_4} have no randomness (thus have no error bar on them). All experiments of this paper are implemented through MATLAB 2022b and run on a Windows 11 desktop with AMD Ryzen 9 5900X CPU and 32GB RAM. \\
\noindent\textbf{Detailed settings. } We use random tie-breaking to break ties for all voting rules above. For example, if $c_1$ and $c_2$ are tied, each of them will win with $1/2$ probability. We set the number of candidates $m \in \{2,4\}$ for all rules.  %In all experiments of this paper, we first draw $10^5$ independent trails of the sampled profile and calculate the winner for each trail. 
In all experiments of this paper, we estimate the probability of outputting the correct winner ($\Pr[\text{correct}]$) by the frequency of observing the correct winner in $10^5$ independent trails.  We set $K \in \{1,3,5\}$ to avoid ties in the classical part of quantum-accelerated voting algorithm. We set $\MOV \in \{256, 512, 1024, 2048, 4096\}$, or equivalently, $\MOV \in \{n^{0.4}, n^{0.45}, n^{0.5}, n^{0.55}, n^{0.6}\}$. Since all four rules reduce to the majority rule when there are only two candidates, we consider the following profile as for $m=2$. 
\begin{equation}\nonumber\left\{
\begin{array}{l}
(n/2+\MOV) \text{ votes for } c_1\succ c_2\\
(n/2-\MOV) \text{ votes for } c_2\succ c_1
\end{array}
\right..
\end{equation}
It's easy to check that its margin of victory is $\MOV$ under all four rules above. Figure~\ref{fig:plu_m_2} compares quantum-accelerated voting with a classical fast voting algorithm (Algorithm~\ref{alg:classical_multi}). The horizontal axis of Figure~\ref{fig:plu_m_2}, $\log_2(K\cdot 2^s)$, can be seen as the logarithm of the algorithms' runtime. For all curves, we set $s = 4,5,\cdots,16$ for the twelve points from left to right, respectively. The detailed settings and experimental results of $m=4$ are shown in Appendix~C.2.%\ref{app:exp}.








\noindent\textbf{Observations. } First, with the same order of runtime, the quantum-accelerated voting algorithm has better $\prc$ than classical fast voting no matter under which setting. For example, in Figure~\ref{fig:plu_m_2}, $\MOV=1024$, $K=1$, and $s = 14$, the quantum-accelerated voting algorithm outputs the correct winner almost for certain. However, the classical algorithm only has $\sim$$60\%$ probability of outputting the correct winner. Second, quantum-accelerated voting requires much less runtime to achieve the same $\prc$. For example, in Figure~\ref{fig:plu_m_2}, $\MOV=1024$, and $K=1$, to achieve $\sim$$90\%$ $\Pr[\text{correct}]$, the quantum algorithm requires $2^{10}$ runtime. In comparison, the classical algorithm with $2^{16}$ runtime can only achieve $\sim$$70\%$ $\Pr[\text{correct}]$. Both observations match our theoretical result: the proposed algorithm is quadratically faster than any classical algorithm. %It is not surprising that the accuracy of quantum and classical voting both increase with runtime. %We also observed that the lower bound of $K=69$ and $K=139$ for quantum majority voting are looser than the $K=1$ case. We believe that this behavior is caused by the Chernoff bound, which is not asymptotically tight, used in Inequality~(\ref{equ:quantum_k_large}). We also note that providing an asymptotically tight tail bound for binomial distribution is too far from the main topic of this paper.

%We also observe that the quantum-accelerated voting algorithm's $\Pr[\text{correct}]$ may not monotonically increase with the increase of $\log_2(K\cdot 2^{\tone})$. For example, in Figure~\ref{fig:plu_m_4}, $K=1$, and $\MOV=256$, the $\Pr[\text{correct}]$ for $s=15$ is smaller than $s=14$. The non-monotonicity is not an uncommon phenomenon in quantum algorithms (\emph{e.g.,} \citealp{kerenidis2019q,chen2020low,bausch2020recurrent}). This phenomenon comes from the discrete manner of quantum noises, which differs from classical noise.  We also note that our theoretical analysis bounds the asymptotic manner of $\Pr[\text{correct}]$, instead of its monotonicity. Also see Appendix~\ref{app:discuss} for a slightly more technical discussion.



\iffalse
\begin{corollary}
    \label{coro:quantum_inverse}
    Algorithm~\ref{alg:quantum_multi} with runtime $T$ and $K =1$ has an accuracy of  $1-\Theta(\frac{n}{\MOV\cdot T})$. 
    
    (More specifically, given $T = \Theta(2^{\tone})$, and let $\delta = \frac{\MOV}{2^{t+1}\pi\cdot(m!)} - 2\cdot 2^{\tone}$, The lower bound of the accuracy is $1 - \frac{m!}{2\left( \frac{\MOV\cdot \Theta (T)}{2^{t+1}\pi\cdot(m!)}-3\right)}$.
\end{corollary}

\begin{corollary}
    \label{coro:classical_inverse}
    A classical sampling algorithm with runtime $T$ has an accuracy of $1-2^{\Theta(\frac{n^2}{\MOV^2\cdot T})}$
\end{corollary}
\fi

\section{Further accelerating quantum voting}
\label{sec:heuristic}
Can quantum-accelerated voting algorithm be further accelerated? This section discusses some heuristics. 

\noindent\textbf{Pre-sampling.} One way to improve the average performance of the quantum-accelerated voting algorithm is to pre-sample a small subset of the votes. For example, in the majority vote for binary candidates, if the pre-sample votes indicate an almost irreversible win of a candidate, then we directly announce the winner and skip the quantum computing. By carefully setting the pre-sampling size and the skipping thresholds, we may improve the average run-time while keeping high $\prc$. 

\noindent\textbf{Sampling + quantum.} Another natural idea is to apply the quantum-accelerated voting algorithm on a sampled subset of the votes. Sampling decreases the number of votes, so the quantum circuit consumes fewer bits and operators, which reduces the time and space cost. However, such improvement sacrifices $\prc$, as both sampling and quantum computing has a probability to make a mistake. It is still unclear if such a sampling-quantum algorithm would be faster to achieve the same level of $\prc$. 



\section{Conclusions and Future Works}
In this paper, we took the first step in using quantum computation to accelerate voting. Our proposed quantum-accelerated voting algorithm can quadratically accelerate various widely-used voting rules and may potentially improve the efficiency of voting in large-scale and/or high-frequency decision-making scenarios. 

An extension of this paper is to further accelerate the proposed algorithm by combining existing acceleration techniques in classical fast voting algorithms. Since voting is widely used in artificial intelligence, it would also be interesting to apply the proposed methods to accelerate the algorithms in other fields (\emph{e.g.,} search engine, crowdsourcing, database management, and blockchain governance). %It would also be interesting to extend the theoretical guarantee to a broader range of voting rules, such as generalized scoring rules~\cite{xia2013generalized,ao2020private}, which contain most of the widely-used voting rules. %in real-world elections.%, and preference functions whose output is aggregated preference among all the candidates. 

As real quantum computers may come across quantum errors caused by quantum interference and environmental effects, another interesting extension is to test the robustness of the proposed algorithm. For example, testing its performance on real quantum computers and/or running experiments with quantum errors taken into account.
% A simple extension of this paper is applying quantum computation on biased majority voting, where the threshold of winning is not half-by-half. It would also be interesting to apply quantum computation to accelerate other widely used voting rules. For example, Borda, STV, Copeland, Ranked Pairs, or even generalized scoring rules~\cite{xia2013generalized,ao2020private}, which contain most of the widely-used voting rules in real-world elections.

\begin{acknowledgements}
We thank the anonymous reviewers for their helpful comments. Lirong Xia is supported by NSF \#1453542 and a gift fund from Google. %Ao Liu is supported by RPI-IBM AIHN scholarship.
\end{acknowledgements}

%\bibliographystyle{ACM-Reference-Format} 
\bibliography{sample}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%

%\clearpage
%\onecolumn











% \iffalse
% \section{Additional comparisons}
% The detailed comparison between this paper and related works is summarized in Table~\ref{tab:summary}
% \begin{table*}[htp]
%     \centering
%     \begin{tabular}{cccc}
%     \toprule
%          & quantum communication cost & runtime after the last vote & space requirement\\ \hline
%         \textbf{This Work} &  \bm{$0$} & \bm{$\Theta\left(\frac{n}{\varepsilon\cdot\MOV}\right)$} & \bm{$O\left(\log(\frac{n}{\varepsilon\cdot\MOV})\right)$}\\
%         \citet{vaccaro2007quantum} & $\Theta(n)$ & unclear & $\Theta(n)$ \\
%         \citet{xue2017simple} & $\Theta(n)$ &  unclear  & $\Theta(n)$    \\
%         \citet{khabiboulline2021efficient} & $\Theta(n^4\cdot\log n)$ &  $\Omega(n\cdot\log n)$ (unclear)  & $\Theta(n\cdot \log n)$    \\
%         Classical Majority Voting &  $0$ & $\Theta\left(\frac{n^2}{\varepsilon^2\cdot\MOV^2}\right)$ & $\Theta\left(\log(\frac{n^2}{\varepsilon^2\cdot\MOV^2})\right)$\\
%     \bottomrule
%     \end{tabular}
%     \caption{The main contribution of this work and comparison with literature about quantum majority voting. All algorithms in the table assume the algorithm output the winner with no less than $1-\varepsilon$ probability.}
%     \label{tab:summary}
% \end{table*}
% \fi



\end{document}

