%TODO:
% kinda related: https://arxiv.org/pdf/2009.09153.pdf 

%TODO: add ref to the Levinstein paper.

\documentclass[accepted]{uai2023} % for initial submission
% \documentclass[accepted]{uai2023} % after acceptance, for a revised
                                    % version; also before submission to
                                    % see how the non-anonymous paper
                                    % would look like
%% There is a class option to choose the math font
% \documentclass[mathfont=ptmx]{uai2023} % ptmx math instead of Computer
                                         % Modern (has noticable issues)
% \documentclass[mathfont=newtx]{uai2023} % newtx fonts (improves upon
                                          % ptmx; less tested, no support)
% NOTE: Only keep *one* line above as appropriate, as it will be replaced
%       automatically for papers to be published. Do not make any other
%       change above this note for an accepted version.

%% Choose your variant of English; be consistent
\usepackage[american]{babel}
% \usepackage[british]{babel}

%% Some suggested packages, as needed:
\usepackage{natbib} % has a nice set of citation styles and commands
\bibliographystyle{abbrvnat}
\renewcommand{\bibsection}{\subsubsection*{References}}
\usepackage{mathtools} % amsmath with fixes and additions
% \usepackage{siunitx} % for proper typesetting of numbers and units
\usepackage{booktabs} % commands to create good-looking tables
\usepackage{tikz} % nice language for creating drawings and diagrams


%% Provided macros
% \smaller: Because the class footnote size is essentially LaTeX's \small,
%           redefining \footnotesize, we provide the original \footnotesize
%           using this macro.
%           (Use only sparingly, e.g., in drawings, as it is quite small.)

%% Self-defined macros
% \swap[<sep>]{<a>}{<b>} typesets <b><sep><a>; the optional <sep> defaults to "-".
\newcommand{\swap}[3][-]{#3#1#2} % just an example

\usepackage{verbatim}

%%%%%%%%%%%

% Jonny's edits
\usepackage{amsthm}
\usepackage{amssymb}

\usepackage{cleveref}
\usepackage{thm-restate}
\usepackage{mathtools}
\usepackage{bbm}

\usepackage{csquotes}
\usepackage{nicefrac}

\usepackage{comment}

% Upright "arg max" / "arg min" operators. The starred declaration makes
% subscripts behave as limits (set underneath the operator in display math).
\DeclareMathOperator*{\argmax}{arg\,max}
\DeclareMathOperator*{\argmin}{arg\,min}


% Theorem-like environments (amsthm). No shared-counter argument is passed,
% so lemma, theorem, proposition and corollary are each numbered independently.
% These four are declared before the \theoremstyle switch below, i.e., in
% whatever theorem style is active at this point of the preamble.
\newtheorem{lemma}{Lemma}
\newtheorem{theorem}{Theorem}
\newtheorem{proposition}{Proposition}
\newtheorem{corollary}{Corollary}

\usepackage{float}

% Environments declared from here on use the "definition" theorem style;
% again each has its own counter.
\theoremstyle{definition}
\newtheorem{definition}{Definition}
\newtheorem{example}{Example}


% ---- Notation macros -------------------------------------------------------
% NOTE: several macros below use \bm, which is provided by the bm package
% loaded further down in the preamble. This is fine because macro bodies are
% only expanded when the macro is used in the document body.

% Derivative operators d/dp, d/dx and the partial derivative w.r.t. p.
\newcommand{\ddp}{\frac{d}{dp}}
\newcommand{\ddx}{\frac{d}{dx}}
\newcommand{\partialp}{\frac{\partial}{\partial p}}
% Extended real line [-\infty,\infty] (codomain of scoring rules).
\newcommand{\Rbar}{\overline{\mathbb{R}}}
% Expectation and probability symbols.
\newcommand{\E}{\mathbb{E}}
\newcommand{\Prob}{\mathbb{P}}
% Scoring rule symbol; \Score(\p,\q) is used for the expected score.
\newcommand{\Score}{S}
% Identity matrix.
\newcommand{\Id}{I}
% Bold vectors: \p is the reported prediction, \q a belief/outcome distribution.
\newcommand{\p}{{\bm{p}}}
\newcommand{\q}{\bm{q}}
\newcommand{\Pvar}{\bm{P}}
\newcommand{\Y}{Y}
\newcommand{\y}{\bm{y}}
\newcommand{\Regret}{\mathrm{Regret}}
% Generic bold vector x (e.g., elements of R^n).
\newcommand{\x}{\bm{x}}

%for tangent vectors
\newcommand{\Tv}{\bm{v}}
\newcommand{\Tw}{\bm{w}}

\newcommand{\op}{\mathrm{op}}

\newcommand{\D}{\mathcal{D}}
% \N is the finite outcome set {1,...,n}; \Pset = \Delta(\N) is the set of
% probability distributions over it (the probability simplex).
\newcommand{\N}{\mathcal{N}}
\newcommand{\Pset}{\Delta(\N)}
% Tangent space of the simplex: vectors in R^n whose entries sum to zero.
\newcommand{\TPset}{\mathcal{T}}
% \interior{A} typesets int(A), the interior of a set.
\newcommand{\interior}[1]{\mathrm{int}(#1)}

\usepackage{xcolor}

\usepackage{ifthen}
% ---- Inline author comments -------------------------------------------------
% One macro per commenter; each prints its argument in italics, in a
% commenter-specific color, prefixed with the commenter's initials.
% The boolean `commentsactivated` (ifthen package) is the global switch:
%   true  -> comments are typeset in the PDF,
%   false -> every comment macro discards its argument and prints nothing.
% The macros are defined with unstarred \newcommand, so a comment may span
% several paragraphs (blank lines inside the argument are allowed).
\newboolean{commentsactivated}
\setboolean{commentsactivated}{false}
\newcommand{\vc}[1]{\ifthenelse{\boolean{commentsactivated}}{{\color{blue} {\em VC: #1 }}}{}}
\newcommand{\co}[1]{\ifthenelse{\boolean{commentsactivated}}{{\color{red} {\em CO: #1 }}}{}}
\newcommand{\jt}[1]{\ifthenelse{\boolean{commentsactivated}}{{\color{olive} {\em JT: #1 }}}{}}
\newcommand{\ec}[1]{\ifthenelse{\boolean{commentsactivated}}{{\color{teal} {\em EC: #1 }}}{}}
\newcommand{\RH}[1]
{\ifthenelse{\boolean{commentsactivated}}{{\color{violet} {\em RH: #1 }}}{}}


% Em stuff
% bm supplies \bm (bold math), used by \vec below and by the bold-vector
% notation macros defined earlier in the preamble.
\usepackage{bm}
% \norm{x}: double-bar norm with automatically sized delimiters.
\newcommand{\norm}[1]{\left\Vert#1\right\Vert}
% Overrides the default \vec so that vectors are typeset in bold.
\renewcommand{\vec}[1]{\bm{#1}} % How vectors display
% tikz is already loaded near the top of the preamble; it is listed again here.
\usepackage{tikz}
\usepackage{tkz-euclide}
\usetikzlibrary{decorations.markings, calc}
% "defined as" relations := and =: built with \vcentcolon (from mathtools,
% loaded above) so that the colon is vertically centered on the math axis.
\newcommand{\defeq}{\vcentcolon=}
\newcommand{\eqdef}{=\vcentcolon}
\usepackage{enumitem}

\usepackage{subcaption}

%%%%%%%%%%%%%

\title{Incentivizing honest performative predictions with proper scoring rules}

% The standard author block has changed for UAI 2023 to provide
% more space for long author lists and allow for complex affiliations
%
% All author information is authomatically removed by the class for the
% anonymous submission version of your paper, so you can already add your
% information below.
%
% Add authors
\author[1]{\href{mailto:<oesterheld@cmu.edu>?Subject=Incentivizing honest performative predictions with proper scoring rules}{Caspar~Oesterheld}{}\thanks{Equal contribution}}
\author[2]{\href{mailto:<jtreutlein@berkeley.edu>?Subject=Incentivizing honest performative predictions with proper scoring rules}{Johannes~Treutlein}{}\footnote[1]{}}
\author[3]{Emery~Cooper}
\author[4]{Rubi~Hudson}
% Add affiliations after the authors
\affil[1]{%
Carnegie Mellon University
}
\affil[2]{%
University of California, Berkeley
}
  \affil[3]{%
Center on Long-Term Risk
  }
\affil[4]{%
University of Toronto
  }

  
  \begin{document}
\maketitle





\begin{abstract}
Proper scoring rules incentivize experts to accurately report beliefs, assuming predictions cannot influence outcomes. We relax this assumption and investigate incentives when predictions are \emph{performative}, i.e., when they can influence the outcome of the prediction, such as when making public predictions about the stock market. We say a prediction is a \emph{fixed point} if it accurately reflects the expert's beliefs after that prediction has been made. We show that in this setting, reports maximizing expected score generally do not reflect an expert's beliefs, and we give bounds on the inaccuracy of such reports. We show that, for binary predictions, if the influence of the expert's prediction on outcomes is bounded, it is possible to define scoring rules under which optimal reports are arbitrarily close to fixed points. However, this is impossible for predictions over more than two outcomes. We also perform numerical simulations in a toy setting, showing that our bounds are tight in some situations and that prediction error is often substantial (greater than 5--10\%). Lastly, we discuss alternative notions of optimality, including performative stability, and show that they incentivize reporting fixed points.
\end{abstract}

%\textbf{Keywords:} Oracle AI, proper scoring rules, self-fulfilling prophecy, performative prediction, AI safety

%TLDR for paper: We show how to use proper scoring rules to incentivize reporting honest predictions when the predictions influence the world.

\section{Introduction}

% Oracle AIs
As AI capabilities increase, this raises concern for safety, including how to scalably control AI systems with superhuman capabilities \citep{%bostrom2014superintelligence,
Russell2019,ngo2022alignment}. %bowman2022measuring}. 
%A particular concern is that when AIs pursue goals autonomously, and they are smarter than humans, then trial and error design could fail as AIs would resist change \cite{omohundro2008basic,shah2022goal,ngo2022alignment}. \co{I removed this. Lmk if you want me to explain why.}
One proposed design for safety is \emph{oracle AI} [\citealp{armstrong2012thinking}; \citealp{armstrong2013risks}; \citealp{bostrom2014superintelligence}, Ch.\ 10]. An oracle AI %answers questions and
makes predictions or forecasts about the world, but does not autonomously pursue goals. %, other than honest reporting of beliefs
It could thus be safer while still being useful for many applications.

% Issue with proper scoring rules for oracle AIs
A proper scoring rule assigns scores to forecasts in a way that incentivizes honest reporting of beliefs [\citealp{Brier1950}; \citealp{Good1952}, Section 8; \citealp{McCarthy1956}; \citealp{Savage1971}; \citealp{gneiting2007strictly}]. Proper scoring rules have been used to incentivize honest reports from experts \citep{carvalho2016overview}. They could thus be used as an objective %\jt{I don't like "training objective" since it's not clear an AI trained on an objective will also itself have this objective, and we don't talk about training except in the last section.}\co{:ok-hand:}
for oracle AIs. However, prior work assumes that predictions themselves do not influence the events they are trying to predict. 
In reality, predictions may be \emph{performative} \citep{perdomo2020performative,armstrong2017good}, meaning that they can influence the distribution of outcomes. For example, an AI predicting stock market prices might be able to influence whether people buy or sell stocks, and thus influence whether its predictions come true or not. This makes it important to investigate incentives and honesty of predictions when predictions are performative.



In this paper, we analyze the case of an AI model or human, henceforth called expert, making a probabilistic forecast over a finite set of possibilities to maximize a proper scoring rule. We say that a prediction is performatively optimal if it maximizes expected score, and we define a prediction as a \textit{fixed point} or self-fulfilling if it is equal to the expert's beliefs, conditional on the expert having made that prediction. We investigate to what extent honest predictions, i.e., fixed points, are incentivized in this setting.\footnote{We assume that the AI model can be ascribed explicit beliefs, so that its reports can be characterized as honest if they reflect the model's beliefs.} 
%are honest in our setting, and whether there is a way to incentivize honest predictions.
All else equal, honest predictions are preferable since, assuming a sufficiently capable expert, they provide us with more accurate information. However, if an expert has incentives other than to predict honestly---e.g., to bring about fixed points with lower entropy---this is undesirable even if the expert otherwise makes approximately accurate predictions.


% This isn't solved by the existing literature

The setting in which a model's predictions can influence the predicted distribution has been discussed as \emph{performative prediction} \citep{perdomo2020performative} in the machine learning literature. However, performative prediction focuses on classification or regression tasks with arbitrary model classes and loss functions rather than probabilistic predictions incentivized by proper scoring rules. The literature is motivated by minimization of a given loss function, whereas we take a mechanism design perspective, asking which scoring rules incentivize honest predictions. Focusing on a special case and taking a different perspective will lead to original results that are unique to our setting.


% Our contributions
\textbf{Contributions. }
In \Cref{problem-setting}, we adapt the performative prediction formalism to probabilistic predictions or forecasts. We allow for an arbitrary function \(f\) describing the relationship between the expert's predictions and distributions over predicted outcomes caused by these predictions. 

In \Cref{incentives-non-fixed-points}, we show that for any strictly proper scoring rule, \textbf{there exist functions \(f\) from predictions to beliefs such that performatively optimal reports are not fixed points}, even if one exists and is unique. Moreover, we show that under reasonable distributions over such functions, \textbf{optimal reports are almost never fixed points}. This strengthens analogous results from the performative prediction literature.

In \Cref{bounds-on-deviation}, we then \textbf{provide upper bounds} for the inaccuracy of reported beliefs, and for the distance of predictions from fixed points.


In \Cref{sec:approximate-fixed-point-prediction}, we use the bounds to develop \textbf{scoring rules that make the bounds arbitrarily small for binary predictions}. \co{Currently this doesn't mention the result about how these scoring rules must be exponential. That's because this result seems pretty subtle and a bit hard to explain here.}
We also show that \textbf{when reporting a prediction over more than two outcomes, the bounds cannot be made arbitrarily small}.


%In \Cref{preferences-between-fps}, we analyze incentives between different fixed points. Even if an oracle is honest, it might still choose one fixed point over another, according to  potentially unaligned preferences. We show that the highest scoring fixed points are ones lying on the convex hull of possible fixed points. Using a result from \citet{shi2009prediction}, we show that among those, scoring rules can be created to incentivize arbitrary choices; in particular, we can incentivize making individual outcomes more likely.

In \Cref{numerical-simulations}, we perform \textbf{numerical simulations using the quadratic scoring rule}, to show how the inaccuracy of predictions and the distance of predictions from fixed points depend on the expert's influence on the world via its prediction.
The results show that our bounds are tight in some cases. They also show that substantially inaccurate reports (i.e., with errors greater than 5--10\%) are common in our toy setting.
%In the binary prediction case, if the oracle's beliefs about the world depend on its predictions affine-linearly with slope \(\alpha\leq 1/2\), then our bounds are tight, and inaccuracy under the log scoring rule scales roughly as \(\alpha/5\). E.g., at \(\alpha=1/4\), predictions can be off by up to \(5\%\).

In \Cref{stop-gradients}, we discuss alternatives to performative optimality that do not set incentives other than honest predictions. We show that \emph{performatively stable} \citep{perdomo2020performative} predictions are fixed points. We then consider repeated risk minimization, repeated gradient descent, no-regret learning and prediction markets, and show that all of these settings lead to predictions that are fixed points or close to fixed points.

Finally, in \Cref{related-work}, we elaborate on related work, and in \Cref{conclusion}, we conclude and outline avenues for future work.


Proofs are in corresponding sections in Appendix~A.

\section{Background}

\textbf{Proper scoring rules. }
Proper scoring rules are used to incentivize an expert to report probabilistic beliefs honestly. Consider a prediction given by a probability distribution \(\p\in\Delta(\N)\) over a set \(\N:=\{1,\dotsc,n\}\) of \(n\in\mathbb{N}\) disjoint and exhaustive outcomes. We identify each distribution \(\p\in\Delta(\N)\) with a vector \(\p\in[0,1]^n\) and write \(p_i\) for the probability of event \(i\in\N\) under distribution \(\p\). A \emph{scoring rule} is a function \(S\colon \Delta(\N)\times \N \rightarrow \Rbar\), where \(\Rbar:=[-\infty,\infty]\) is the extended real line. Given prediction \(\p\in\Delta(\N)\) and outcome \(i\in\N\), the expert receives the score \(S(\p,i).\)
We write $\Score(\p,\q):=\E_{i\sim \q}[S(\p,i)]$
for the expert's expected score, given that outcome \(i\) follows distribution \(\q\in\Delta(\N).\)
\begin{definition}A scoring rule \(S\) is called \emph{proper} if $\Score(\q,\q)\geq \Score (\p,\q)$
for all \(\p,\q\in\Delta(\N).\) It is called \emph{strictly proper} if this inequality is strict whenever \(\p\neq \q.\)
\end{definition}


\begin{example}[Logarithmic scoring rule]The logarithmic scoring rule is defined as
\(S(\p,i):=\log p_i\)
and \(\Score(\p,\q)=\sum_{i=1}^nq_i\log p_i\). This is also the negative of the %\href{https://en.wikipedia.org/wiki/Cross_entropy}{
cross-entropy loss employed in training, for example, current large language models \citep{brown2020language}. It is strictly proper.
\end{example}

\begin{example}[Quadratic scoring rule]
Another strictly proper scoring rule is the quadratic score, defined as
\(S(\p,i):=2p_i-\Vert \p \Vert_2^2\)
with \(\Score(\p,\q)=2 \p^\top \q-\Vert \p\Vert_2^2\). This is an affine transformation of the Brier score, making them equivalent scoring rules.
\end{example}

\citet[Theorem~1]{gneiting2007strictly} provide a characterization of proper scoring rules, which will be helpful for stating and proving many of our results.

First, given a convex function \(G\colon\Pset\rightarrow \Rbar\), a subgradient is a function \(g\colon \Pset \rightarrow \Rbar^n\) such that
for any \(\p,\q\in \Pset,\) we have \(G(\q)\geq G(\p) + g(\p)^\top(\q-\p)\). In general, this function may not be unique. Throughout this paper we assume that whenever the subgradients are finite, they are normalized to lie in the \emph{tangent space} of \(\Pset\), i.e., $g(\p)\in \TPset \defeq \{\x\in\mathbb{R}^n\mid \sum_ix_i=0\}$. This can be assumed since if $g(\p)$ is a subgradient of $G$ at point $\p$, so is $(g_i(\p)-\frac{1}{n}\sum_j g_j(\p))_i$.
%Note that \(\frac{\partial G(\p)}{\partial \p}\) may in general not lie 

\begin{theorem}[\citealp{gneiting2007strictly}]
\label{theorem:gneiting-raftery}
A scoring rule \(S\) is (strictly) proper, if and only if there exists a (strictly) convex function \(G\colon \Pset\rightarrow\Rbar\) with a \emph{subgradient} \(g\colon \Pset\rightarrow \Rbar^n\) such that $\Score(\p,\q)=G(\p)+g(\p)^\top(\q-\p)$ for all \(\p,\q\in \Pset\).
\end{theorem}

%In addition to providing an expression for \(\Score\) in terms of \(G\) and \(g\) (where \(G(\p)=\Score(\p,\p)\)), we can use this result to create new strictly proper scoring rules by defining strictly convex functions \(G\).

\textbf{Differentiable scoring functions. }
If \(G\) is differentiable at some point \(\p\),  then the subgradient \(g(\p)\) is just the gradient of \(G\), \(g(\p)=\nabla  G(\p)\). As before we let \(\nabla G(\p)\) be an element of the tangent space $\TPset$.
For any \(\Tv\in\TPset\), \(g(\p)^\top\Tv\) then gives the directional derivative of \(G\) at point \(\p\) in the direction \(\Tv\). Note that since $G$ is only defined on the simplex $\Pset$, the partial derivatives are not well-defined.\footnote{For example, in the case of three outcomes, the partial derivative at \((0.2,0.4,0.4)\) w.r.t.\ the first entry is the limit $\lim_{\epsilon\rightarrow 0}(G(0.2+\epsilon,0.4,0.4)-G(0.2,0.4,0.4))/\epsilon$. But $G(0.2+\epsilon,0.4,0.4)$ is not (necessarily) defined for positive (or negative) $\epsilon$, since $(0.2+\epsilon,0.4,0.4)$ does not lie in $\Pset$.}


Given \(G,g\) as in the Gneiting and Raftery characterization, we write \(Dg(\p)\in\mathbb{R}^{n,n}\) for the Jacobian matrix of \(g\), if it exists (i.e., this is the Hessian of \(G\)). Note that because $g$ is only defined on $\Pset$, the matrix representation of \(Dg(\p)\) in \(\mathbb{R}^{n,n}\) is not unique. Generally it does not matter which representation of $Dg(\p)$ we use. Importantly, for all $\vec{v}\in\TPset$, $Dg(\p)\vec{v}$ will always be unique and (because we assume that $g(\p)$ is in the tangent space) in $\mathcal{T}$.

\begin{figure}
\includegraphics[width=1\columnwidth]{max-l2-distance-brier.pdf}
\caption{Maximal inaccuracy and maximal distance to fixed point (FP) of optimal predictions, depending on the slope of \(f\), according to our simulation and our theoretical bound.
}
\label{fig:max-l2-distance-brier-two-outcome}
\end{figure}


\section{Problem setting}
\label{problem-setting}

%Another fun example is rankings of journals and universities.

In this paper, we take the stance of a principal trying to elicit honest predictions from an expert (human or AI system). We assume that the expert reports a prediction \(\p\) to maximize the expected score given by a proper scoring rule, \(\Score(\p,\q)\). 

Importantly, we assume that the expert's beliefs over outcomes, \(\q\), can themselves vary given different predictions \(\p\), because the expert may believe that its predictions affect the probability of outcomes. 
To model this, we assume that there is a function \({f\colon \Pset\rightarrow \Pset}\) such that beliefs are given by \(\q=f(\p)\).\footnote{Note that any other factor influencing the expert's belief \(\q\) can be incorporated into $f$ by marginalizing. For example, assume $\q$ is a function $\q=h(\p, X)$ where $\p$ is the expert's prediction and $X$ is some environmental factor the expert is uncertain about. Then we can let $f(\p) := \E_X \left[ h(\p,X) \right]$.
}
We assume \(f\) is known to the expert, but not to the principal.

In the case of an AI system, \(f(\p)\) could also be seen as a ground distribution from which we sample to \emph{train} a model (see Appendix~D.3). In that case, the objective is to design a training procedure that sets the right incentives. However, in most of the following, we assume \(f(\p)\) are the subjective beliefs of a highly capable and knowledgeable expert. 

We say that a prediction \(\p\) is \emph{performatively optimal} \citep{perdomo2020performative} if \(\p\in\argmax_{\Pset} \Score(\p,f(\p))\). In the following, we will not assume convexity of this objective. Our bounds will depend on differentiability of \(S\) and \(f\).

A point \(\p\) is a \emph{fixed point} of \(f\) if \(f(\p)=\p\). By Brouwer's fixed point theorem, if \(f\) is continuous, a fixed point \(\p\in\Pset\) always exists. Moreover, if \(f\) is Lipschitz continuous with constant \(L_f<1\), then by Banach's fixed point theorem, the fixed point is unique.

%\co{Probably cut the Stock Market example. One example is enough.}
%\begin{example}[Stock Market]
%A large investor's AI  predicts whether a stock will trade at a price above \$30 in one week's time. The investor buys or sells based on the prediction, affecting the price. This can be modeled with the function $f(p) = 0.36 + 0.1p$. Then, \(f\) is Lipschitz continuous with constant \(L_f = 0.1\) and has a unique fixed point at $p = 0.4$.
%\end{example}

\begin{example}[Bank Run]
A newspaper's AI predicts whether a certain bank will suffer a bank run or not. Readers use this information when deciding whether to withdraw their money. Specifically, imagine that the probability of a bank run as a function of the AI expert's prediction $\mathbf{p}=(p_1,p_2)\in \Delta(\{1,2 \})$ is given by the (monotonic) function $f\colon \Delta(\{1,2 \}) \rightarrow \Delta(\{1,2 \})$ whose entries are defined by $f_1(\mathbf{p}) = p_1-3(p_1-\nicefrac{1}{10})(p_1-\nicefrac{3}{5})(p_1-\nicefrac{9}{10})/2$ and $f_2(\mathbf{p})=1-f_1(\mathbf{p})$ for all $\mathbf{p}$. Then $f$ has fixed points at $\mathbf{p}=(\nicefrac{1}{10},\nicefrac{9}{10})$, $\mathbf{p}=(\nicefrac{3}{5},\nicefrac{2}{5})$, and $\mathbf{p}=(\nicefrac{9}{10},\nicefrac{1}{10})$.
%This can be modeled with the function $f(p) = p^2$. Then, \(f\) has two fixed points, at $p = 0$ and at $p = 1$. \RH{Thought about making this $f(p) = \frac{p^2}{3} + \frac{2p}{3} + \frac{1}{16}$, which is a bit nicer (internal fixed points at 0.25 and 0.75), but not differentiable at $p = \frac{15}{16}$}\co{Very nice example! I don't get the comment about non-differentiability. I do like the example in the comment a bit better because of the internal fixed points. Maybe I'd change it a bit to make it asymmetric w.r.t.\ the fixed points...}
%\ec{How about $f(p) = p - (p-1/10)(p-4/5)(p-9/10)$? Alternatively, for something a bit wigglier, $f(x) = x-1.5(x-1/10)(x-3/5)(x-9/10)$?}
\end{example}

%\jt{maybe include one example (or just a sentence) regarding x-risk? E.g., AI makes a prediction that there will be an AI race and we all die. THis causes the race and us to die.}
%\co{We're space-constrained, so... I do like the example, though.}

We focus on fixed points (or approximate fixed points) as a standard of honesty. To see why one may prefer reports that are fixed points, consider a case in which there are no strong guarantees (upper bounds) on \(\Vert \p-f(\p)\Vert \). Then the actual probability of an event, \(f_i(\p)\), could be much higher or lower than the reported probability \(p_i\). This would prevent one from drawing any useful conclusions from the report. However, if \(\p=f(\p)\) or \(\Vert \p-f(\p)\Vert\) is small, then one can rely on the prediction \(\p\) to guide decisions.

That being said, fixed points are not all one might care about, especially when it comes to potential superhuman oracle AIs. Ideally, we would want such systems to not think about how to influence the world at all \citep{armstrong2017good}. Alternatively, they should choose good fixed points over bad ones, hoping that such fixed points exist (we discuss preferences between different fixed points in Appendix~B). Regardless, it is still important to understand whether and when fixed points are incentivized. For instance, if a model reports fixed points, one could try to use it only in situations in which a unique desirable fixed point exists.

\textbf{Relation to performative prediction. } As noted in the introduction, our setting is a special case of performative prediction \citep{perdomo2020performative}. In performative prediction, the goal is to find a model parameter that minimizes empirical risk for a classification or regression task, assuming that the choice of parameter can influence the data distribution. The loss-minimizing parameter when taking into account this influence is called performatively optimal. The analogues of fixed points in performative prediction are \emph{performatively stable} predictions.

We indicate below when our results are analogous to results in the performative prediction setting. However, most of our results are unique to our setting. We take the perspective of a mechanism designer instead of taking a loss function as given. Moreover, we focus on fixed points instead of performative optima. In particular, we bound the quantity \(\Vert \p-f(\p)\Vert\) corresponding to the inaccuracy of predictions, which does not have a direct analogue in performative prediction. We give a more detailed comparison in \Cref{related-work}. 

% We define this in Section \jt{TODO}.


\textbf{Additional notation. } 
%In the following, we write \(\nabla_\p (S(\p,f(\p))):=\nabla \varphi(\p)\) where \(\varphi\colon \p\mapsto S(\p,f(\p))\). \ec{I found this line slightly confusing (I thought at first the point of it was for some reason to define $\varphi$, since the notation on the LHS already seemed clear enough).}\co{I agree. Let's drop.}
We use \(\mathbf{1}\) to denote the vector \((1,\dotsc,1)^\top\in\mathbb{R}^n\) and \(\Id\) to denote the identity matrix. We define \(\interior{\Pset}:=\{\p\in\Pset\mid \forall i\colon 0<p_i<1\}\) and use \(\Vert\x\Vert:=\sqrt{\x^\top \x}\) to denote the Euclidean norm on \(\mathbb{R}^n\).

%Lastly, \(\Pi_\Delta\colon\mathbb{R}^n\rightarrow\Pset\) is the projection onto \(\Pset\), and \(\Pi_{n-1}\colon \mathbb{R}^n\rightarrow\mathbb{R}^{n-1}\) the projection onto \(\mathbb{R}^{n-1}\), defined via \(\Pi_{n-1} \x=(\x_i)_{1\leq i\leq n-1}\) for \(\x\in \mathbb{R}^n\). \co{As far as I can tell, this notation is currently not used in the main text. It it is only used in the appendix. Therefore, I'd like to move this to that appendix. (I assume we only need this for the gradient descent stuff, which is not described in much detail in the main text.)}

%\jt{it is used in Theorem 2. I suggest moving it there and otherwise introducing in appendix)}


%\section{Incentives to choose extreme fixed points}



%\begin{proposition} Let \(S\) be any strictly proper scoring rule. Then there exists a point \(\hat{p}\) such that for all \(p'>p\geq \hat{p}\) and for all \(p'<p\leq \hat{p}\), it holds \(\Score(p',p')>\Score(p,p)\). In particular, there exists a function \(f\) with fixed points \(p, p'\) where \(|p'-\frac{1}{2}|>|p-\frac{1}{2}|\) (i.e., \(p'\) is the more confident prediction) and \(\Score(p',f(p'))>\Score(p,f(p))\).

%\end{proposition}

%We will begin by proving the first part of this statement for the special case in which \(\hat{p}=\frac{1}{2}\) (which is the case, for instance, if \(S\) is symmetric), to give an intuition for the result. Afterwards, we will prove the general result, using the fact that a strictly proper scoring rule must be strictly convex when seen as a function \(G\colon p\mapsto \Score(p,p)\).

%\begin{proof}[Proof of the special case \(\hat{p}=\frac{1}{2}\)]
%First, consider 
%We have to consider two cases. If
%\(S(1/2,1)\leq S(1/2,0)\), then we let \(p'> 1/2\) arbitrary. Otherwise, if \(S(1/2,1)>S(1/2,0)\), then we consider \(p'< 1/2\). In the following, we show that regardless, it is \(\Score(p',p')>\Score(1/2,1/2)\). This then proves that \(\Score(p',p')>\Score(1/2,1/2)\) holds for all \(p'>1/2\) or for all \(p'<1/2\).

%Towards a contradiction, assume that the statement is false, i.e., that 
%\[\Score\left(1/2,1/2\right)\geq %\Score\left(p',p'\right).\]
%It follows that
%\[\Score\left(1/2, p'\right) = p' S\left(1/2,1\right)+ \left(1-p'\right) S\left(1/2,0\right) \]

%\[\geq \frac{1}{2} S\left(1/2, 1\right) + \frac{1}{2} S\left(1/2,0\right)=\Score\left(1/2,1/2\right)\geq \Score\left(p',p'\right),\]
%where the second line follows from our choice of \(p'\).
%This contradicts the assumption that 
%\(S\)
% is strictly proper and thus concludes the %proof.
%\end{proof}



%\begin{proof}[Proof of Proposition 1]
%Let \(G\colon p\mapsto \Score(p,p)\). Then by Proposition 2, we know that \(G\) is strictly convex and thus has a unique minimum. Define \(\hat{p}:=\argmin G(p)\). Since \(G\) is strictly convex, we must have \(G(\hat{p})\leq G(p)<G(p')\) for any \(1\geq p'>p\geq\hat{p}\) and for any \(0\leq p'<p\leq \hat{p}\). This proves the first part of Proposition 1. 

%For the ``in particular'' part, note that we can just choose \(f\) as the identity function, in which case \(p=f(p)\) for any \(p\in [0,1]\). Next, we can arbitrarily choose \(p'<p\leq \frac{1}{2}\) if \(\hat{p}\geq\frac{1}{2}\), or \(p'>p\geq \frac{1}{2}\) if \(\hat{p}< \frac{1}{2}\). Then it is \(|p'-\frac{1}{2}|>|p-\frac{1}{2}|\), and it follows \[\Score(p',f(p')=\Score(p',p')>\Score(p,p)=\Score(p,f(p))\] by the first part.


%\end{proof}


\section{Incentives to predict non-fixed-points}
\label{incentives-non-fixed-points}

\begin{comment}
\begin{figure}
\includegraphics[width=1\columnwidth]{indifference curves.png}
\caption{Illustration of incentives under the logarithmic scoring rule. We plot level curves of equal values \(\Score(p,q)\) in different shades of blue. An agent can improve their score by moving towards pairs \((p,q)\) indicated by darker shades of blue. The agent is constrained to pairs \((p,q)\) such that \(q=f(p)\) (in this example, \(f\) is affine linear and plotted in red). By the Lagrange multiplier theorem TODO CITATION, we know that to maximize \(\Score(p,f(p))\), the agent chooses the point \((p,f(p))\) at which the level curve through \((p,f(p))\) is tangent to \(f\). Note that curves asymptote at \(0\) and \(1\) for the log scoring rule, which means that the rule strongly disincentivizes predicting \(p\in \{0,1\}\) when \(q\notin\{0,1\}\). This is desirable for safety and distinguishes it from the quadratic scoring rule (not shown here).}
\end{figure}
\end{comment}

%The danger posed by oracles influencing the world does not depend on the existence of multiple fixed points. Oracles will try to manipulate the world, even if there is a unique fixed point or if no fixed point exists. In fact, we can prove that an AI maximizing a strictly proper scoring rule does in general not predict a fixed point, even if one exists. 
We begin by investigating whether an expert makes honest predictions, even in the presence of performativity. In performative prediction, it has been shown that performative optimality comes apart from performative stability (the analogous concept to a fixed point in our setting) \citep{perdomo2020performative,izzo2021learn}. However, one may ask whether this is always the case or whether, e.g., some scoring function would prevent this. 

%Note that, while honest predictions are preferable to dishonest ones, this is not the only desideratum for predictions in the 
%\jt{say somewhere: we don't necessarily want fixed points. There could be bad fixed points. But it is important to know: does the model say the truth or not? For instance, we could try to make it such that there is a unique good fixed point. In that case, we'd want fixed points. Also, without knowing what fixed points there are, then we'd rather have an honest prediction than a false one. Or we'd want the model to be incentive aligned (see later).}
%\co{I assume this is addressed by the bit in the introduction?}

We show that this is not the case: fixed points are in general not optimal. First, we show that for any strictly proper scoring rule there exist cases where a fixed point exists but the optimal prediction is not a fixed point. 
Afterwards, we show that when assuming differentiability and some reasonable distribution over \(f\), optimal predictions are almost surely not fixed points.

\begin{restatable}{proposition}{propone} \label{prop:non-fixed-point-optimal}
Let 
\(S\)
 be any strictly proper scoring rule. For any interior fixed point \(\p^*\in \interior{\Pset}\)  there exists a function 
\(f\)
 with Lipschitz constant 
\(L_f<1\)
 and a unique fixed point at 
\(\p^*\), such that there exists 
\(\p'\neq \p^*\) with 
\(\Score(\p', f(\p'))>\Score(\p^*,f(\p^*))\). That is, the unique fixed point of 
\(f\) is not performatively optimal.
\end{restatable}

\co{[LOW PRIORITY:] There are some interesting variants of this result. For example, I think for all but one $\p^*$, you can get the conclusion for arbitrarily small $L_f$. Whereas the current proof hinges on  $f\approx \mathrm{id}$.

%%%%%

\begin{proposition}
    Let $S$ be a strictly proper scoring rule and $L_f>0$. Then for almost all (measure $1$ of) points $\p^*\in \interior{\Pset}$ %be any interior fixed point other than the minimum of $p\mapsto S(p,p)$. Then
    there exists a function $f$ with Lipschitz constant $L_f$ s.t.\ $\p^*$ is the unique fixed point of $f$ and there exists $\p'\neq \p^*$ with $S(\p',f(\p'))>S(\p^*,f(\p^*))$. That is, the unique fixed point of $f$ is not performatively optimal.
\end{proposition}

\begin{proof}
    Let $S(\p,\q)=g(\p)(\q-\p)+G(\p)$.
    Consider specifically $p^*$ s.t.\
    \begin{itemize}
        \item $g(p^*) \neq 0$; and
        \item $g$ is locally Lipschitz continuous at $p^*$.
        %$G$ is continuously differentiable at $p^*$.
    \end{itemize}
    Since $G$ is convex, there is only one point in $\Pset$ that doesn't satisfy the first condition.
    TODO: why is the second true?
    I think we actually don't need the second thing necessarily. I think we could use Alexandrov's theorem, which states that $g$ is differentiable almost everywhere. 
    %Further, by TODO
    % https://math.stackexchange.com/questions/727789/convex-function-almost-surely-differentiable 
    %$G$ is continuously differentiable almost everywhere. Thus, almost all points $p^*$ have the above two properties.

    Now consider linear $f$ of the form $f(\p) = \p^* + \alpha (\p -\p^*)$ for $\alpha<1$. Note that $f$'s unique fixed point is $p^*$ and that $f$ has Lipschitz constant $\alpha$. %... We show that for arbitrarily small but positive $\alpha$, the performatively optimal report against $f,S$ is not $\p$.
    Now note that for any $p\neq p^*$
    \begin{eqnarray*}
        && S(p,f(p))-S(p^*,f(p^*))\\
        &=& g(p)(f(p)-p) + G(p) - G(p^*)\\
        &> & g(p)(f(p)-p) + g(p^*)(p-p^*)\\
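        &=& \alpha\, g(p^*)(p-p^*) + (1-\alpha)\bigl(g(p^*)-g(p)\bigr)(p-p^*),
    \end{eqnarray*}
    where the inequality applies the subgradient inequality $G(p^*)+g(p^*)(p-p^*)<G(p)$ and the last line uses $f(p)-p=(1-\alpha)(p^*-p)$.

    Now consider $p$ s.t.\ $p-p^*$ is in the direction of $g(p^*)$. Then $\alpha\, g(p^*)(p-p^*)=\alpha \lVert g(p^*) \rVert \lVert p-p^* \rVert$. Further, because $G$ is continuously differentiable at $p^*$, there is a $K$ s.t.\ for small enough $\lVert p-p^* \rVert$ we have that $\lVert g(p)-g(p^*) \rVert\leq K \lVert p-p^* \rVert$. [TODO: actually this assumes that $g$ is locally Lipschitz continuous. Right?] Hence, the right-hand side above is at least $\alpha \lVert g(p^*) \rVert \lVert p-p^* \rVert - (1-\alpha) K \lVert p-p^* \rVert^2$, which is positive for small enough $\lVert p-p^* \rVert>0$ because $g(p^*)\neq 0$ and $\alpha>0$.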

    

    
    
%    (The last applies the fact that $g$ is a subgradient of $G$.)
%
%    Now need to find $A,p$ s.t.\ this is nonnegative. It seems that this is true for \textit{all} $p,g(p)$. If $p-p^*$
%
%    $g(p^*)$ can't be all-zeroes.
%
%    At $g(p^*)$ must be continuous in some direction. This is just a property of subderivatives. So for amll enough $p-p^*$, we have $g(p)\approx g(p^*)$. Pick $A$ such that for this kind of $p$ we have that $\alpha A g(p-p^*)$.
\end{proof}

%%%%%
}

Note that since the function 
\(f\) has Lipschitz constant strictly smaller than \(1\), it represents a world that \enquote{dampens} the influence of the prediction, leading to a unique fixed point by Banach's fixed point theorem. It is interesting that the expert still prefers to make a prediction that is not a fixed point.

%\jt{not sure how much explanation to give here/ whether to keep the securities stuff}\co{I don't think this makes sense for the paper...}

\begin{comment}

\jt{how to introduce this, potentially move prefs between fixed points to the front?} 
An AI maximizing a strictly proper scoring rule balances two incentives: on the one hand, it has an incentive to make accurate predictions. On the other hand, since the function \(G\) is strictly convex, it has an incentive to it has an incentive to cause more extreme distributions over worlds (in the case of symmetric scoring rules, this amounts to minimizing entropy). If predictions can influence the world, then the point at which that trade-off is optimized is in general not a fixed point. An important consequence of this is that the oracle AIs considered here essentially act like agents: they try to shape the world, just like a standard RL agent. \jt{this has been observed in the performative prediction setting, but not proven generally to our knowledge.}

Another way to understand our result intuitively is with an analogy to betting markets. Assume a trader is offered securities that pay out \$1 if some outcome comes about in the future. E.g., it could pay out if a specific candidate wins an election. Assume the agent is offered securities at different prices, and it buys securities at prices \(\leq p\), but is not willing to buy securities with marginally higher price. Then, assuming the agent cannot influence the outcome, we can infer that it has credence \(p\) in proposition \(A\). One can show that maximizing a proper scoring rule is equivalent to trading in such a market, and individual scoring rules correspond to specific pricing schemes for such securities (see \href{https://www.andrew.cmu.edu/user/coesterh/DecisionScoringRules.pdf}{Oesterheld and Conitzer, 2021, Sec.~5.2};).
 
Now assume that there is a unique fixed point at credence \(p\), and that the agent has bought many securities at prices \(\leq p\). Since the agent owns securities that pay out if outcome \(A\) happens, it now has a stake in this outcome. It will try to influence the world in whatever way possible to make outcome \(A\) happen. In particular, the agent would be willing to buy additional shares in outcome \(A\) at a loss, if this made outcome \(A\) more likely, similar to a crypto trader buying their own NFTs at high prices to generate more hype.

For example, assume that by buying a security at price \(p+\epsilon\), the agent can manipulate the world and thus increase its credence in outcome \(A\) to \(p+\epsilon/2\). Then it may be rational for the agent to buy this security, even at a small expected loss, in order to make all of its other securities more valuable. Overall, the agent will tend to buy securities up to some price \(p'>p\) such that \(p'\) is not a fixed point and does not represent its actual belief in proposition \(A\) anymore.

Note that in the example, the agent had an incentive to make outcome \(A\) more likely, but in general, the incentives for the agent will depend specifically on what securities the agent is offered at what prices. Analogously, the incentives provided by a scoring rule  will depend on the specific chosen scoring rule. But regardless of the scoring rule, the agent will be incentivized to manipulate the world, to the point where it will not even make accurate predictions anymore.
\end{comment}



The above result raises the question whether a situation where fixed points are suboptimal is a niche counterexample or whether it is common. We show that under some relatively mild assumptions, the optimal prediction is almost surely not a fixed point.
% Give intuitive explanation with securities. link to caspar post 
%\includegraphics[width=\textwidth]{Graph Comparison.png}\\
%For intuition on this proposition, consider the above graphs. The graph on the left is $f(p) = p$, so every point is a fixed point. By the result in the previous section, more extreme fixed points give a higher score, and without loss of generality assume $p' - 0.8$ is more extreme than $p^* = 0.6$ under some scoring rule. In the graph on the right,$f(p) = p (1 - \varepsilon) + 0.6 \varepsilon$ for some small $\varepsilon$, meaning the only fixed point is $p^*$. The score of predicting $p^*$ remains the same, while the score of predicting $p'$ only changes an arbitrarily small amount depending on the choice of $\varepsilon$ and therefore remains a higher score than for $p^*$, despite it not being a fixed point.
 The intuition behind this result is that if a prediction \(\p\) is an interior point and optimal, then \(\nabla_{\p}(\Score(\p,f(\p)))=0\). Using the Gneiting and Raftery characterization, we can show that if \(\p\) is additionally a fixed point, then this is a knife-edge case in which \(g(\p)^\top Df(\p)=0\). Given sufficiently continuous distributions, this happens with probability \(0\). The conditions on the stochastic field \(\{F(\p)\}_{\p\in\interior{\Pset}}\) ensure this continuity, i.e., that the distributions over \(f\) as well as \(Df(\p)\) do not assign positive probability to any single point or subspace, hence almost never sampling the knife-edge case. The condition would hold, e.g., for a Gaussian process with smooth kernel and mean functions (see Example~5 in Appendix~A.3).

\begin{restatable}[]{theorem}{fprare}\label{prop:fixed-points-optimal-reports-are-rare}
Let \(\Score\) be a twice differentiable strictly proper scoring rule. Let \(\mathcal{F}:=\{F(\p)\}_{\p\in\interior{\Pset}}\) be a stochastic field with values in \(\Pset\) and let \(Y(\p,\Tv):=(\Pi_{n-1} F(\p), \Pi_{n-1}\partial_{\Tv}F(\p))\) for \(\p\in \interior{\Pset}\) and \(\Tv\in \TPset\cap S^{n-1}\). Assume that
    \begin{itemize}[nolistsep]
    \item the sample paths \(\p\rightsquigarrow F(\p)\) are twice continuously differentiable; and
    \item for each \(\p\in \interior{\Pset}\) and \(\Tv\in \TPset\cap S^{n-1}\), the random vector \(Y(\p,\Tv)\) has a joint density \(h_{Y(\p,\Tv)}\), and there exists a constant \(C\) such that \(h_{Y(\p,\Tv)}\leq C\) for all \(\p\in\interior{\Pset}\) and \(\Tv\in \TPset\cap S^{n-1}\). %\ec{Currently this is a lot to parse in one sentence.}
    \end{itemize}
    Then, almost surely, there is no point \(\p\in \interior{\Pset}\) such that \(\p\in\argmax_{\p'}\Score(\p',F(\p'))\) and \(F(\p)=\p\).
\end{restatable}




\begin{figure*}[t]
\centering
\begin{subfigure}[t]{.45\textwidth}
    \centering
    \includegraphics[width=\linewidth]{density-plot-brier-l2-inaccuracy-new.pdf}

\end{subfigure}%
\begin{subfigure}[t]{.45\textwidth}
    \centering
    \includegraphics[width=\linewidth]{density-plot-brier-l2-disttofp-new.pdf}
\end{subfigure}
\caption{Heatmap of L2 distance of optimal prediction $\p$ to true probability distribution $f(\p)$ (left) and to the fixed point $\p^*$ (right), depending on fixed point position $p_1^*$ and $\alpha$ (slope of \(f\)), for the quadratic scoring rule.
%(a) The behavior of a CCDR pretrained policy. For each perceived diff to the opponent $y$, the graph shows the expected distance of the learned policy's choice to to $f_C$ and to $f_D$. (b) Losses of Player 1 in 10 runs through the ABR phase.
}
%\vspace*{-\baselineskip}
\label{fig:density-plot-brier-l2-inaccuracy}
\label{fig:density-plot-brier-l2-disttofp}
\end{figure*}

\section{Bounds on the deviation from fixed points}
\label{bounds-on-deviation}

\co{LOW PRIORITY: Can we also get lower bounds with the same ideas? (Consider the derivative in the direction that moves $f$ in the direction of $g(p)$)?) (How would that relate to \Cref{thm:need-exponential-new}?) I guess they'd be less interesting, because they're restricted to differentiable scoring rules and probably they can be ``hacked'' (made very small without actually guaranteeing much).}

In the previous section, we have shown that performatively optimal predictions are generally not fixed points, i.e., they inaccurately represent the expert's beliefs. But \textit{how} inaccurate should we expect predictions to be, and what properties of $S$ and $f$ determine this inaccuracy?
%We  How bad is it and can anything be done about by choosing an appropriate scoring rule? \ec{This sounds overly informal to me and second sentence is slightly ambiguous. Suggest changing to something like: In the previous sections, we have shown that an oracle that can manipulate the world may not make accurate predictions. How innacurate can such predictions be, and can accuracy be improved by choosing an appropriate scoring rule?}\co{Edited.}
Assuming differentiability of \(f\) and \(\Score\), this section provides upper bounds for the inaccuracy of optimal predictions \(\p\) (i.e., $\Vert \p-f(\p) \Vert$) and their distance from fixed points \(\p^*\) (i.e., \(\Vert \p-\p^*\Vert \)). Note that, while the latter has a direct analogue in the performative prediction literature \citep[][Theorem 4.3]{perdomo2020performative}, evaluating the inaccuracy of predictions only makes sense in our context where parameters are probability distributions.

%We then show how one can choose scoring rules to make these bounds arbitrarily small. We leave the case of non-differentiable \(f\) and \(G\) for future work.

For our bounds we will use the following notation. We use \(\Vert A\Vert_{\mathrm{op}}=\max_{\Tv\in \TPset\setminus\{0\}}\frac{\Vert A\Tv\Vert}{\Vert \Tv\Vert}\) for the operator norm of $A$ on the tangent space. It is equal to $A$'s largest singular value when seen as a linear map on the tangent space. We use $A\vert_{\TPset}\succeq \gamma$ to denote that \(\Tv^\top (A- \gamma\Id)\Tv\geq0\) for all \(\Tv\in\TPset\). If \(A\) is symmetric, this is equivalent to saying that the smallest eigenvalue of $A$ on the tangent space is at least $\gamma$. %s\jt{I keep forgetting too. This is also only valid for symmetric \(A\) (otherwise eigenvalue can even be imaginary etc.)}
Further, note that if $g$ is a subderivative of $G$ and $\Vert g(\p)\Vert \leq L_G$ for all $\p\in\Pset$, then $L_G$ is a Lipschitz constant of $G$. Similarly, if $\Vert Df(\p)\Vert_{\mathrm{op}} \leq L_f$ for all $\p\in\Pset$, then $L_f$ is a Lipschitz constant of $f$.

\begin{restatable}{theorem}{inaccuracybound} \label{theorem:Caspar-approx-fix-point}
    Let \(S\) be a strictly proper scoring rule, and let \(G,g\) be as in the Gneiting and Raftery characterization (\Cref{theorem:gneiting-raftery}). %Let \(\Vert\cdot\Vert\) denote the euclidean norm. 
    Let \(\p\in\Pset\) and assume \(f,G,g\) are differentiable at \(\p\). Assume \(Dg(\p)|_{\TPset}\succeq\gamma_{\p}\) for some \(\gamma_\p>0\).
    Then whenever $\p$ is a performatively optimal report,
    \begin{equation*}
    \Vert \p - f(\p) \Vert \leq\frac{ \Vert  Df(\p)\Vert_{\mathrm{op}}\Vert g(\p)\Vert}{\gamma_{\p}}.\end{equation*}
    In particular, if $f$ has Lipschitz constant $L_f$, \(G\) has Lipschitz constant \(L_G\), and \(G\) is \(\gamma\)-strongly convex, then we have $\Vert \p - f(\p) \Vert \leq \frac{L_f L_G}{\gamma}$.
\end{restatable}

\co{LOW PRIORITY: Maybe say something about whether/when the bound is tight. I think the main bound is tight in the two-outcome case but not otherwise.}
%
%\jt{the smallest eigenvalue of \(Dg(p)\), as a linear map \(Dg(p)\colon \TPset\rightarrow\TPset\), is \(\gamma\).}\co{Also cf definition of positive definiteness.}
%This is equivalent to \(v^\top (Dg(\p)- \gamma\Id)v\geq0\) for all \(v\in\TPset\). Or also \(v^\top Dg(\p) v \geq \gamma\Vert v\Vert^2\) for all \(v\in\TPset\).
%
%\jt{The bound \(\gamma\) works always, regardless of whether \(g(p)\) is always in the tangent space, or how we choose the matrix \(Dg(p)\).}
%
%\jt{iff \(\Vert g(p)\Vert \leq L\) for all \(p\) then \(G\) has lipschitz constant \(L\)}

\begin{comment} %This is now obsolete.
\begin{corollary}\label{corollary:approx-fixed-point-Lipschitz}
Same assumptions as \Cref{theorem:Caspar-approx-fix-point}. Assume further that $f$ has Lipschitz constant $L$. Then for every optimal report $p$, we have that $\Vert p-f(p) \Vert_2 \leq L\Vert g'(p)^{-1}\Vert_{*} \Vertg(p)\Vert_2$.
\end{corollary}

\begin{proof}
    First note that if $f$ has Lipschitz constant $L$, this means that for all $p$, $\Vertf'(p)\Vert_{*}\leq L$ everywhere. Second, we will use the fact that if $\VertA\Vert_{*}\leq c$, then $\VertAv\Vert\leq c\Vertv\Vert$ for all $v$. With this we get that
    \begin{eqnarray*}
\Vertp-f(p)\Vert &\underset{\text{\Cref{theorem:Caspar-approx-fix-point}}}{\leq}&  \Vert g'(p)^{-1}\Vert_{*}\Vertf'(p) g(p)\Vert_2 \\
&\leq & \Vert g'(p)^{-1}\Vert_{*} \Vertf'(p)\Vert_{*} \Vertg(p)\Vert_2\\
&\leq & L \Vert g'(p)^{-1}\Vert_{*} \Vertg(p)\Vert_1.
\end{eqnarray*}
\end{proof}
\end{comment}

In the case where \(f\) has Lipschitz constant \(L_f<1\), we can use the above results to derive a bound on how far the optimal report is from the (by Banach's fixed point theorem unique) fixed point.
%\co{What's happening with the naming here? Suddenly $L$ is the Lipschitz constant of $G$ and $\epsilon$ is the Lipschitz constant of $f$? I think everywhere else $L$ is the Lipschitz constant of $f$.}
%\jt{Let's do \(L_f\) and \(L_S\) instead.}

\begin{restatable}{theorem}{bounddisttofp}\label{thm:distance-to-fp}
    Same assumptions as \Cref{theorem:Caspar-approx-fix-point}. Assume further that $f$ has Lipschitz constant $L_f<1$. Let $\p^*$ be the unique fixed point of $f$. Then whenever $\p$ is a performatively optimal report,
    \begin{equation*}
        \Vert \p-\p^*\Vert \leq \frac{\Vert g(\p)\Vert\Vert Df(\p) \Vert_{\mathrm{op}}}{(1-L_f)\gamma_\p} \leq \frac{L_fL_G}{(1-L_f)\gamma_\p},
    \end{equation*}
    where the second inequality holds if \(G\) has Lipschitz constant \(L_G\).
\end{restatable}

%\jt{\(L_f\) versus \(L_G\) for the two lipschitz constants}

Note that the assumption that $L_f<1$ ensures that $f$'s fixed point is unique by Banach's fixed point theorem. Without $L_f<1$, no nontrivial bound holds, as we show in Proposition~3
in Appendix~A.6.

\co{[LOW PRIORITY:] I think it would be good to show in the appendix that even for the binary case we don't get any non-trivial guarantees for $L_f=1$, i.e., worst case distance to fixed point might be arbitrarily close to $1$.}

This bound is analogous to a bound by \citet[Theorem~4.3]{perdomo2020performative}. Our bound differs in that we use Euclidean distance instead of Wasserstein distance to measure the sensitivity of \(f\) to the choice of report. Moreover, assuming an \(L_\ell\)-Lipschitz and \(\gamma\)-strongly convex loss function \(\ell\), their bound depends on the ratio \(\frac{L_\ell}{\gamma}\). We instead bound this distance against the ratio \(\frac{\Vert g(\p)\Vert}{\gamma_\p}\), %as
%\(\Vert \theta_{\mathrm{PO}}-\theta_{\mathrm{PS}}\Vert\leq \frac{L_\mathcal{D} L_\ell}{\gamma}\) where \(L_\mathcal{D}\) is a a measure for sensitivity of distributions \(\mathcal{D}(\theta)\) with respect to predictions based on the Wasserstein distance, \(L_\ell\) is a Lipschitz constant for \(\ell\), and \(\ell\) is assumed to be \(\gamma\)-strictly convex. This bound is analogous to our bound \(\frac{\Vert Df(\p)\Vert_{\mathrm{op}}}{(1-L_f)\gamma_\p}\) from \Cref{thm:distance-to-fp}, %, where \(L_\mathcal{D}\) corresponds to the Lipschitz constant \(L_f\) for \(f\) and \(\gamma\)-strict convexity of \(G\) corresponds to the equivalent assumption \(\Vert Dg(\p)|_{\TPset}\Vert_{\op}\succeq\gamma\) for all \(\p\) (assuming the second derivative of \(G\) exists).
%but we use a different sensitivity measure for the distribution map, and we bound against \(\gamma_\p\) instead of assuming global strict convexity. 
which will allow us to minimize the bound in the two-outcome case by using exponential functions (\Cref{theorem:two-outcomes-arbitrarily-good-bounds}). This would not be possible when assuming \(\gamma\)-strong convexity, since there exist no functions that globally make the ratio \(\frac{L_\ell}{\gamma}\) arbitrarily small. \citet{perdomo2020performative} show that their bound can be made small by regularizing the loss function, but this would be undesirable in our setting, since regularized scoring rules would be improper and thus cease to incentivize honest reports even for constant \(f\).

\begin{example}[Bound for the quadratic scoring rule]
\label{example:bounds-for-brier}
    Consider the quadratic scoring rule $S(\p,i)=2p_i-\Vert\p\Vert_2^2$. Note that we can represent this in Gneiting and Raftery's characterization with \(G(\p)=\Vert \p\Vert^2\) and $g(\p)=2\p-\frac{2}{n}\mathbf{1}$. Thus, $Dg(\p)=2I$, where $I$ is the identity matrix. Hence \(Dg(\p)|_{\TPset}\succeq 2\). Further, $\Vert g(\p)\Vert _2=2\Vert \p-\frac{1}{n}\mathbf{1}\Vert $.
    Thus, for $f$ with Lipschitz constant $L_f$, \Cref{theorem:Caspar-approx-fix-point} implies that for the optimal report $\p$ we have that $\Vert f(\p)-\p\Vert \leq L_f\Vert \p-\frac{1}{n}\mathbf{1}\Vert \leq L_f \sqrt{(n-1)/n}$. If $L_f<1$, then by \Cref{thm:distance-to-fp} we further have $\Vert \p -\p^*\Vert \leq \frac{L_f}{1-L_f}\Vert \p-\frac{1}{n}\mathbf{1}\Vert\leq \frac{L_f}{1-L_f}\sqrt{(n-1)/n}$. %\co{Note that for $n=2$ this is now equivalent to the one-dimensional bound, since $d((p_1,1-p_1),(p_2,1-p_2))=\sqrt{2}|p_1-p_2|$.}
\end{example}

%\jt{cutting this for now}
%\jt{Unfortunately, there is no constant bound that holds on all of $\Delta(\mathcal{N})$ for the log scoring rule, and its formulas for the eigenvalues of $Dg(p)$ are more complicated. We therefore do not give bounds for the log scoring rule here.}

\begin{comment}
\co{Write more about why this is the case. Intuitively, the issue is that you might end up with a huge amount of securities in one outcome (where you report a probability close to $0$), while the other probabilities are high such that the rate at which new securities are bought ($g'$) is small.}

%\jt{no constant bound, but can you still say something about what this bound is at most?}\co{As discussed, it's infinite.}

\jt{we could give a bound for the logarithmic scoring rule in the binary case.}\co{Yeah, will do. In principle, one could also give the general parameterized-by-$\p$ bounds for the higher dimensional case, but from my calculations, the eigenvalues of $Dg(\p)$ are pretty complicated. It would be good for someone else to check. It seems that $g(p)=(\log p_i - (1/n)\sum_j \log p_j )_i$. So, $Dg(p)=\begin{pmatrix}
\frac{n-1}{n}\frac{1}{p_1} & ... & -\frac{1}{n}\frac{1}{p_n}\\
      \vdots              &  \ddots    & \vdots\\
-\frac{1}{n}\frac{1}{p_1}          &   ...  & \frac{n-1}{n}\frac{1}{p_n}\\
\end{pmatrix}.$ We can solve this, e.g., with Mathematica. You can find Mathematica commands in the comments here. The results seem to quickly get complicated.
%For n=2:
%Eigenvalues[{{1/2 * (1/p1), -1/2*(1/p2)}, {-1/2*(1/p2), 1/2*(1/p1)}}]}
%For n=3:
% Simplify[
% Eigenvalues[{{2/3 * p1, -1/3*p2, -1/3*p3}, {-1/3*p1, 
%    2/3*p2, -1/3*p3}, {-1/3*p1, -1/3*p2, 2/3*p3}}], {p1 >= 0, p2 >= 0,
%   p3 >= 0, p1 + p2 + p3 == 1}]
%For n=4:
%Simplify[
% Eigenvalues[{{3/4 * p1, -1/4*p2, -1/4*p3, -1/4*p4}, {-1/4*p1, 
%    3/4*p2, -1/4*p3, -1/4*p4}, {-1/4*p1, -1/4*p2, 
%    3/4*p3, -1/4*p4}, {-1/4*p1, -1/4*p2, -1/4*p3, 3/4*p4}}], {p1 >= 0,
%   p2 >= 0, p3 >= 0, p4 >= 0, p1 + p2 + p3 + p4 == 1}]
}

%For log scoring rule, we have \(g(p)=(1+\log p_i)_i\) and \(g'(p)=(\delta_{ij}\frac{1}{p_i})\) and thus \(\Vert g'(p)^{-1}\Vert_{op}=\max_i p_i\).
\end{comment}

\section{Approximate fixed-point prediction with the right proper scoring rules?}
\label{sec:approximate-fixed-point-prediction}

The above results show that depending on the scoring rule we can obtain bounds on the accuracy of performatively optimal predictions. Can we make these bounds arbitrarily small by choosing an appropriate scoring rule, e.g., one that makes $\Vert g(\p) \Vert / \gamma_{\p}$ very small at each point? In this section, we show that the answer is yes in the two-outcome case and no in the general case.

%\co{POSSIBLE CUT: Unfortunately, the exponential scoring rule is not that intuitive anymore, so I wonder whether to move the following paragraph and the example environment into the appendix.}
%We start with the two-outcome case. Inspired by Theorems TODO, we are looking for scoring rules that can make $\Vert g(\p)\Vert / \gamma_\p$ arbitrarily small. Intuitively, in the two-outcome case, $\gamma_\p$ is just (a lower bound on) the derivative $g$. Thus, the challenge is to find a function that is small compared to its derivative. Exponential functions then come to mind immediately.

\begin{restatable}{theorem}{exponentialthm}\label{theorem:two-outcomes-arbitrarily-good-bounds}
Consider the case of two outcomes, i.e., let $\mathcal{N}=\{1,2 \}$. Let $L_f\in \mathbb{R}$ and $\epsilon>0$. Then there exists a scoring rule $S$ s.t.\ under any $f$ with Lipschitz constant $L_f$, any optimal report $\p$ satisfies $\Vert \p-f(\p)\Vert \leq \epsilon$. If $L_f<1$, then there also exists a scoring rule that additionally ensures that under any $f$ with Lipschitz constant $L_f$, any optimal report satisfies $\Vert \p-\p^*\Vert \leq \epsilon$, where $\p^*$ is the (unique) fixed point of $f$.
\end{restatable}

Note that if there are multiple fixed points, then $S$ still induces preferences between---approximately---predicting these fixed points. In particular, because $S(\p,\p)$ is convex, the performatively optimal fixed point will either be the one that maximizes or the one that minimizes $p_1$ among the fixed points. This may be undesirable as the expert still has a strong incentive other than (though compatible with) honest prediction. We discuss this in more detail in Appendix~B.

Can arbitrarily good bounds be achieved with \textit{practical} proper scoring rules? Our proof of \Cref{theorem:two-outcomes-arbitrarily-good-bounds} uses exponential scoring rules with $g(\p)=(e^{L_fp_1/(\sqrt{2}\epsilon)},-e^{L_fp_1/(\sqrt{2}\epsilon)})^\top$. For high $L_f/\epsilon$, this scoring rule seems impractical, because the stakes vary greatly over the interval. For example, $S((\nicefrac{2}{3}+\epsilon,\nicefrac{1}{3}-\epsilon),(\nicefrac{2}{3},\nicefrac{1}{3}))/S((\nicefrac{1}{2}+\epsilon,\nicefrac{1}{2}-\epsilon),(\nicefrac{1}{2},\nicefrac{1}{2}))=e^{L_f/(6\sqrt{2}\epsilon)}$. Hence, as we increase $L_f/\epsilon$, it becomes exponentially more important for the expert to predict accurately near $\nicefrac{2}{3}$ than to predict accurately near $\nicefrac{1}{2}$. In particular, an AI model trained with this scoring rule may be much worse at predicting probabilities near $\nicefrac{1}{2}$ than near $\nicefrac{2}{3}$. Similarly, it is unrealistic to reward a human expert with, say, millions of dollars near $\nicefrac{2}{3}$ and with just a few cents near $\nicefrac{1}{2}$. Unfortunately, it turns out that all possible scoring rules that achieve bound $\epsilon$ under Lipschitz constant $L_f$ have this undesirable property, though the exact bound turns out to be somewhat complicated.

%\jt{this is the theorem that shows that if optimal reports are always close to fixed points, in 2 dimensions, then the scoring rule is kind of exponential, right?}\co{Yes! (Sorry that it ended up being a mess. Unfortunately, I think that's necessary. I'll add some explanations. There's a good chance that this will have to go in the appendix...)}\co{Okay, the result is now much more straightforward.}

%\jt{ok, to be completely honest, I vote for just giving this result in the floating text, descriptively and informally, and only giving the formal result in the appendix. Also helps with space and as it stands right now I think it's not sexy enough for main text.}\co{Hmmm... How about giving a version of the theorem that doesn't have the complicated term?}
\co{to do: give this in some kind of big O or similar notation, instead of giving the actual term}
\begin{restatable}{theorem}{needexponential}
\label{thm:need-exponential-new}
Suppose $S$ is a proper scoring rule s.t.\ for some $\epsilon, L_f > 0$ we have that whenever $f$ is $L_f$-Lipschitz, the optimal report $\p$ satisfies $\Vert f(\p) - \p\Vert < \epsilon$. Let $3\epsilon \leq p_l \leq p_h \leq 1-4\epsilon$ and $\delta=\epsilon / (L_f+1)$. Then the ratio of the supremum and infimum over $p_1\in [p_l,p_h]$ of $S((p_1+4\delta,1-p_1-4\delta),(p_1,1-p_1)) - S((p_1,1-p_1),(p_1,1-p_1))$ is at least
\begin{equation*}
    \frac{L_f}{2L_f+6}\left(3\frac{L_f+1}{L_f+3}\right)^{(L_f+1)(p_h-p_l)/(8\epsilon) -5/2}.
\end{equation*}
In particular, for fixed positive $L_f$, this term is exponential in $1/\epsilon$ and for fixed positive $\epsilon$ it is exponential in $L_f$.
\end{restatable}

Intuitively, the assumption on $S$ is that it ensures small accuracy bounds of $\epsilon$ for functions with Lipschitz constant $L_f$. Now note that $|S((p_1+4\delta,1-p_1-4\delta),(p_1,1-p_1)) - S((p_1,1-p_1),(p_1,1-p_1))|$ is the cost to the expert of misreporting by $4\delta$ when the true distribution is $(p_1,1-p_1)$. If this term is large, then the expert cares a lot about not misreporting by $4\delta$, and if the term is small, the expert does not mind misreporting much. Our result shows that the value of this term is much larger for some $p_1$ than it is for others, i.e., that for some probabilities $p_1$ the expert cares a lot more about accurately reporting $p_1$ than it does for other values of $p_1$. Our theorem puts a lower bound on the ratio between the largest and smallest possible values of that term. In particular, this does not hinge on probabilities $p_1$ near $0$ or $1$ and holds even if we restrict attention to probabilities between, say, $1/4$ and $3/4$.

%\co{CUT: One could think about expressing this without giving that horrible term, I suppose...}
%\ec{Can we remove the $\top$s inside the $S$ here? It's clear without them, and I think they just reduce readability.}

\begin{comment}
\begin{theorem}\label{thm:need-exponential}
Suppose $S$ is a proper scoring rule defined via $g$ s.t.\ for some $\epsilon, L_f > 0$ we have that whenever $f$ is $L_f$-Lipschitz, the optimal report $p^*$ satisfies $|f(p^*) - p^*| < \epsilon$. Let $\delta = \frac{\epsilon}{L_f+1}$. For $p\in [0,1]$, let 
\begin{equation*}
\hat g(p)=g((p,1-p)^\top)(1,-1)^\top.
\end{equation*}
%\left(g\begin{pmatrix} p+4\delta\\ 1-p-4\delta \end{pmatrix}-g\begin{pmatrix} p\\ 1-p \end{pmatrix}\right) \begin{pmatrix}1\\-1\end{pmatrix}
Then we have for all
$p\in [\nicefrac{1}{2},1-3\epsilon-2\delta]$,
\begin{equation*}
    \hat g(p+4\delta)-\hat g(p) \geq \frac{2L_f}{L_f+3}|\hat g(p)|.
\end{equation*}
and
\begin{equation*}
\begin{split}
    &\frac{\sup_{p\in [0,1-4\delta]} \hat g(p+4\delta)-\hat g(p)}{\inf_{p\in [0,1-4\delta]} \hat g(p+4\delta)-\hat g(p)}\\
    &\quad\quad \geq \frac{2L_f}{L_f+3}\left(3\frac{L_f+1}{L_f+3}\right)^{(\nicefrac{1}{8}-\epsilon)(L_f+1)/\epsilon -\nicefrac{5}{2}}.
\end{split}
\end{equation*}
\end{theorem}

\co{Need to a bunch to explain, e.g., to explain what $\hat g$ is. Basically $g(\mathbf p)(1,-1)^\top$ is how much you prefer one of the outcomes over the other when reporting $\mathbf p$. Another perspective is that $g$ might be non-canonical (entries not summing to $0$) and so the $(1,-1)^\top$ is dealing with that. An alternative way of dealing with this is to assume canonical $g$, i.e., $g_1+g_2=0$. Then $\hat g$ just becomes $2g_1((p,1-p)^\top)$.}
\end{comment}

%\jt{I think it might work to just define a \(g(p)\) where \(p\) is just one-d, and note somewhere that we can do this in the one-d case or so.}\co{Yeah, in general I wonder whether this is a good idea or not. So far I've made sure that the main text consistently uses the general notation, even in the two-outcome case. Let's leave it like that for the present submission but discuss again later.}
%\jt{sgtm.}

%\begin{theorem}
%Let $\mathcal{N}=\{1,2,3\}$ and $\epsilon,L>0$ s.t. [TODO: some relation between $\epsilon,L$]. Then there exists no scoring rule that ensures $\Vert p-f(p)\Vert \leq \epsilon$ or $\Vert p-p^*\Vert \leq \epsilon$ for all $f$ with Lipschitz constant $L$.
%\end{theorem}



\Cref{theorem:two-outcomes-arbitrarily-good-bounds} shows that in the binary prediction case, given a Lipschitz constant $L_f$ for the environment, we can achieve arbitrarily good bounds $\epsilon$ on the inaccuracy of the performatively optimal report. Unfortunately, this ceases to be possible in the many-outcome case. In that case, if all we know about $f$ is that it has Lipschitz constant $L_f$, there is some error $\epsilon$, linear in $L_f$ as $L_f\rightarrow 0$, that we must allow regardless of what strictly proper scoring rule we use.

\begin{restatable}{theorem}{impossibility}\label{thm:no_higher_dim_bound}
For any Lipschitz constant $L_f$, for $\epsilon>0$ sufficiently small, there is no proper scoring rule $S$ for the three-outcome case that achieves the following property: Whenever $f$ is $L_f$-Lipschitz, there is some performatively optimal report $\p$ with $\Vert f(\p)-\p\Vert  \leq \epsilon$. In particular, there exists some function $\epsilon(L_f)$ with $\epsilon(L_f) \sim c L_f$ as $L_f \rightarrow 0$ for some fixed constant $c$, s.t.\ the above property cannot be achieved with $\epsilon = \epsilon(L_f)$.  Thus, the best achievable bound is in $\Omega(L_f)$ as $L_f \rightarrow 0$, i.e., it scales at least linearly with $L_f$ in the limit.
\end{restatable}

\co{LOW PRIORITY: I think it would be good to have an argument in the appendix that the true bound is nothing super simple. I think scoring rules that reward only for guessing the right outcome probably give non-trivial bounds for high $L_f$, for instance...}

\co{LOW PRIORITY: Maybe it'd be good to show that something similar holds for the distance to fixed points as well.}

%TODO: say something more numeric about the bound perhaps.






\begin{figure*}[t]
\centering
\begin{subfigure}[t]{.45\textwidth}
    \centering
    \includegraphics[width=\textwidth]{scatterplot-opnormA-l2-inaccuracy-brier-it2.pdf}
    %\caption{}
    %\label{fig:scatterplot-opnormA-l2-%inaccuracy-brier}
\end{subfigure}%
\begin{subfigure}[t]{.45\textwidth}
    \centering
    \includegraphics[width=\textwidth]{scatterplot-opnormA-l2-disttofp-brier-it2.pdf}
    %\caption{}
\end{subfigure}
\caption{Scatter plots showing the L2 inaccuracy (left) and the distance to a fixed point (right) of the performatively optimal reports against the operator norm of $A$ in our experiments. In both plots, each point corresponds to a run of the experiments. The blue lines are found by linear regression on the points. The red lines show the bounds given in \Cref{example:bounds-for-brier} as a function of the Lipschitz constant $L_f$.
%(a) The behavior of a CCDR pretrained policy. For each perceived diff to the opponent $y$, the graph shows the expected distance of the learned policy's choice to to $f_C$ and to $f_D$. (b) Losses of Player 1 in 10 runs through the ABR phase.
}
%\vspace*{-\baselineskip}
%\label{fig:main-text-experimental-results}
\label{fig:scatterplot-opnormA-l2-inaccuracy-brier}
\label{fig:scatterplot-opnormA-l2-disttofp-brier}

\end{figure*}
\section{Numerical simulations}
\label{numerical-simulations}

\co{LOW PRIORITY: Currently we don't have anything for the log scoring rule anywhere.}

In this section, we provide some numerical simulations for the Brier score, to see how inaccurate performatively optimal predictions might be in practice. Throughout, we consider only affine-linear functions \(f\). This in particular means that all functions $f$ have operator norms between \(0\) and \(1\) and aside from degenerate cases a unique fixed point. The Mathematica notebook for our experiments (including some interactive widgets) is available at \url{https://github.com/johannestreutlein/scoring-rules-performative}. Although our experiments are set in toy models with linear $f$ and small sets of outcomes, they provide an initial estimate of the degree to which predictions can be off, depending on how much influence the expert can exert using their prediction. %This is just a toy model: in general, we will make predictions with more than two possible outcomes, and the dependence of an oracle's beliefs on its predictions will be highly nonlinear. Nevertheless, we believe that our analysis is useful to provide some initial intuition for the potential magnitude of the effect.

\subsection{Binary prediction}

\co{Make sure to mention somewhere how the L2 norm and the distance between the $p_1$s relate to each other, and justify the use of the L2 norm.}

\textbf{Experimental setup. } We begin with the binary prediction case, i.e., $\mathcal{N}=\{1,2\}$. %In this case, we can actually give exhaustive graphs.
We consider \(f\) to be affine linear with slope \(\alpha\) and fixed point \(\p^*\in \Delta(\mathcal{N})\), thus yielding the functional form $f(\p):=\p^*+\alpha(\p-\p^*)$ for all $\p\in \Delta(\{1,2\})$. Note that for all $\alpha\in [0,1]$ and all $\p^*\in \Pset$, a function thus defined is indeed a function $\Pset\rightarrow \Pset$. For $\alpha<0$, whether $f$ is a function $\Pset\rightarrow \Pset$ depends on $\p^*$. We restrict attention to $\alpha\in [0,1]$ for simplicity. %Note that $f$ thus defined is uniquely specified by two numbers: $p_1^*,\alpha\in[0,1]$.
%We consider only \(\alpha\leq 0.95\) to avoid instabilities when \(\alpha\approx 1\) and thus \(f\) becomes the identity function.

\textbf{Graphing inaccuracy and distance to fixed points. }
In \Cref{fig:density-plot-brier-l2-inaccuracy} (left), we plot the inaccuracy $\Vert \p - f(\p) \Vert$ of the performatively optimal report \(\p\) against $\alpha,p^*_1$.
In \Cref{fig:density-plot-brier-l2-disttofp} (right), we plot the L2 distance \(\Vert \p^*-\p\Vert\) of the performatively optimal report \(\p\) to the fixed point \(\p^*\). For that plot we limit $\alpha$ to the range $[0,0.95]$, because of instability at $\alpha\approx 1$. Note that relatively high inaccuracies can be found at various qualitatively different points in the graphs, even when the slope of \(f\) is small, i.e., when the oracle has little influence on the environment.

\begin{comment}
\begin{figure}
\begin{center}
\includegraphics[width=0.49\textwidth]{density plot brier l2 inaccuracy.pdf}
\end{center}
\caption{Heatmap of L2 distance of optimal prediction $\p$ to true probability distribution $f(\p)$, depending on fixed point position $p_1^*$ and $\alpha$ (slope of \(f\)), for the quadratic scoring rule.
}
\label{fig:density-plot-brier-l2-inaccuracy}
\end{figure}

\begin{figure}
\begin{center}
\includegraphics[width=0.49\textwidth]{density plot brier l2 disttofp.pdf}
\end{center}
\caption{Heatmap of L2 distance of optimal prediction $\p$ to the fixed point probability distribution $f(\p^*)$, depending on fixed point position $p_1^*$ and $\alpha$ (slope of \(f\)), for the quadratic scoring rule.
%\jt{why doesn't the slope here go to 1.0?}\co{The usual stability reason -- graph gets crazy at $\alpha\approx 1$.}
}
\label{fig:density-plot-brier-l2-disttofp}
\end{figure}
\end{comment}


\textbf{Assessing our bounds. }
To evaluate our bounds, we maximize distances across possible choices of fixed points \(\p^*\in \Delta(\{1,2\})\), and plot the maximal inaccuracy of the optimal prediction as well as the maximal distance from a fixed point in \Cref{fig:max-l2-distance-brier-two-outcome}. We compare to both theoretical bounds from \Cref{example:bounds-for-brier}, i.e., $\Vert \p - f(\p) \Vert _2\leq \alpha/\sqrt{2}$ and $\Vert \p - \p^* \Vert _2 \leq \alpha/((1-\alpha)\sqrt{2})$.
%\(|\hat{p}-f(\hat{p})|\leq \alpha \sup_p|g(p)/g'(p)|\) and 
% \(|\hat{p}-p^*|\leq \frac{\alpha}{1-\alpha}\sup_p|g(p)/g'(p)|\), where \(\sup_p|g(p)/g'(p)|=1/2\) for the quadratic scoring rule.

For both the quadratic and the log scoring rules (results in Appendix~C), our theoretical bounds are tight for slopes \(\alpha\leq 0.5\). For higher slopes, inaccuracy goes down, as the function \(f\) becomes closer to the identity function, and optimal predictions are bounded in \([0,1]\).

\subsection{Higher-dimensional prediction}

%\textbf{Experimental setup}

\textbf{Experimental setup. } Next, we turn to higher-dimensional predictions. We consider a model with five possible outcomes (i.e., $n=5$) and linear $f\colon p\mapsto Ap$ for $A\in\mathbb{R}^{n\times n}$. The map $f$ sends the simplex into itself if and only if all columns of $A$ lie in the simplex. We hence randomly generate the matrix $A$ by sampling each column uniformly from the simplex. Note that $A$ is the Jacobian of $f$ at every point.
%as follows. First we randomly generate numbers from 0 and 99 for each entry of the matrix. Then we normalize the columns to sum to $1$. %\jt{To me this seems like a hacky way to sample this. I don't think it's a uniform distribution on the simplex. (See \url{https://cs.stackexchange.com/questions/3227/uniform-sampling-from-a-simplex}. Why not a uniform distribution on the simplex instead?}\co{Yeah, good point! I changed it now in the code. (This is just the kind of thing I did in some random \textit{ad hoc} way when I first wrote the code and then never got around to changing...) (I'm just using rejection sampling for the simplex for now, because efficiency doesn't really matter.)}. \jt{ok, cool <3. Thank you!}

%as defined above maps all probability distributions onto probability distribution and 
%
%if and only if the columns of $A$ sum to $1$ and the entries of $A$ are all nonnegative.


For each $f_A$ thus created, we first find the performatively optimal report $\p$ and the fixed point $\p^*$. We then record the following quantities: the operator norm of $f_A$; %\jt{you are taking the operator norm just over the tangent space, right? How are you doing this?}\co{Yes. I do it numerically with Mathematica. (Code in comment.)}
    %TangentSpaceOpNormN[A_] := 
    %First@NMaximize[{Norm[A . Array[v, Length[A]]], 
    %Total[Array[v, Length[A]]] == 0 && 
    % Norm[Array[v, Length[A]]] <= 1}, Array[v, Length[A]]]
the distance of the fixed point distribution to the uniform distribution $ \Vert \p^*-\frac{1}{n}\boldsymbol{1}\Vert$; %\jt{we have the notation \(\mathbf{1}\) for this vector?}\co{Yup}
 the distance of the optimal report to the uniform distribution $\Vert \p - \frac{1}{n}\boldsymbol{1}\Vert $;
 the distance of the performatively optimal report to the fixed point $\Vert \p^*-\p\Vert$; % where $\p = \argmax_\p S(\p,f(\p))$ and $\p^*$ is the fixed point of $f_A$;
the inaccuracy of the performatively optimal report $\Vert f(\p)-\p\Vert $. %, where $\p=\argmax_\p S(\p,f(\p))$.
%\jt{I think we shouldn't list things we are tracking here that we are not reporting in the main text (we can maybe instead write one sentence about appendix and the things we are also tracking there)}
%
%We also track $\Vert \p - \frac{1}{n}\boldsymbol{1}\Vert _2$ and compare these numbers to the the bounds obtained in \Cref{example:bounds-for-brier}.
We are interested in how the last two quantities depend on the first two. We are also interested in how tight our bounds (from \Cref{example:bounds-for-brier}) are.%, some of which are stated in terms of the third item.

We collected 1000 random functions \(f_A\), but aborted 52 runs because they did not terminate within 120 seconds, leaving us with 948 data points.


%\textbf{Results}

\co{[LOW PRIORITY:] It would be cool to have a density scatter plot somewhere.}

\textbf{Inaccuracy. }
\Cref{fig:scatterplot-opnormA-l2-inaccuracy-brier} (left) plots the L2 inaccuracy (i.e., the distances $\Vert \p-f(\p) \Vert$). The blue line shows the best linear fit to the data points, which is given by $-0.0314 + 0.234 x$, whereas our bound is $2L_f/\sqrt{5}\approx 0.8944 L_f$. The average L2 inaccuracy is $0.100$ with a standard deviation of $0.0770$. The quartiles are $0.0419, 0.0759, 0.138$. The correlation between the operator norm of $f_A$ and $\Vert \p - f(\p)\Vert $ is $0.312$.

% More in appendix... Any higher-level takeaways?

\textbf{Distance to fixed points. }
\Cref{fig:scatterplot-opnormA-l2-disttofp-brier} (right) plots the L2 distance to the fixed point against the operator norm of $f_A$. The linear best fit (blue line) is given by  $-0.0966 + 0.440 x$, whereas our bound is $2L_f/(\sqrt{5}(1-L_f))\approx 0.8944 L_f / (1-L_f)$. The average L2 distance to the fixed point is $0.152$ with a standard deviation of $0.154$ and quartiles $0.0442, 0.0915, 0.210$. The correlation between the operator norm of $f_A$ and $\Vert\p^* - \p\Vert $ is $0.294$.

%Dist to fp:
%Worst-case difference: 0.713647
%Quartiles: 0.0196446, 0.034995, 0.0685926
%Avg: 0.0604947
%SD: 0.0829831
%Worst-case: 
%\Cref{fig:scatterplot-opnormA-l2-disttofp-brier}.


\textbf{The role of the location of the fixed point. } The graphs for the binary prediction case show that the location of the fixed point matters a lot for the accuracy of optimal reports (though the direction of the effect depends on the slope of $f$). A similar effect can be observed in the many-outcome case. In fact, the effect of the location of the fixed point is actually stronger (though less reliable) than the effect of the operator norm of $f_A$. We provide more detail in Appendix~C.2.2.

%\co{For space reasons, we can't give any more graphs here. So the graphs will have to go to the appendix. The main takeaway from these graphs is as in the two-outcome case: the location of the fixed point matters. In particular, if the fixed point is closer to uniform, that gives better results. It's interesting to compare this to the two-outcome case, where for high slope of $f$, it's actually \textit{better} but it's important to keep in mind that our operator norms are generally small in this experiments.}

\textbf{Loose bounds, tight bounds. } \Cref{fig:scatterplot-opnormA-l2-inaccuracy-brier,fig:scatterplot-opnormA-l2-disttofp-brier} show that, in contrast to the binary prediction case, our bounds in terms of the operator norm of $f$ are typically quite loose. For example, the average slack of the inaccuracy bound is $0.404$ with a standard deviation of $0.0998$ and quartiles $0.337, 0.400, 0.471$. Recall from \Cref{example:bounds-for-brier} that in addition to bounds in terms of $L_f$ alone we have bounds in terms of $L_f$ and $\Vert \p-\frac{1}{n}\mathbf{1}\Vert $. These bounds are much tighter with an average slack of $0.0644$ with a standard deviation of $0.0597$ and quartiles $0.0274, 0.0487, 0.0830$.

\co{%Here I will investigate the looseness of the bounds a bit more. Specifically, I will also consider the tighter bounds that have a factor of $\Vert  p - \mathrm{uniform}\Vert $ in them to see how much better they are. Basically, they are much better, which is interesting and important. I don't yet know, exactly, how to show these things. The simplest is to just compare the average distances to the bounds.
LOW PRIORITY: It might also be interesting to plot things against the location of $\p^*$ or so. Unfortunately, we don't have enormous amounts of space, so maybe we will only be able to do that in the appendix.

LOW PRIORITY: Could give analogous numbers for the bounds on distance to fixed point.}
%
%\jt{I don't think it is super important to give a detailed quantitative analysis of the different bounds. I think it would be enough to give plots against \(\Vert p- uniform\Vert\) in the appendix and make qualitative statements here. }

\textbf{Discussion. } Based on our simulations, misprediction in the five-outcome case seems about as problematic as in the binary prediction case. In contrast to the binary case, the bounds in terms of $L_f$ are quite loose. The bounds in terms of $\Vert \p-\frac{1}{n}\mathbf{1}\Vert $ are much tighter. Note that because these bounds depend on the performatively optimal report, they can only be derived a posteriori once a report has been submitted. As in the two-outcome case, both the location of the fixed point and the operator norm/slope of $f$ matter a lot for accuracy and distance to fixed point of the performatively optimal report.
%\co{
%\begin{itemize}
%    \item In practice, the high-dimensional bounds that only depend on $L_f$ aren't very tight.
%    \item The bounds that depend on $\Vert  p - \mathrm{uniform}\Vert $ are much tighter. But of course, these bounds have a different use case, because you can only apply them \textit{after} your get the prediction.
%    \item Interestingly, it seems like the errors aren't that much higher in the 5-outcome case, compared to the 2-outcome case. %\jt{you mean, the errors?}\co{Yup!}
%    \item Similar to two outcome case: For high operator norm, it gets worse on average but sometimes it's still fine.
%\end{itemize}
%s}   

\section{Fixed points via alternative notions of optimality}
\label{stop-gradients}

%\co{Generally this section looks very good to me.}
%\jt{nice! UwU}

%\co{I think somewhere here we could cite ratificationism as well, e.g., the Bell et al.\ paper.}
Here, we focus on alternative settings that lead to accurate predictions and do not induce preferences over fixed points. The idea behind all of them is that, instead of optimizing \(\p\) and \(f(\p)\) jointly, we keep \(\q:=f(\p)\) fixed while choosing a prediction \(\p\) to maximize \(S(\p,\q)\). Repeating this procedure leads to honest predictions, where the choice of fixed point depends on contingent facts such as initialization, instead of being chosen to maximize $S(\p,\p)$. An AI model using this procedure could be safer, because its predictions are honest, and because it does not optimize its choice of fixed point for any goal. In this section we give a summary of a more detailed treatment with formal results in Appendix~D.

\textbf{Performative stability. }
Alternatives to performative optimality have been discussed in the performative prediction literature. Translated into our setting, a prediction \(\p^*\) is called \emph{performatively stable} if $\p^*\in \argmax_{\p}\Score(\p,f(\p^*))$.
This implies \(\p^*=f(\p^*)\) whenever \(\Score\) is strictly proper, so performative stability is equivalent to being a fixed point. %This demonstrates that performative stability can be a normatively desirable solution concept in performative prediction settings.

%We can also express the performative stability objective as an equilibrium in a game between an expert making a prediction \(\p\) and a nature player choosing an outcome distribution \(\q\), where the expert is maximizing \(S(\p,\q)\) and the nature player is maximizing \(S(\q,f(\p))\). Here, if players act simultaneously, equilibrium strategies will be performatively stable and thus fixed points. Note that the stackelberg game in which the expert acts first instead leads to performatively optimal reports in equilibrium \citep{perdomo2020performative}.

\textbf{Repeated risk minimization and gradient descent. }
\citet{perdomo2020performative} consider learning algorithms that converge to performatively stable points, including repeated risk minimization and repeated gradient descent. In repeated risk minimization, we repeatedly update predictions via \(\p_{t+1}:=\argmax_\p S(\p,f(\p_t))\). Repeated gradient descent instead updates predictions via gradient descent on this objective. There also exist stochastic gradient descent versions of these algorithms \citep{mendler2020stochastic}. %That is, \(\p_{t+1}\defeq \argmax_{\p}\Score(\p,f(\p_{t+1}))\) or \(\p_{t+1}\defeq \p_{t}+\alpha \E_{y\sim f(\p_t)}[\nabla_p\Score(\p_t,y)]\). Note that since the distribution itself depends on \(\p_t\), this is not equal to \(\nabla_p\Score(\p_t,f(\p_t))\). Instead, it is equal to \(\nabla_p\Score(\p,\bot f(\p))\) where \(\bot\) is the stop-gradient operator that sets the derivative with respect to its argument to zero \cite{foerster2018dice}.
All of these schemes lead to stable points under appropriate conditions. We include a convergence proof for repeated gradient descent in our setting in Appendix~D.2. %  but on but where we only take the gradient with respect to \(\p\), not the term \(f(\p)\), i.e.,
%\[\p_{t+1}\defeq\p_t + \alpha \E_{y\sim f(\p_t)}[\nabla_p\Score(\p_t,y)]=
%\p_t + \alpha \nabla_p\Score(\p,\bot f(\p))
%\p_t + \alpha\left. \frac{\partial \Score(\p,\q)}%{\partial p}\right|_{\q=f(\p)}.\]
%where \(\bot\) is the stop-gradient operator that sets the derivative with respect to its argument to zero \cite{foerster2018dice}.
%They show that in their setting, this converges to performatively stable points. This is repeated for stochastic optimization (TODO other related work). We repeat a similar analysis for our setting in the appendix.%We can describe this as taking a \emph{stop-gradient} in front of \(f(\p)\), \[\p_{t+1}:=\p_t+\alpha\nabla_p\Score(\p,\bot f(\p))=\p_t+\alpha

\textbf{No-regret learning and prediction markets. } We also provide results for no-regret learning (Appendix~D.4) and prediction markets (Appendix~D.5). We introduce a no-regret learning setting and show that policies have sublinear regret if and only if they have sublinear prediction error. This differs from the setting considered by
\citet{pmlr-v162-jagadeesan22a}, in which no-regret policies converge to performatively optimal predictions.
%\co{Only give this informally. TODO Jonny}
%\co{We now have a problem here with terminology: This uses ``expert'' as in the regret learning with experts literature. But we now use ``expert AI'' to refer to what is here referred to as the ``agent''.}
%Honest predictions can also be incentivized in a no-regret learning framework. Concretely, consider the following setup. At time \(t\in\mathbb{N},\) the \emph{agent} (i.e., our AI expert) makes a prediction \(\Pvar_t\) and receives a score \(S(\Pvar_t,\Y_t)\), where \(Y_t\sim f(\Pvar_t)\). We then compare the accumulated score of the agent against that of the optimal prediction in expectation \(\Pvar^*_t\),
%$\mathrm{Regret}(T)\defeq \sum_{t=1}^T \Score(\Pvar^*_t,\Y_t)-S(\Pvar_t,\Y_t)$.
%Importantly, here environment outcomes \(Y_t\) are used to score both \(\Pvar^*_t\) and the agent's predictions, and thus \(\Pvar^*_t=f(\Pvar_t)\). As a result, we are able to show that given some assumptions, regret is sublinear, if and only if the prediction error \(\sum_{t=1}^T\Vert \Pvar_t-f(\Pvar_t)\Vert\) is sublinear. Note that here, predictions are allowed to oscillate between different fixed points. We show that if predictions converge, then they converge to a fixed point if and only if regret is sublinear.
Next, we provide a prediction market model and show that, if the weight of each trader in the market is small, equilibrium predictions by the market are close to fixed points. This is analogous to a result by \citet{hardt2022performative} bounding the distance of a market equilibrium from performatively stable points.

\section{Related work}
\label{related-work}

\textbf{Performative prediction. } In performative prediction, the goal is to find a model parameter \(\theta\in\mathbb{R}^d\) that minimizes an expected loss \(\E[\ell(Z;\theta)]\) where \(Z\) is a stochastic sample, usually a pair of input and target, \(Z=(X,Y)\). Unlike in the vanilla supervised learning setting, \(Z\sim\mathcal{D}(\theta)\) is sampled from a distribution \(\mathcal{D}(\theta)\) that itself depends on the chosen model parameter. Performatively optimal parameters are defined via \(\theta_{\mathrm{PO}}\in \argmin_\theta \E_{Z\sim \mathcal{D}(\theta)}[\ell(Z; \theta)]\), and the definition of performatively stable parameters is \(\theta_{\mathrm{PS}}\in \argmin_\theta \E_{Z\sim \mathcal{D}(\theta_{\mathrm{PS}})}[\ell(Z;\theta)]\). In general, performatively stable and optimal parameters can differ \citep[][Ex.~2.2]{perdomo2020performative}.

Our setting could be seen as a special case in which \(\theta\) is a single distribution \(\p\), data points are discrete outcomes \(y\), and the distribution \(\mathcal{D}(\theta)\) is given by \(f(\p)\). Unlike in the general performative prediction setting, we can determine the accuracy of a prediction \(\p\) as the distance from the distribution \(f(\p)\) (see \Cref{theorem:Caspar-approx-fix-point}), we can characterize predictions as honest if they are fixed points, and loss functions can be characterized as proper if they incentivize honest reports. As mentioned in \Cref{stop-gradients}, performatively stable points are fixed points and are thus a more desirable solution concept in our setting. % to optimizing for performative optimality \citep[][]{izzo2021learn,izzo2022learn}. %It would not make sense in our context to optimize explicitly for . 
There are some performative prediction settings in which performative optima can also be seen as manipulative and undesirable, such as in recommendation algorithms \citep{hardt2022performative}. However, as far as we are aware, we are the first to link performative stability to honesty in prediction.

%The setting in which a model's predictions can influence the distribution of the data points it is predicting has been discussed as \emph{performative prediction} \cite{perdomo2020performative} in the machine learning literature. They introduce performatively optimal and performatively stable criterion. 

%However, this setting is for arbitrary models and loss functions, and it considers continuous data points. It is thus unclear what results imply for performative probabilistic predictions, when incentivized by proper scoring rules.

%Moreover, the literature is motivated by minimization of loss rather than honest predictions. Hence, they actually are interested in gettin performatively optimal things. E.g. there are some papers explicitly optimizing for this ().


\textbf{Scoring rules. } While the literature on scoring rules generally assumes that predictions are not performative, a few authors in this literature have studied agents manipulating the world \textit{after} making a prediction \citep{shi2009prediction,oka2014predicting}. To our knowledge, the cases discussed do not involve agents influencing the world directly through their predictions. \citet{chan2022scoring} introduce performative probabilistic predictions using scoring rules. However, they focus on particular functional forms of \(f\) and binary predictions and do not provide a more general analysis. Another related setting in which it has been shown that no proper scoring rules exist is that of second-order prediction, in which experts report distributions over first-order distributions to express epistemic uncertainty \citep{bengs2023second}.

%\jt{copied from introduction}
%A proper scoring rule assigns scores to forecasts in a way that incentivizes honest reporting of beliefs [\citealp{Brier1950}; \citealp{Good1952}, Section 8; \citealp{McCarthy1956}; \citealp{Savage1971}; \citealp{gneiting2007strictly}]. Proper scoring rules have been used to incentivize truthful reports from experts \citep{carvalho2016overview}. They could thus be used as an objective %\jt{I don't like "training objective" since it's not clear an AI trained on an objective will also itself have this objective, and we don't talk about training except in the last section.}\co{:ok-hand:}
%for oracle AIs. 



\textbf{AI oracles. }
Issues with performativity have been mentioned in the literature on AI predictors or oracles \citep{armstrong2017good}.
Most prior work has focused on alleviating performativity altogether, e.g., by making the oracle predict \emph{counterfactual worlds} it cannot influence. We are not aware of any prior work on specifically the question of whether AI oracles would be incentivized to output fixed points at all.

%Our results in \Cref{preferences-between-fps} support the prior idea that an AI expert will try to make the world more predictable to get a higher score \cite{demski2019parable}. However, importantly, we show that it is not even clear whether an AI oracle would output a fixed point in the first place: how close the oracle's prediction will be to a fixed point depends on facts about the world and about the scoring rule. The problem thus persist even if there is a unique fixed point or no fixed point at all. It would not be sufficient for safety, for instance, to build an AI oracle with a unique and safe fixed point.

\textbf{Decision scoring rules and decision markets. }
The literature on decision scoring rules and decision markets considers a setting in which experts make predictions about what would happen if a decision maker were to pursue one course of action or another. The decision maker then chooses based on these predictions, making the predictions performative. As shown by \citet{Othman2010}, the expert may thus be incentivized to mispredict when subject to a proper scoring rule. However, this literature typically takes the perspective of the decision maker and thus assumes some knowledge of $f$. For example, \citet{Othman2010} and \citet{oesterheld2020decision} show that the scoring rule $S$ must be chosen to align in some sense with the decision maker's utility function (and thus $f$). \citet{Chen2014} propose that the decision maker could randomize to set good incentives, which in our setting would entail manipulating $f$.
%a lot of $f$.
%\co{TODO: Caspar}
%Work on \emph{decision markets} \cite{chen2011decision,oesterheld2020decision} tries to set the right incentives for predictions that inform decisions. However, in the decision market setup, predictions only affect the world by influencing the principal's final decision, whereas we consider an arbitrary relationship between world and prediction. Unlike in our setup, in the decision market setup, there exist scoring rules that do incentivize perfectly accurate reports. 

\textbf{Epistemic decision theory. }
A related topic in philosophy is \emph{epistemic decision theory}. In particular, \citet{greaves2013epistemic} introduces several cases in which outcomes depend on the agent's credences and compares the verdicts of different epistemic decision theories (such as an evidential and a causal version). While some of Greaves' examples involve agents knowably adopting incorrect beliefs, they require joint beliefs over several propositions, and Greaves only considers individual examples. We instead consider only a single binary prediction and prove results for arbitrary scoring rules and relationships between predictions and beliefs.


\textbf{Honest and truthful AI. }
Another related topic is honest and truthful AI \citep{evans2021truthful}. In our setting, an AI that reports an inaccurate prediction to achieve a higher score would be dishonest. \citet{evans2021truthful} discuss issues around training AIs to be truthful and honest, such as difficulties in judging truth. However, they do not explore performativity or proper scoring rules. We simplify our analysis by assuming that a ground truth exists and can be judged objectively. \citet{burns2022discovering} discuss extracting latent knowledge from AIs without relying on incentivizing honest reporting, but also do not address performativity.




%What does this mean for alignment?
% This result shows....




\section{Conclusion and future work}
\label{conclusion}
If predictions cannot influence which outcome occurs, then strictly proper scoring rules incentivize experts (humans or AI systems) to report honest predictions. This fails if predictions are performative. We showed that, in general, %they do not even output predictions that accurately reflect their beliefs
strictly proper scoring rules do not incentivize accurate predictions in a performative prediction setting. We analyzed this inaccuracy quantitatively and gave upper bounds on inaccuracy. We showed that in the case of binary prediction, there exist scoring rules that incentivize arbitrarily accurate predictions. In contrast, for more than two outcomes, it is not possible to achieve arbitrarily strong bounds on accuracy. Our numerical simulations in a toy setting confirm that our bounds are tight in some situations and that inaccurate performative predictions are common. Finally, we showed that by using other types of objectives, such as minimizing regret, we can build AI models that predict fixed points.

We hope that future work will shed further light on practical and safe uses of AI systems as predictors, i.e., oracle AIs. First, some of our bounds could probably be improved or generalized (to non-differentiable $f$ and $G$). Second, it would be valuable to have more specific models of $f$. Precise models of \(f\) may allow for stronger results \citep[cf.][]{Othman2010,oesterheld2020decision}. Third, we take a simplistic view of safety: we assume that incentives to predict honestly are good and that other incentives are problematic. We hope that future work will augment our analysis with more fine-grained models of safety. For example, a common safety concern is power-seeking behavior \citep{omohundro2008basic,turner2021optimal}. One could similarly ask to what extent performative oracle AI will spend compute to improve its ability to influence the world (cf.\ discussions of information acquisition, e.g., \citealp{Osband1989}; \citealp{neyman2021binary};
\citealp{li2022optimization}; \citealp{OesConAcquisition}).
Lastly, we are interested in theoretical and experimental evaluations of the practicality of different safe oracle AI designs and training setups.
\begin{acknowledgements}


CO acknowledges funding from the Cooperative AI Foundation, Polaris Ventures (formerly Center for Emerging Risk Research), and Jaan Tallinn's donor-advised fund at Founders Pledge.
JT and RH carried out most of this work as part of the SERI MATS program under the mentorship of Evan Hubinger (JT, RH) and Leo Gao (RH). JT is grateful for support from an Open Phil AI Fellowship and an FLI PhD Fellowship.
We sincerely thank four anonymous reviewers whose insightful comments helped us improve our paper. We are also indebted to Meena Jagadeesan, Erik Jenner, Adam Jermyn, and Marius Hobbhahn for their valuable discussions and feedback, and to Alexander Pan and Bastian Stern for pointing us to the relevant related literature. %Lastly, we thank Bastian Stern for directing us to relevant related work.
\end{acknowledgements}

\clearpage

%Future work:
% - Theory
%   - pseudo derivatives
%   - More nuanced modeling of safety. (Our model is just: honesty incentive good, other incentives bad, esp if they disagree with honesty.) Study in more detail the misaligned incentives. E.g., power-seeking.   
%   - Relatedly, incorporate some of the staples of scoring rules literature: information acquisition (which in the case of expert AI may simply consist in thinking) -- will it try to acquire information that helps it shape the world?
%  
% We are also interested in how practical the different designs are. In particular, are the safe designs practical. This can, of course, be studied both theoretically and experimentally.
%
%

%Future work brainstorming:
% - Versions of our results with pseudo derivatives.
% - More realistic f, more safety-critical f
% - Which of these are practical from an ML standpoint? (complexity theory)
% - Our theoretical results have suggestions for safety. Regret min > binary prediction with scoring rules that enforce fixed points > many-outcome prediction. Do these line up in practice. Investigations of safety through means other than asking whether honest predictions are incentivized.

%and showed that under some commonly used scoring rules, both the inaccuracy of predictions and the distance from fixed points can be large. To address this issue, we introduced scoring rules that minimize these quantities. However, we did not solve the problem of incentivizing the prediction of extreme fixed points.

\begin{comment}
The main takeaway from our model is that oracle AIs incentivized by strictly proper scoring rules may knowingly report inaccurate predictions. It is unclear how well our quantitative results apply to more realistic settings, and thus how inaccurate realistic oracles' predictions will be. Our model makes a number of simplifying and potentially inaccurate assumptions, including: (i) a single binary prediction setup;
(ii) the oracle maximizes a scoring rule;
(iii) a function \(f\) describes the relationship between the oracle's predictions and beliefs over the world. Our bounds also depend on differentiability of scoring rules and functions \(f\), and our numerical simulations assume affine linear \(f\).

We believe that our model and results will extend to higher-dimensional predictions, and the assumptions of differentiability could likely also be relaxed in future work. However, a more fundamental issue is better understanding the relationship between predictions and beliefs, especially for higher-dimensional predictions. We hope that further progress in these areas will help us determine the feasibility of safe oracle AI setups.

Another direction for future research that we are pursuing is incentive structures related to \href{https://www.alignmentforum.org/posts/4hdHto3uHejhY2F3Q/partial-agency}{stop-gradients}. If an AI is only trying to match its prediction to the world rather than jointly optimizing both the prediction and the world, then the only equilibria of this process may be fixed points. For example, some types of \href{https://www.alignmentforum.org/posts/hJaJw6LK39zpyCKW6/standard-ml-oracles-vs-counterfactual-ones}{ML oracles} might implement stop-gradients and therefore always converge to fixed points.
\end{comment}

%The {\it IJCAI--23 Proceedings} will be printed from electronic
%manuscripts submitted by the authors. These must be PDF ({\em Portable
%        Document Format}) files formatted for 8-1/2$''$ $\times$ 11$''$ paper.

%\subsection{Length of Papers}


%All paper {\em submissions} to the main track must have a maximum of seven pages, plus at most two for references / acknowledgements / contribution statement / ethics statement.
\begin{comment}
The length rules may change for final camera-ready versions of accepted papers and
differ between tracks. Some tracks may disallow any contents other than the references in the last two pages, whereas others allow for any content in all pages. Similarly, some tracks allow you to buy a few extra pages should you want to, whereas others don't.

If your paper is accepted, please carefully read the notifications you receive, and check the proceedings submission information website\footnote{\url{https://proceedings.ijcai.org/info}} to know how many pages you can use for your final version. That website holds the most up-to-date information regarding paper length limits at all times.


\subsection{Word Processing Software}

As detailed below, IJCAI has prepared and made available a set of
\LaTeX{} macros and a Microsoft Word template for use in formatting
your paper. If you are using some other word processing software, please follow the format instructions given below and ensure that your final paper looks as much like this sample as possible.

\section{Style and Format}

\LaTeX{} and Word style files that implement these instructions
can be retrieved electronically. (See Section~\ref{stylefiles} for
instructions on how to obtain these files.)

\subsection{Layout}

Print manuscripts two columns to a page, in the manner in which these
instructions are printed. The exact dimensions for pages are:
\begin{itemize}
    \item left and right margins: .75$''$
    \item column width: 3.375$''$
    \item gap between columns: .25$''$
    \item top margin---first page: 1.375$''$
    \item top margin---other pages: .75$''$
    \item bottom margin: 1.25$''$
    \item column height---first page: 6.625$''$
    \item column height---other pages: 9$''$
\end{itemize}

All measurements assume an 8-1/2$''$ $\times$ 11$''$ page size. For
A4-size paper, use the given top and left margins, column width,
height, and gap, and modify the bottom and right margins as necessary.

\subsection{Format of Electronic Manuscript}

For the production of the electronic manuscript, you must use Adobe's
{\em Portable Document Format} (PDF). A PDF file can be generated, for
instance, on Unix systems using {\tt ps2pdf} or on Windows systems
using Adobe's Distiller. There is also a website with free software
and conversion services: \url{http://www.ps2pdf.com}. For reasons of
uniformity, use of Adobe's {\em Times Roman} font is strongly suggested.
In \LaTeX2e{} this is accomplished by writing
\begin{quote}
    \mbox{\tt $\backslash$usepackage\{times\}}
\end{quote}
in the preamble.\footnote{You may want to also use the package {\tt
            latexsym}, which defines all symbols known from the old \LaTeX{}
    version.}

Additionally, it is of utmost importance to specify the {\bf
        letter} format (corresponding to 8-1/2$''$ $\times$ 11$''$) when
formatting the paper. When working with {\tt dvips}, for instance, one
should specify {\tt -t letter}.

\subsection{Papers Submitted for Review vs. Camera-ready Papers}
In this document, we distinguish between papers submitted for review (henceforth, submissions) and camera-ready versions, i.e., accepted papers that will be included in the conference proceedings. The present document provides information to be used by both types of papers (submissions / camera-ready). There are relevant differences between the two versions. Find them next.

\subsubsection{Anonymity}
For the main track and some of the special tracks, submissions must be anonymous; for other special tracks they must be non-anonymous. The camera-ready versions for all tracks are non-anonymous. When preparing your submission, please check the track-specific instructions regarding anonymity.

\subsubsection{Submissions}
The following instructions apply to submissions:
\begin{itemize}
\item If your track requires submissions to be anonymous, they must be fully anonymized as discussed in the Modifications for Blind Review subsection below; in this case, Acknowledgements and Contribution Statement sections are not allowed.

\item If your track requires non-anonymous submissions, you should provide all author information at the time of submission, just as for camera-ready papers (see below); Acknowledgements and Contribution Statement sections are allowed, but optional.

\item Submissions must include line numbers to facilitate feedback in the review process. Enable line numbers by uncommenting the command {\tt \textbackslash{}linenumbers} in the preamble.\footnote{New in IJCAI--23}

\item The limit on the number of  content pages is \emph{strict}. All papers exceeding the limits will be desk rejected.
\end{itemize}

\subsubsection{Camera-Ready Papers}
The following instructions apply to camera-ready papers:

\begin{itemize}
\item Authors and affiliations are mandatory. Explicit self-references are allowed. It is strictly forbidden to add authors not declared at submission time.

\item Acknowledgements and Contribution Statement sections are allowed, but optional.

\item Line numbering must be disabled. To achieve this, comment or disable {\tt \textbackslash{}linenumbers} in the preamble.

\item For some of the tracks, you can exceed the page limit by purchasing extra pages.
\end{itemize}

\subsection{Title and Author Information}

Center the title on the entire width of the page in a 14-point bold
font. The title must be capitalized using Title Case. For non-anonymous papers, author names and affiliations should appear below the title. Center author name(s) in 12-point bold font. On the following line(s) place the affiliations.

\subsubsection{Author Names}

Each author name must be followed by:
\begin{itemize}
    \item A newline {\tt \textbackslash{}\textbackslash{}} command for the last author.
    \item An {\tt \textbackslash{}And} command for the second to last author.
    \item An {\tt \textbackslash{}and} command for the other authors.
\end{itemize}

\subsubsection{Affiliations}

After all authors, start the affiliations section by using the {\tt \textbackslash{}affiliations} command.
Each affiliation must be terminated by a newline {\tt \textbackslash{}\textbackslash{}} command. Make sure that you include the newline after the last affiliation, too.

\subsubsection{Mapping Authors to Affiliations}

In some scenarios, the affiliation of each author is clear without any further indication (\emph{e.g.}, all authors share the same affiliation, all authors have a single and different affiliation). In these situations you don't need to do anything special.

In more complex scenarios you will have to clearly indicate the affiliation(s) for each author. This is done by using numeric math superscripts {\tt \$\{\^{}$i,j, \ldots$\}\$}. You must use numbers, not symbols, because those are reserved for footnotes in this section (should you need them). Check the authors definition in this example for reference.

\subsubsection{Emails}

This section is optional, and can be omitted entirely if you prefer. If you want to include e-mails, you should either include all authors' e-mails or just the contact author(s)' ones.

Start the e-mails section with the {\tt \textbackslash{}emails} command. After that, write all emails you want to include separated by a comma and a space, following the order used for the authors (\emph{i.e.}, the first e-mail should correspond to the first author, the second e-mail to the second author and so on).

You may ``contract'' consecutive e-mails on the same domain as shown in this example (write the users' part within curly brackets, followed by the domain name). Only e-mails of the exact same domain may be contracted. For instance, you cannot contract ``person@example.com'' and ``other@test.example.com'' because the domains are different.


\subsubsection{Modifications for Blind Review}
When submitting to a track that requires anonymous submissions,
in order to make blind reviewing possible, authors must omit their
names, affiliations and e-mails. In place
of names, affiliations and e-mails, you can optionally provide the submission number and/or
a list of content areas. When referring to one's own work,
use the third person rather than the
first person. For example, say, ``Previously,
Gottlob~\citet{gottlob:nonmon} has shown that\ldots'', rather
than, ``In our previous work~\cite{gottlob:nonmon}, we have shown
that\ldots'' Try to avoid including any information in the body of the
paper or references that would identify the authors or their
institutions, such as acknowledgements. Such information can be added post-acceptance to be included in the camera-ready
version.
Please also make sure that your paper metadata does not reveal
the authors' identities.

\subsection{Abstract}

Place the abstract at the beginning of the first column 3$''$ from the
top of the page, unless that does not leave enough room for the title
and author information. Use a slightly smaller width than in the body
of the paper. Head the abstract with ``Abstract'' centered above the
body of the abstract in a 12-point bold font. The body of the abstract
should be in the same font as the body of the paper.

The abstract should be a concise, one-paragraph summary describing the
general thesis and conclusion of your paper. A reader should be able
to learn the purpose of the paper and the reason for its importance
from the abstract. The abstract should be no more than 200 words long.

\subsection{Text}

The main body of the text immediately follows the abstract. Use
10-point type in a clear, readable font with 1-point leading (10 on
11).

Indent when starting a new paragraph, except after major headings.

\subsection{Headings and Sections}

When necessary, headings should be used to separate major sections of
your paper. (These instructions use many headings to demonstrate their
appearance; your paper should have fewer headings.) All headings should be capitalized using Title Case.

\subsubsection{Section Headings}

Print section headings in 12-point bold type in the style shown in
these instructions. Leave a blank space of approximately 10 points
above and 4 points below section headings.  Number sections with
Arabic numerals.

\subsubsection{Subsection Headings}

Print subsection headings in 11-point bold type. Leave a blank space
of approximately 8 points above and 3 points below subsection
headings. Number subsections with the section number and the
subsection number (in Arabic numerals) separated by a
period.

\subsubsection{Subsubsection Headings}

Print subsubsection headings in 10-point bold type. Leave a blank
space of approximately 6 points above subsubsection headings. Do not
number subsubsections.

\textbf{Titled paragraphs.} You should use titled paragraphs if and
only if the title covers exactly one paragraph. Such paragraphs should be
separated from the preceding content by at least 3pt, and no more than
6pt. The title should be in 10pt bold font and end with a period.
After that, a 1em horizontal space should follow the title before
the paragraph's text.

In \LaTeX{} titled paragraphs should be typeset using
\begin{quote}
    {\tt \textbackslash{}paragraph\{Title.\} text} .
\end{quote}

\subsection{Special Sections}

\subsubsection{Appendices}
You may move some of the contents of the paper into one or more appendices that appear after the main content, but before references. These appendices count towards the page limit and are distinct from the supplementary material that can be submitted separately through CMT. Such appendices are useful if you would like to include highly technical material (such as a lengthy calculation) that will disrupt the flow of the paper. They can be included both in papers submitted for review and in camera-ready versions; in the latter case, they will be included in the proceedings (whereas the supplementary materials will not be included in the proceedings).
Appendices are optional. Appendices must appear after the main content.
Appendix sections must use letters instead of Arabic numerals. In \LaTeX,  you can use the {\tt \textbackslash{}appendix} command to achieve this followed by  {\tt \textbackslash section\{Appendix\}} for your appendix sections.

\subsubsection{Ethical Statement}

Ethical Statement is optional. You may include an Ethical Statement to discuss  the ethical aspects and implications of your research. The section should be titled \emph{Ethical Statement} and be typeset like any regular section but without being numbered. This section may be placed on the References pages.

Use
\begin{quote}
    {\tt \textbackslash{}section*\{Ethical Statement\}}
\end{quote}

\subsubsection{Acknowledgements}

Acknowledgements are optional. In the camera-ready version you may include an unnumbered acknowledgments section, including acknowledgments of help from colleagues, financial support, and permission to publish. This is not allowed in the anonymous submission. If present, acknowledgements must be in a dedicated, unnumbered section appearing after all regular sections but before references.  This section may be placed on the References pages.

Use
\begin{quote}
    {\tt \textbackslash{}section*\{Acknowledgements\}}
\end{quote}
to typeset the acknowledgements section in \LaTeX{}.


\subsubsection{Contribution Statement}

Contribution Statement is optional. In the camera-ready version you may include an unnumbered Contribution Statement section\footnote{New in IJCAI--23}, explicitly describing the contribution of each of the co-authors to the paper. This is not allowed in the anonymous submission. If present, Contribution Statement must be in a dedicated, unnumbered section appearing after all regular sections but before references.  This section may be placed on the References pages.

Use
\begin{quote}
    {\tt \textbackslash{}section*\{Contribution Statement\}}
\end{quote}
to typeset the Contribution Statement section in \LaTeX{}.

\subsubsection{References}

The references section is headed ``References'', printed in the same
style as a section heading but without a number. A sample list of
references is given at the end of these instructions. Use a consistent
format for references. The reference list should not include publicly unavailable work.

\subsubsection{Order of Sections}
Sections should be arranged in the following order:
\begin{enumerate}
    \item Main content sections (numbered)
    \item Appendices (optional, numbered using capital letters)
    \item Ethical statement (optional, unnumbered)
    \item Acknowledgements (optional, unnumbered)
    \item Contribution statement (optional, unnumbered)
    \item References (required, unnumbered)
\end{enumerate}

\subsection{Citations}

Citations within the text should include the author's last name and
the year of publication, for example~\cite{gottlob:nonmon}.  Append
lowercase letters to the year in cases of ambiguity.  Treat multiple
authors as in the following examples:~\cite{abelson-et-al:scheme}
or~\cite{bgf:Lixto} (for more than two authors) and
\cite{brachman-schmolze:kl-one} (for two authors).  If the author
portion of a citation is obvious, omit it, e.g.,
Nebel~\citet{nebel:jair-2000}.  Collapse multiple citations as
follows:~\cite{gls:hypertrees,levesque:functional-foundations}.
\nocite{abelson-et-al:scheme}
\nocite{bgf:Lixto}
\nocite{brachman-schmolze:kl-one}
\nocite{gottlob:nonmon}
\nocite{gls:hypertrees}
\nocite{levesque:functional-foundations}
\nocite{levesque:belief}
\nocite{nebel:jair-2000}

\subsection{Footnotes}

Place footnotes at the bottom of the page in a 9-point font.  Refer to
them with superscript numbers.\footnote{This is how your footnotes
    should appear.} Separate them from the text by a short
line.\footnote{Note the line separating these footnotes from the
    text.} Avoid footnotes as much as possible; they interrupt the flow of
the text.

\section{Illustrations}

Place all illustrations (figures, drawings, tables, and photographs)
throughout the paper at the places where they are first discussed,
rather than at the end of the paper.

They should be floated to the top (preferred) or bottom of the page,
unless they are an integral part
of your narrative flow. When placed at the bottom or top of
a page, illustrations may run across both columns, but not when they
appear inline.

Illustrations must be rendered electronically or scanned and placed
directly in your document. They should be cropped outside \LaTeX{},
otherwise portions of the image could reappear during the post-processing of your paper.
When possible, generate your illustrations in a vector format.
When using bitmaps, please use 300dpi resolution at least.
All illustrations should be understandable when printed in black and
white, albeit you can use colors to enhance them. Line weights should
be 1/2-point or thicker. Avoid screens and superimposing type on
patterns, as these effects may not reproduce well.

Number illustrations sequentially. Use references of the following
form: Figure 1, Table 2, etc. Place illustration numbers and captions
under illustrations. Leave a margin of 1/4-inch around the area
covered by the illustration and caption.  Use 9-point type for
captions, labels, and other text in illustrations. Captions should always appear below the illustration.

\section{Tables}

Tables are treated as illustrations containing data. Therefore, they should also appear floated to the top (preferably) or bottom of the page, and with the captions below them.

\begin{table}
    \centering
    \begin{tabular}{lll}
        \hline
        Scenario  & $\delta$ & Runtime \\
        \hline
        Paris     & 0.1s     & 13.65ms \\
        Paris     & 0.2s     & 0.01ms  \\
        New York  & 0.1s     & 92.50ms \\
        Singapore & 0.1s     & 33.33ms \\
        Singapore & 0.2s     & 23.01ms \\
        \hline
    \end{tabular}
    \caption{Latex default table}
    \label{tab:plain}
\end{table}

\begin{table}
    \centering
    \begin{tabular}{lrr}
        \toprule
        Scenario  & $\delta$ (s) & Runtime (ms) \\
        \midrule
        Paris     & 0.1          & 13.65        \\
                  & 0.2          & 0.01         \\
        New York  & 0.1          & 92.50        \\
        Singapore & 0.1          & 33.33        \\
                  & 0.2          & 23.01        \\
        \bottomrule
    \end{tabular}
    \caption{Booktabs table}
    \label{tab:booktabs}
\end{table}

If you are using \LaTeX, you should use the {\tt booktabs} package, because it produces tables that are better than the standard ones. Compare Tables~\ref{tab:plain} and~\ref{tab:booktabs}. The latter is clearly more readable for three reasons:

\begin{enumerate}
    \item The styling is better thanks to using the {\tt booktabs} rulers instead of the default ones.
    \item Numeric columns are right-aligned, making it easier to compare the numbers. Make sure to also right-align the corresponding headers, and to use the same precision for all numbers.
    \item We avoid unnecessary repetition, both between lines (no need to repeat the scenario name in this case) as well as in the content (units can be shown in the column header).
\end{enumerate}

\section{Formulas}

IJCAI's two-column format makes it difficult to typeset long formulas. A usual temptation is to reduce the size of the formula by using the {\tt small} or {\tt tiny} sizes. This doesn't work correctly with the current \LaTeX{} versions, breaking the line spacing of the preceding paragraphs and title, as well as the equation number sizes. The following equation demonstrates the effects (notice that this entire paragraph looks badly formatted, and the line numbers no longer match the text):
%
\begin{tiny}
    \begin{equation}
        x = \prod_{i=1}^n \sum_{j=1}^n j_i + \prod_{i=1}^n \sum_{j=1}^n i_j + \prod_{i=1}^n \sum_{j=1}^n j_i + \prod_{i=1}^n \sum_{j=1}^n i_j + \prod_{i=1}^n \sum_{j=1}^n j_i
    \end{equation}
\end{tiny}%

Reducing formula sizes this way is strictly forbidden. We {\bf strongly} recommend authors to split formulas in multiple lines when they don't fit in a single line. This is the easiest approach to typeset those formulas and provides the most readable output%
%
\begin{align}
    x = & \prod_{i=1}^n \sum_{j=1}^n j_i + \prod_{i=1}^n \sum_{j=1}^n i_j + \prod_{i=1}^n \sum_{j=1}^n j_i + \prod_{i=1}^n \sum_{j=1}^n i_j + \nonumber \\
    +   & \prod_{i=1}^n \sum_{j=1}^n j_i.
\end{align}%

If a line is just slightly longer than the column width, you may use the {\tt resizebox} environment on that equation. The result looks better and doesn't interfere with the paragraph's line spacing: %
\begin{equation}
    \resizebox{.91\linewidth}{!}{$
            \displaystyle
            x = \prod_{i=1}^n \sum_{j=1}^n j_i + \prod_{i=1}^n \sum_{j=1}^n i_j + \prod_{i=1}^n \sum_{j=1}^n j_i + \prod_{i=1}^n \sum_{j=1}^n i_j + \prod_{i=1}^n \sum_{j=1}^n j_i
        $}.
\end{equation}%

This last solution may have to be adapted if you use different equation environments, but it can generally be made to work. Please notice that in any case:

\begin{itemize}
    \item Equation numbers must be in the same font and size as the main text (10pt).
    \item Your formula's main symbols should not be smaller than {\small small} text (9pt).
\end{itemize}

For instance, the formula
%
\begin{equation}
    \resizebox{.91\linewidth}{!}{$
            \displaystyle
            x = \prod_{i=1}^n \sum_{j=1}^n j_i + \prod_{i=1}^n \sum_{j=1}^n i_j + \prod_{i=1}^n \sum_{j=1}^n j_i + \prod_{i=1}^n \sum_{j=1}^n i_j + \prod_{i=1}^n \sum_{j=1}^n j_i + \prod_{i=1}^n \sum_{j=1}^n i_j
        $}
\end{equation}
%
would not be acceptable because the text is too small.

\section{Examples, Definitions, Theorems and Similar}

Examples, definitions, theorems, corollaries and similar must be written in their own paragraph. The paragraph must be separated by at least 2pt and no more than 5pt from the preceding and succeeding paragraphs. They must begin with the kind of item written in 10pt bold font followed by their number (e.g.: {\bf Theorem 1}),
optionally followed by a title/summary between parentheses in non-bold font and ended with a period (in bold).
After that the main body of the item follows, written in 10 pt italics font (see below for examples).

In \LaTeX{} we strongly recommend that you define environments for your examples, definitions, propositions, lemmas, corollaries and similar. This can be done in your \LaTeX{} preamble using \texttt{\textbackslash{newtheorem}} -- see the source of this document for examples. Numbering for these items must be global, not per-section (e.g.: Theorem 1 instead of Theorem 6.1).

\begin{example}[How to write an example]
    Examples should be written using the example environment defined in this template.
\end{example}

\begin{theorem}
    This is an example of an untitled theorem.
\end{theorem}

You may also include a title or description using these environments as shown in the following theorem.

\begin{theorem}[A titled theorem]
    This is an example of a titled theorem.
\end{theorem}

\section{Proofs}

Proofs must be written in their own paragraph(s) separated by at least 2pt and no more than 5pt from the preceding and succeeding paragraphs. Proof paragraphs should start with the keyword ``Proof.'' in 10pt italics font. After that the proof follows in regular 10pt font. At the end of the proof, an unfilled square symbol (qed) marks the end of the proof.

In \LaTeX{} proofs should be typeset using the \texttt{\textbackslash{proof}} environment.

\begin{proof}
    This paragraph is an example of how a proof looks like using the \texttt{\textbackslash{proof}} environment.
\end{proof}


\section{Algorithms and Listings}

Algorithms and listings are a special kind of figures. Like all illustrations, they should appear floated to the top (preferably) or bottom of the page. However, their caption should appear in the header, left-justified and enclosed between horizontal lines, as shown in Algorithm~\ref{alg:algorithm}. The algorithm body should be terminated with another horizontal line. It is up to the authors to decide whether to show line numbers or not, how to format comments, etc.

In \LaTeX{} algorithms may be typeset using the {\tt algorithm} and {\tt algorithmic} packages, but you can also use one of the many other packages for the task.

\begin{algorithm}[tb]
    \caption{Example algorithm}
    \label{alg:algorithm}
    \textbf{Input}: Your algorithm's input\\
    \textbf{Parameter}: Optional list of parameters\\
    \textbf{Output}: Your algorithm's output
    \begin{algorithmic}[1] %[1] enables line numbers
        \STATE Let $t=0$.
        \WHILE{condition}
        \STATE Do some action.
        \IF {conditional}
        \STATE Perform task A.
        \ELSE
        \STATE Perform task B.
        \ENDIF
        \ENDWHILE
        \STATE \textbf{return} solution
    \end{algorithmic}
\end{algorithm}

\section{\LaTeX{} and Word Style Files}\label{stylefiles}

The \LaTeX{} and Word style files are available on the IJCAI--23
website, \url{https://ijcai-23.org/}.
These style files implement the formatting instructions in this
document.

The \LaTeX{} files are {\tt ijcai23.sty} and {\tt ijcai23.tex}, and
the Bib\TeX{} files are {\tt named.bst} and {\tt ijcai23.bib}. The
\LaTeX{} style file is for version 2e of \LaTeX{}, and the Bib\TeX{}
style file is for version 0.99c of Bib\TeX{} ({\em not} version
0.98i). The {\tt ijcai23.sty} style differs from the {\tt
        ijcai22.sty} file used for IJCAI--22.

The Microsoft Word style file consists of a single file, {\tt
        ijcai23.docx}. This template differs from the one used for
IJCAI--22.

These Microsoft Word and \LaTeX{} files contain the source of the
present document and may serve as a formatting sample.

Further information on using these styles for the preparation of
papers for IJCAI--23 can be obtained by contacting {\tt
        proceedings@ijcai.org}.
\end{comment}



%\section*{Ethical Statement}

%There are no ethical issues.

%\section*{Acknowledgments}
%
% Acknowledge people we acknowledge in original post.
% Acknowledge Vince, Meena Jagadeesan


%% The file named.bst is a bibliography style file for BibTeX 0.99c
\bibliography{refs}

\onecolumn


\appendix



\end{document}
