\documentclass[accepted]{uai2025} % for initial submission
% \documentclass[accepted]{uai2025} % after acceptance, for a revised version; 
% also before submission to see how the non-anonymous paper would look like 
                        
%% There is a class option to choose the math font
% \documentclass[mathfont=ptmx]{uai2025} % ptmx math instead of Computer
                                         % Modern (has noticeable issues)
% \documentclass[mathfont=newtx]{uai2025} % newtx fonts (improves upon
                                          % ptmx; less tested, no support)
% NOTE: Only keep *one* line above as appropriate, as it will be replaced
%       automatically for papers to be published. Do not make any other
%       change above this note for an accepted version.

\relax % controls
  \newif\ifbiblatex \biblatexfalse

%% Choose your variant of English; be consistent
\usepackage[american]{babel}
% \usepackage[british]{babel}

%% Some suggested packages, as needed:
\usepackage{natbib} % has a nice set of citation styles and commands
    \bibliographystyle{plainnat}
    \renewcommand{\bibsection}{\subsubsection*{References}}
% \usepackage{mathtools} % amsmath with fixes and additions
% \usepackage{siunitx} % for proper typesetting of numbers and units
\usepackage{booktabs} % commands to create good-looking tables
% \usepackage{tikz} % nice language for creating drawings and diagrams

%% Provided macros
% \smaller: Because the class footnote size is essentially LaTeX's \small,
%           redefining \footnotesize, we provide the original \footnotesize
%           using this macro.
%           (Use only sparingly, e.g., in drawings, as it is quite small.)

\input{confidence-preamble}
  % \marginprooflinksfalse
  \marginprooflinkstrue

% \newcommand\vnew[1]{{\color{violet}#1}}
\newcommand\vnew\relax 

\title{Learning with Confidence}

% The standard author block has changed for UAI 2025 to provide
% more space for long author lists and allow for complex affiliations
%
% All author information is automatically removed by the class for the
% anonymous submission version of your paper, so you can already add your
% information below.
%
% Add authors
\author[1,2]{\href{mailto:<oli@cs.cornell.edu>?Subject=Learning With Confidence}{Oliver E. Richardson}{}}
% Add affiliations after the authors

\affil[1]{%
    Computer Science Dept.\\
    Universit\'{e} de Montr\'eal\\
    Montr\'eal, Canada
}
\affil[2]{%
    Mila -- Quebec AI Institute
}

\begin{document}
\maketitle

\begin{abstract}
  % We characterize a notion of confidence that arises when learning or updating beliefs. This \emph{learner's confidence} can be used alongside (and is easily be mistaken for) probability or likelihood, but it is fundamentally a different concept. 
  % Although perhaps not as useful as probability itself, our notion of confidence captures and unifies many concepts in the literature, from Shafer's weight of evidence, to Kalman gain, as well as number of training epochs and learning rate.
  % We provide a mathematical definition of what it means to learn with confidence, and give two canonical ways of measuring confidence on a continuum. 
  % Under additional assumptions, we derive more compact representations of confidence-based learning in terms of vector fields and loss functions.
  % These representations induce an extended language of compound ``parallel'' observations. 
  % We illustrate our framework by analyzing standard ways of updating beliefs.

  We characterize a notion of confidence that arises in learning or updating beliefs:
    the amount of trust one has in incoming information and its impact on the belief state. 
  This \emph{learner's confidence} can be used alongside (and is easily mistaken for) probability or likelihood, but it is fundamentally a different concept---one that captures many familiar concepts in the literature, including learning rates and number of training epochs, Shafer's weight of evidence,  and Kalman gain.
  We formally axiomatize what it means to learn with confidence, give two canonical ways of measuring confidence on a continuum, and prove that confidence can always be represented in this way. 
  Under additional assumptions, we derive more compact representations of confidence-based learning in terms of vector fields and loss functions.
  These representations induce an extended language of compound ``parallel'' observations. 
  We characterize \emph{Bayesian} learning as the special case of an \emph{optimizing learner} whose loss representation is a linear expectation. 
  % We illustrate our framework by analyzing standard ways of updating beliefs.
\end{abstract}


\section{Introduction}\label{sec:intro}
\input{sections/intro}
    
\section{A Formal Model of Confidence, Learning, and Belief}
\input{sections/update-formalism}

\section{The Confidence Continuum}
\input{sections/additive-and-fields}

\subsection{Optimizing Learners}
\input{sections/loss-repr}

% \section{Bayesian and Boltzmann Learning}
% \section{Boltzmann and the Bayesian}
\section{Boltzmann and Bayes}
% \vnew{\subsection{Boltzmann and Bayes}}
    \input{sections/bayes} 
    
% \vnew{
% \section{How to Select Confidence?}
% it is true that the user can freely choose the learning rate or elect to duplicate training examples. (Indeed, our framework allows for the user to freely choose their confidence in each observation.) But the fact that we are “free” to make these choices does not mean that they are arbitrary or meaningless. Clearly these choices matter—they result in different trained models, with different behavior (see the literature on deduplication, for instance). Likely some models are better than others, depending on your sensibilities. This paper aims to study the meaning of choices like this, without necessarily prescribing how best to make them.
% }

\section{Conclusion}

% The key property that we have learned from this 
%
%
% The difficulty of measuring learner's confidence is fundamentally the same difficulty as in dealing with independence.
% Learner's confidence is fundamentally different from (if often related to) probability.
Metaphorically: if certainty is black and white, then probability allows for shades of gray, and learner's confidence is about \emph{transparency}. 
% This brief paper has only scratched the surface of the concept.
\vnew{%
The idea is an old one, having been deployed many times before in various contexts;
  this paper unifies the approaches, providing axiomatic grounding for the concept writ large (\cref{ax:zero,ax:cont-and-smooth,ax:seq-for-more,ax:acyclic,ax:combinativity}).
  We have identified the critical aspects of confidence in a very general setting, and related it to probabilistic notions of confidence (e.g., via \cref{ax:lb-ascent} and \cref{prop:Boltz-Bayes}).
The resulting framework connects many seemingly different representations of confidence and learning,
for an overview of which we invite the reader to revisit \cref{fig:map}.
We contend that this framework clarifies common points of confusion in the literature (see \cref{ssec:full-learn}).
}
%
%
%

% There are many other examples and applications of this framework. 
There are many examples and applications of this framework. 
% Even a careful treatment of which learning procedures correspond to which loss functions is interesting, and beyond what we were able cover here. Some of this additional material is in the appendix, some needs writing to be done justice, and some is the subject of ongoing parallel work. 
An obvious continuation point---a deeper analysis of which learning functions correspond to which loss functions 
when $\Theta$ is a parametric family of distributions
% via axiom \cref{ax:lb-ascent}
\unskip---has already borne fruit that we were not able to cover here. 
% Other potential areas of application include reinforcement learning (where eligibility traces appear to be a form of confidence), and the design of pseudo-labels in self-supervised learning. 
% Our work (in \cref{sec:vecrep}) also develops the foundations of a programming language based on orderless combination \citep{mixture-langs}.
%
%

A key question remains open: how should we decide how much confidence to place in an observation? 
% That is a profound question that we do not (yet) know how to answer in general.
With enough modeling assumptions, there can be a clear answer---such as in \cref{ex:kalman1d}, where the optimal Kalman gain is related to the current uncertainty and the variance of the sensor. However, as illustrated by the discussion in \cref{ex:classifier}, one's willingness to be influenced by an observation may not be merely a matter of probabilistic modeling.
% A good answer to this question would necessarily take us far beyond the scope of the present paper.
This makes the question surprisingly profound; we suspect that the search for a good answer will take us far beyond the present scope.
% A good answer to this question will necessarily take us far beyond the scope of the present paper.
%
Having laid the formal and conceptual foundations, we are eager to report back on these projects in the future.
    

% \clearpage
% \section{Back Matter}
% There are some final, special sections that come at the back of the paper, in the following order:
% \begin{itemize}
%   \item Author Contributions (optional)
%   \item Acknowledgements (optional)
%   \item References
% \end{itemize}
% They all use an unnumbered \verb|\subsubsection|.

% For the first two, special environments are provided.
% (These sections are automatically removed for the anonymous submission version of your paper.)
% The third is the ‘References’ section.
% (See below.)

% (This ‘Back Matter’ section itself should not be included in your paper.)


\newpage
\begin{acknowledgements} % will be removed in pdf for initial submission,
						 % (without ‘accepted’ option in \documentclass)
                         % so you can already fill it to test with the
                         % ‘accepted’ class option
    % Briefly acknowledge people and organizations here.
    % \emph{All} acknowledgements go in this section.
    I would like to sincerely thank Joe Halpern, my PhD advisor, who contributed significantly to the introduction of this paper, reading dozens of earlier drafts. 
    The work was
    supported in part by AFOSR grant FA23862114029, MURI grant W911NF-19-1-0217, ARO grant
    W911NF-22-1-0061, and NSF grant FMitF-2319186.
\end{acknowledgements}

% References
\bibliography{conf}

\newpage

\onecolumn

\title{Learning with Confidence\\(Supplementary Material)}
\maketitle

\appendix
\input{supplement-uai.tex}

\end{document}
