\documentclass[accepted]{uai2025}
\usepackage[american]{babel}

%% Some suggested packages, as needed:
\usepackage{natbib} % has a nice set of citation styles and commands
    \bibliographystyle{plainnat}
    \renewcommand{\bibsection}{\subsubsection*{References}}
\usepackage{mathtools}                  % amsmath with fixes and additions
\usepackage{booktabs}                   % commands to create good-looking tables
\usepackage{tikz}                       % nice language for creating drawings and diagrams

% ------------------------------------------------------- %
\usepackage{amsthm,amssymb,amsfonts}    % math stuff
\usepackage{multirow}
\usepackage{bbm}
\usepackage{subcaption}
\usepackage{cleveref}                   % smart cross-referencing
\Crefname{equation}{Eq.}{Eqs.}
\usepackage{wrapfig}
\usepackage{comment}
% ------------------------------------------------------- %
\usepackage{listings}
\crefname{lstlisting}{listing}{listings}
\Crefname{lstlisting}{Listing}{Listings}

\usepackage{arydshln} %for dashed lines in tables
% Double-struck "1" (\mathbbm comes from the bbm package loaded above).
\newcommand*{\ind}{\mathbbm{1}}
% ------------------------------------------------------- %

% Calligraphic L with an upright "VI" / "ML" subscript.
\newcommand*{\VI}{\mathcal{L}_{\mathrm{VI}}}
\newcommand*{\ML}{\mathcal{L}_{\mathrm{ML}}}

% D with an upright "KL" subscript, upright "Var", and blackboard-bold E.
\newcommand*{\KL}{D_\mathrm{KL}}
\newcommand*{\Var}{\mathrm{Var}}
\newcommand*{\E}{\mathbb{E}}
% Text-mode shorthand: "PAC" followed by a math superscript m.
\newcommand*{\PACm}{PAC$^{m}$}

% Letter m with an overline (math mode).
\newcommand{\absdev}{\overline{m}}
% Upright "d"; usable in math mode only because it expands to \mathrm.
% NOTE(review): this replaces LaTeX's text-mode dot-below accent \d{..};
% confirm that no author name or bibliography entry relies on that accent.
\renewcommand{\d}{\mathrm{d}}
% "\pm <value>" annotation typeset in \tiny.
% \tiny is a font-size declaration, not a command that takes an argument, so
% it is confined by an explicit group here; without it the small size would
% stay active for everything following \std{..} in the enclosing group.
\newcommand{\std}[1]{{\tiny$\pm$#1}}

% Theorems, propositions and lemmas all step the single counter `countprop`,
% so they are numbered in one common sequence.
\newcounter{countprop}
\newtheorem{theorem}[countprop]{Theorem} %[section]
\newtheorem{proposition}[countprop]{Proposition} %[section]
\newtheorem{lemma}[countprop]{Lemma} %[section]

% `theoremApp` is numbered by its own counter `countApp`; note that it is
% headed "Proposition" despite the environment name.
\newcounter{countApp}
\newtheorem{theoremApp}[countApp]{Proposition} %[section]

% ------------------------------------------------------- %

\title{ELBO, regularized maximum likelihood,
and their common one-sample approximation for training 
stochastic neural networks}

\author[1]{Sina~Däubener}
\author[1]{Simon~Damm}
\author[1]{Asja~Fischer}

\affil[1]{%
    Department of Computer Science\\
    Ruhr University Bochum\\ Germany.
}
  
  \begin{document}
\maketitle

\begin{abstract}
    Monte Carlo approximations are central to the training of stochastic neural networks in general, and Bayesian neural networks (BNNs) in particular.
    We observe that the common one-sample approximation of the standard training objective can be viewed both as maximizing the Evidence Lower Bound (ELBO) \textit{and} as maximizing a regularized log-likelihood of a compound distribution. 
    This latter approach differs from the ELBO only in the order of the logarithm and expectation, and is theoretically grounded in PAC-Bayes theory.
    We argue theoretically and demonstrate empirically that training with the regularized maximum likelihood increases prediction variance, which enhances performance in misspecified settings, improves adversarial robustness, and strengthens out-of-distribution (OOD) detection.
    Our findings help reconcile previous contradictions in the literature by providing a detailed analysis of how training objectives and Monte Carlo sample sizes affect uncertainty quantification in stochastic neural networks.
\end{abstract}


% Main-body sections, read from the sections/ directory in the order listed.
\input{sections/1_introduction}
\input{sections/2_investigating_behaviour}
\input{sections/3_core_practical}
\input{sections/4_related_work}
\input{sections/5_discussion}

% \begin{contributions} % will be removed in pdf for initial submission 
% 					  % (without ‘accepted’ option in \documentclass)
%                       % so you can already fill it to test with the
%                       % ‘accepted’ class option
%     Briefly list author contributions. 
%     This is a nice way of making clear who did what and to give proper credit.
%     This section is optional.

%     H.~Q.~Bovik conceived the idea and wrote the paper.
%     Coauthor One created the code.
%     Coauthor Two created the figures.
% \end{contributions}

\begin{acknowledgements}

This work was funded by the Deutsche Forschungsgemeinschaft (DFG, German Research Foundation) under Germany’s Excellence Strategy – EXC 2092 CASA – 390781972 and under project 464104047, ‘On the Convergence of Variational Deep Learning to Sums of Entropies’, within the priority program ‘Theoretical Foundations of Deep Learning’ (SPP 2298).
Moreover, we acknowledge funding by the Ministry of Culture and Science of North Rhine-Westphalia as part of the Lamarr Fellow Network.

\end{acknowledgements}

% References
\bibliography{Literatur}

% Supplementary material: start a new page, switch to single-column layout,
% and typeset a second title block whose title ends in
% "(Supplementary Material)" before reading in the appendix.
\newpage

\onecolumn

\title{ELBO, regularized maximum likelihood,
and their common one-sample approximation for training stochastic neural networks \\ (Supplementary Material)}
\maketitle

\input{sections/Appendix}

\end{document}
