\documentclass[accepted]{uai2024}

\usepackage[american]{babel}

\usepackage{natbib} % has a nice set of citation styles and commands
    \bibliographystyle{plainnat}
    \renewcommand{\bibsection}{\subsubsection*{References}}

% Recommended, but optional, packages for figures and better typesetting:
\usepackage{microtype}
\usepackage{graphicx}
\usepackage{subfigure}
\usepackage{mathtools} % amsmath with fixes and additions
% \usepackage{siunitx} % for proper typesetting of numbers and units
\usepackage{booktabs} % commands to create good-looking tables
\usepackage{tikz} % nice language for creating drawings and diagrams


\usepackage{hyperref}


\usepackage{amsmath}
\usepackage{amssymb}
\usepackage{mathtools}
\usepackage{amsthm}
\usepackage{xspace}
\usepackage{bm}
\usepackage{bbm}
\usepackage{enumitem}

% if you use cleveref..
\usepackage[capitalize,noabbrev]{cleveref}

%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% THEOREMS
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% Theorem-like environments (amsthm).
% Every environment shares the `theorem' counter, which is reset per section,
% so all statements are numbered in one sequence (Theorem 1.1, Lemma 1.2, ...).
% These declarations come after cleveref is loaded so that cleveref can record
% a separate reference type for each environment.
\theoremstyle{plain}
\newtheorem{theorem}{Theorem}[section]
\newtheorem{proposition}[theorem]{Proposition}
\newtheorem{lemma}[theorem]{Lemma}
\newtheorem{corollary}[theorem]{Corollary}
\theoremstyle{definition}
\newtheorem{definition}[theorem]{Definition}
\newtheorem{assumption}[theorem]{Assumption}
\theoremstyle{remark}
\newtheorem{remark}[theorem]{Remark}
% cleveref has built-in names for theorem, proposition, lemma, corollary,
% definition and remark, but none for `assumption'; without the line below a
% \cref to an assumption prints ``??'' and raises an undefined-format warning.
\crefname{assumption}{Assumption}{Assumptions}

% \snote{<who>}{<text>}: inline review note printed as "**<who>: <text>**" in
% a blue/red colour mix, with <who> in bold and <text> in typewriter.
% The colour mix syntax needs xcolor, which this file does not load explicitly;
% it is expected to arrive through tikz / todonotes.
% \normalfont\bfseries replaces the obsolete LaTeX 2.09 switch \bf (it is the
% text-mode definition of \bf in the standard classes).
\newcommand\snote[2]{{\color{blue!30!red} **{\normalfont\bfseries #1:} \texttt{ #2}**}}
% ---- Basic notation shorthands (all parameterless) ----

% Greek letters and number sets.
\newcommand*{\eps}{\varepsilon}
\newcommand*{\R}{\mathbb{R}}
\newcommand*{\Z}{\mathbb{Z}}

% Expectation (\Ex and \E are two names for the same symbol), variance, covariance.
\newcommand*{\Ex}{\mathbb{E}}
\newcommand*{\E}{\mathbb{E}}
\newcommand*{\Var}{\operatorname{Var}}
\newcommand*{\Cov}{\operatorname{Cov}}

% Calligraphic / fraktur symbols. The extra braces around \done and \dzero
% keep them usable directly as sub- or superscripts.
\newcommand*{\td}{\tilde{\mathcal{D}}}
\newcommand*{\done}{{\mathcal{D}_1}}
\newcommand*{\dzero}{{\mathcal{D}_0}}
\newcommand*{\cH}{\mathcal{H}}
\newcommand*{\mT}{\mathfrak{T}}

% Overlined symbols.
\newcommand*{\oS}{{\overline{S}}}
\newcommand*{\oN}{{\overline{N}}}
\newcommand*{\oQ}{\overline{Q}}

% Auto-sized angle brackets.
\newcommand*{\Langle}{\left\langle}
\newcommand*{\Rangle}{\right\rangle}

% Sans-serif labels (set with the old-style \sf switch).
\newcommand*{\trc}{{\sf{trunc}}}
\newcommand*{\pos}{{\sf{pos}}}
\newcommand*{\opt}{{\sf{opt}}}
\newcommand*{\val}{{\sf{val}}}

% ---- One-argument font wrappers ----
% Each wrapper switches to math mode when necessary (\ensuremath) and ends
% with \xspace so that a following inter-word space survives in running text.
\newcommand{\mc}[1]{%  calligraphic
  \ensuremath{\mathcal{#1}}\xspace
}
\newcommand{\mb}[1]{%  bold upright
  \ensuremath{\mathbf{#1}}\xspace
}
\newcommand{\tn}[1]{%  normal text font
  \ensuremath{\textnormal{#1}}\xspace
}
\newcommand{\ol}[1]{%  overline
  \ensuremath{\overline{#1}}\xspace
}
\newcommand{\wh}[1]{%  wide hat
  \ensuremath{\widehat{#1}}\xspace
}

% Bold calligraphic math alphabet: the OMS-encoded cmsy font in bold series.
\DeclareMathAlphabet{\mathbfcal}{OMS}{cmsy}{b}{n}

\newcommand{\mbc}[1]{%  bold calligraphic, built on \mathbfcal
  \ensuremath{\mathbfcal{#1}}\xspace
}

% ---- Bold letter shorthands ----
% First group: built on \mb, so each one enters math mode by itself via
% \ensuremath. The outer braces hide the trailing \xspace of \mb, so no extra
% space is inserted after these.
\newcommand*{\bX}{{\mb{X}}}
\newcommand*{\bY}{{\mb{Y}}}
\newcommand*{\bc}{{\mb{c}}}
\newcommand*{\bZ}{{\mb{Z}}}
\newcommand*{\bA}{{\mb{A}}}
\newcommand*{\ba}{{\mb{a}}}
\newcommand*{\bB}{{\mb{B}}}
\newcommand*{\bb}{{\mb{b}}}
\newcommand*{\bW}{{\mb{W}}}
\newcommand*{\bU}{{\mb{U}}}
\newcommand*{\bV}{{\mb{V}}}

\newcommand*{\bg}{{\mb{g}}}
% Second group: plain \mathbf, hence for use inside math mode only.
\newcommand*{\bx}{{\mathbf{x}}}
\newcommand*{\by}{{\mathbf{y}}}
\newcommand*{\bL}{{\mathbf{L}}}
\newcommand*{\bT}{{\mathbf{T}}}
\newcommand*{\bs}{{\mathbf{s}}}
\newcommand*{\bz}{{\mathbf{z}}}
\newcommand*{\bu}{{\mathbf{u}}}
\newcommand*{\bv}{{\mathbf{v}}}
\newcommand*{\bw}{{\mathbf{w}}}
\newcommand*{\br}{{\mathbf{r}}}
\newcommand*{\bS}{{\mathbf{S}}}
\newcommand*{\bG}{{\mathbf{G}}}
\newcommand*{\bH}{{\mathbf{H}}}
\newcommand*{\bD}{{\mathbf{D}}}


% ---- Names of problems and methods ----
% Small-caps problem names.
% NOTE(review): \pmir and \slc end with \xspace but \iidpmir does not, so a
% space typed after \iidpmir is swallowed unless written as \iidpmir{} or
% \iidpmir\ -- confirm against the use sites before harmonising.
\newcommand*{\pmir}{{{\sc MIR}}\xspace}
\newcommand*{\iidpmir}{{{\sc iid-MIR}}}
\newcommand*{\slc}{{\sc Smooth-Label-Cover}\xspace}

% Sans-serif name of the weighted assignment method.
\newcommand*{\wtdAssign}{{\sf wtd-Assign}\xspace}


\usepackage[textsize=tiny]{todonotes}





% Paper metadata typeset by \maketitle.
\title{Generalization and Learnability in Multiple Instance Regression}


% Authors. The bracketed index pairs each author with the \affil entry that
% carries the same index.
\author[1]{Kushal~Chauhan}
\author[1]{Rishi~Saket}
\author[2]{Lorne~Applebaum}
\author[2]{Ashwinkumar~Badanidiyuru}
\author[2]{Chandan~Giri}
\author[1]{Aravindan~Raghuveer}
% Add affiliations after the authors
% The `%' right after each opening brace stops the line end from becoming a
% leading space token inside the affiliation text.
\affil[1]{%
Google Research, India \\ {\small \texttt{\{kushalchauhan,rishisaket,araghuveer\}@google.com}}
}
\affil[2]{%
Google, USA \\ {\small \texttt{\{lapplebaum,ashwinkumarbv,chandangiri\}@google.com}}
}
\begin{document}
\maketitle

\begin{abstract}
Multiple instance regression (MIR) was introduced by \cite{RP01} as an analogue of multiple instance learning (MIL) in which we are given bags of feature-vectors (instances) and for each bag there is a bag-label which matches the label of one (unknown) primary instance from that bag. The goal is to compute a hypothesis regressor consistent with the underlying instance-labels. A natural approach is to find the best primary instance assignment and regressor optimizing the mse loss on the bags,
though no formal generalization guarantees were previously known. Our work is the first to prove generalization error bounds for MIR when the bags are drawn i.i.d.\ at random. Essentially, with high probability any MIR regressor with low error on sampled bags also has low error on the underlying instance-label distribution.
We next study the complexity of linear regression on MIR bags, shown to be NP-hard in general by \cite{RP01}, who however left open the possibility of arbitrarily good approximations. %,   
Significantly strengthening previous work, we prove a strong inapproximability bound: even if there exists a zero bag-loss MIR linear regressor on a collection of $2$-sized bags with labels in $[-1,1]$, it is NP-hard to find an MIR linear regressor with bag-loss $< C$ for some absolute constant $C > 0$. %
Our work also proposes a model training method for MIR based on a novel weighted assignment loss, geared towards handling overlapping bags which have not received much attention previously.  We conduct empirical evaluations on synthetic and real-world datasets showing that our method outperforms the baseline MIR methods. 




\end{abstract}

% Main-body sections, each kept in its own .tex file and pulled in with \input
% in reading order. The blank line below only separates the two groups in the
% source.
\input{introduction}
\input{prelims}
\input{errbounds}

\input{method-1}
\input{experiments}

\section{Conclusion}
Our work proves the first generalization error bounds for the multiple instance regression (MIR) problem in which the label of a bag is given by that of an (unknown) primary instance in the bag. Specifically, we show that optimizing the mse loss on i.i.d.\ sampled bags yields a regressor which has low mse on the underlying instance distribution, with high probability over the sampled bags. We also prove the first inapproximability result for MIR: given an MIR instance with bounded labels which admits a linear regressor with primary instances which has zero mse bag-loss, it is NP-hard to find one which has bag-loss lower than some absolute constant. While our contributions develop a deeper theoretical understanding of the problem, from a practical standpoint we also propose a weighted assignment based model training method which naturally handles overlapping bags, unlike previous works. Our experiments on synthetic and real-world datasets demonstrate the improvements provided by our method.

Future work can include generalization guarantees for non-i.i.d.\ MIR bags, as well as investigation from the computational learning perspective of non-linear regressors on MIR data.

% Reference list, generated from the `references' bibliography database using
% the plainnat style selected in the preamble.
\bibliography{references}


%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% APPENDIX
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
% The appendix starts on a fresh page; \appendix switches the sectioning
% commands to appendix numbering.
\newpage
\appendix

% The appendix is set in a single column.
\onecolumn

% A second title block, marked ``(Appendix)'', is printed before the
% appendix content.
\title{Generalization and Learnability in Multiple Instance Regression\\(Appendix)}
\maketitle
% Appendix content lives in hardness_redn.tex.
\input{hardness_redn}


\end{document}


