\documentclass[accepted]{uai2023} % for initial submission
% \documentclass[accepted]{uai2023} % after acceptance, for a revised
                                    % version; also before submission to
                                    % see how the non-anonymous paper
                                    % would look like

%% There is a class option to choose the math font
% \documentclass[mathfont=ptmx]{uai2023} % ptmx math instead of Computer
% Modern (has noticable issues)
% \documentclass[mathfont=newtx]{uai2023} % newtx fonts (improves upon
 % ptmx; less tested, no support)
% NOTE: Only keep *one* line above as appropriate, as it will be replaced
%       automatically for papers to be published. Do not make any other
%       change above this note for an accepted version.

%% Choose your variant of English; be consistent
\usepackage{natbib} % has a nice set of citation styles and commands
    \bibliographystyle{plainnat}
    \renewcommand{\bibsection}{\subsubsection*{References}}
\usepackage{mathtools} % amsmath with fixes and additions
% \usepackage{siunitx} % for proper typesetting of numbers and units
\usepackage{booktabs} % commands to create good-looking tables
\usepackage{tikz} % nice language for creating drawings and diagrams
\usepackage{amsmath,amsfonts}
\usepackage{IEEEtrantools}
\usepackage{amsthm}
\usepackage{graphicx}
\usepackage{tikz}
\usetikzlibrary{positioning,chains,fit,shapes,calc}
\usetikzlibrary{arrows}
\usepackage{algorithm}
\usepackage{algorithmic}
% \usepackage{algpseudocode} %%% NOT COMPATIBLE WITH algorithmic package
\usepackage{xspace}
\usepackage{pgfplots}
\usepackage{pgfplotstable}
\usepackage{comment}
% for cross referencing the main text
% PLEASE ONLY USE xr IN THE SUPPLEMENTARY MATERIAL. 
% In the main paper, hard code any cross-reference to the supplementary material. 
\usepackage{xr} 
\externaldocument{uai2023-template}
\newtheorem{problem}{Problem}
\newtheorem{observation}{\textsc{Observation}}
\newtheorem{theorem}{\textsc{Theorem}}
\newtheorem{lemma}{\textsc{Lemma}}
\newtheorem{corollary}{\textsc{Corollary}}
\newtheorem{remark}{\textsc{Remark}}
\newtheorem{claim}{\textsc{Claim}}
\DeclareMathOperator*{\argmax}{arg\,max}
\DeclareMathOperator*{\argmin}{arg\,min}
\newcommand{\greedy}{\textsc{Greedy}\xspace}
\newcommand{\mcge}{{\em Maximum Constrained Gain Element }}
\newcommand{\mcg} {{\em Maximum Constrained Gain }}
\newcommand{\MCGE}{{\rm MCGE}}
\newcommand{\MCG}{{\rm MCG}}
\newcommand{\OPT}{{\rm OPT}}
\newcommand{\NP}{{\rm NP}}
\newcommand{\OptimalS}{{\rm OptimalSeq}}
\newcommand{\SCSKC}{{\sc SCSK-C}\xspace}
\newcommand{\DiffC}{{\sc Diff-C}\xspace}
\newcommand{\SCSK}{{\sc SCSK}\xspace}
\newcommand{\Diff}{{\sc Diff}\xspace}
\newcommand{\lineara}{{\sc Linear-Approx}\xspace}
\newcommand{\loga}{{\sc Log-Approx}\xspace}
%% Provided macros
% \smaller: Because the class footnote size is essentially LaTeX's \small,
%           redefining \footnotesize, we provide the original \footnotesize
%           using this macro.
%           (Use only sparingly, e.g., in drawings, as it is quite small.)

%% Self-defined macros
\newcommand{\swap}[3][-]{#3#1#2} % just an example

\title{Maximizing Submodular Functions under Submodular Constraints\\(Supplementary Material)}

% The standard author block has changed for UAI 2023 to provide
% more space for long author lists and allow for complex affiliations
%
% All author information is authomatically removed by the class for the
% anonymous submission version of your paper, so you can already add your
% information below.
%
% Add authors
\author[1]{Madhavan R. Padmanabhan}
\author[1]{Yanhui Zhu}
\author[1]{Samik Basu}
\author[1]{A. Pavan}
% Add affiliations after the authors
\affil[1]{%
    Department of Computer Science\\
    
    Iowa State University\\
    
    Ames, Iowa, USA
}

 
  \begin{document}
  
\onecolumn %% Turn this off if single column is desired for the supplement
\maketitle


\appendix

\section{Missing Proofs}

\setcounter{theorem}{0}
\setcounter{observation}{0}
\begin{observation}
Given a submodular function $g$ and $\theta$, it is NP-Hard to calculate $K_g$ where $K_g = max\{|X|: g(X)\leq \theta \text{ and } |X|\leq k\}$.
\label{thm:upperrankhardness}
\end{observation}
\begin{proof}
Let $K'_g = max\{|X|: g(X)\leq \theta\}$. We will first show that computing $K'_g$ is NP-Hard. Consider the knapsack problem: We have $n$ elements  $S = \{1, 2, .. n\}$ with values $\{v_1, v_2, .., v_n \}$ and weights $\{w_1, w_2, .. , w_n\}$. Given a capacity $W$, and a target $\gamma$, is there a set $S'\subseteq S$ such that $\sum_{i\in S'} v_i\geq \gamma$ and $\sum_{i\in S'}w_i\leq W$.


For each element $i$, construct a complete bipartite graph $G_i = (L_i, R_i, E_i)$ where $L_i = \{x_{i_1}, x_{i_2}, .. , x_{iv_i}\}$ and $R_i = \{ y_{i_1}, y_{i_2}, .. ., y_{iw_i}\}$. $L_i$ and $R_i$ represent the values and weights of element $i$ respectively. Let $L = \cup L_i$, $R = \cup R_i$ and $E = \cup E_i$. Let $G = (L, R, E)$. We define the neighborhood function $g(X)$ for all $X\subseteq L$ as the number of neighbors of $X$. $g(X)$ is known to be a submodular function. Assume that we can compute $K'_g =  max\{|X|: g(X)\leq W\}$. Initially, let $X=\phi$. For a graph $G_i$, if we add a single node from $L_i$ to $X$, we can add every node in $L_i$ such that $g(X)$ increases by $w_i$. This is equivalent to selecting an element $i$, where the number of elements added increases the value by $v_i$ and has a weight $w_i$. If $K'_g\geq \gamma$ then there exists $S'\subseteq S$ such that $\sum_{i\in S'} v_i\geq \gamma$ and $\sum_{i\in S'}w_i\leq W$. Next, we show that if $S'$ exists then $K'_g \geq \gamma$. Let $S' = \{z_1, z_2., ..., z_l\}$. Based on our reduction we can construct $X = \{L_{z_1} \cup L_{z_2}..\cup L_{z_l}\}$. Clearly $g(X) = \sum_{i\in S'} w_i \leq W$ and $|X| = \sum_{i\in S'} v_i \geq \gamma$. Thus, $K'_g\geq \gamma$.  Since computing $K'_g$ is NP-Hard, computing $K_g$ is NP-Hard.

\end{proof}
\setcounter{claim}{0}
\begin{claim}
%For $1 \leq i \leq k$. 
\begin{eqnarray*}
OPT_{k,\theta} - f(X_k ) & \leq & \left(\frac{O-1}{O}\right)^{k - 1} \left(OPT_{k,\theta}-f(X_1)\right) \\
 & &+ \sum_{i=1}^{k-1} MCDG_i
\end{eqnarray*}
\end{claim}
\begin{proof}
\begin{eqnarray*}
OPT_{k,\theta} - f(X_k) & \leq & \frac{O-1}{O}
\left(OPT_{k,\theta}-f(X_{k-1})\right)\\
 & &  + MCGD_{k-1} \\
& \leq& \frac{O-1}{O}\left( \frac{O-1}{O} \left[OPT_{k, \theta} - f(X_{k-2})\right]\right.\\
& &  \left.+ MCGD_{k-2}\right) + MCGD_{k-1}\\
 & = & \left(\frac{O-1}{O}\right)^2\left(OPT_{k,\theta}-f(X_{k-2})\right)\\
 & &+ \frac{O-1}{O} MCGD_{k-2} + MCGD_{k-1}\\
& \leq &  \left(\frac{O-1}{O}\right)^{k - 1} \left(OPT_{k,\theta}-f(X_1)\right)+ \sum_{i=1}^{k-1}  MCDG_{i}\\
\end{eqnarray*}


\end{proof}

\setcounter{theorem}{1}

\begin{theorem}
There does not exist a polynomial time algorithm $\mathcal{A}$ for SCSK and SCSK-C such that it outputs a set $X$ with guarantee $f(X)\geq d\cdot OPT - A$ where $d<1, A>0$ are universal constants. 
\label{thm:datadependentA}
\end{theorem}

\begin{proof}
In ~\cite{Iyer:NIPS13}, it is shown that there exists no polynomial time algorithm for SCSK that achieves a constant factor approximation. We will use this to show that there also does not exist a $(d,A)$-multiplicative additive approximation algorithm with constants $d<1, A>0$ for SCSK. 

Assume that there exists an algorithm $\mathcal{A}$ such that it outputs a set $f(X) \geq d\cdot OPT - A$. 


Let $f'(X) = A\cdot f(X)$. Consider the same problem with $f'$. The optimum solution is $OPT' = A \cdot OPT$. 
The guarantee is still $f'(X)\geq d\cdot OPT' - A$.  Thus
$A\cdot f(X) \geq  d\cdot A\cdot OPT - A$ and this implies that $f(X) \geq  d\cdot OPT - 1$ 

Thus, algorithm $\mathcal{A}$ has the guarantee with $A=1$. We can repeat the argument by defining $f'(X) = q\cdot f(X)$ leading to guarantee $f(X) \geq d\cdot OPT - \frac{1}{q}$. $\mathcal{A}$ has $(d,A)$-multiplicative additive guarantee for an arbitrarily small $A$. 

Consider an instance $\mathcal{X}$ of SCSK. Let $\mathcal{I}$ be the family of feasible sets for this instance. Let $\mathcal{I'} = \{X \texttt{ s.t }  f(X)< d\cdot OPT\}$. Let $R\in \mathcal{I'}$ such that $\forall X\in \mathcal{I'}, f(R)\geq f(X)$. Let $\epsilon = d\cdot OPT - f(R)$. $\mathcal{A}$ has $(d,\epsilon')$-multiplicative additive guarantee where $\epsilon'<\epsilon$. In such an instance, the following inequalities hold.
\begin{IEEEeqnarray*}{l}
f(\mathcal{A(\mathcal{X})}) \geq  d\cdot OPT - \epsilon' >  d\cdot OPT - \epsilon = f(R) 
\end{IEEEeqnarray*}
If $f(\mathcal{A(\mathcal{X})})>f(R)$ then it must be the case that $A(\mathcal{X}) \in \mathcal{I}\setminus \mathcal{I'}$. By definition of $\mathcal{I'}$, $f(A(\mathcal{X})) \geq d\cdot OPT$. If $\mathcal{I'}=\phi$, we consider the feasible element $e^*$ that has the maximum value on $f$ among all feasible elements. In such cases, if we output $max\{f(e^*), f(A(\mathcal{X}))\}$, we obtain a $d-$approximate algorithm for SCSK. This is a contradiction as such an algorithm does not exist for SCSK ~\cite{Iyer:NIPS13} which invalidates our assumption. We can extend the argument for SCSK-C by varying the cardinality from $1..n$ to arrive at a similar contradiction. 
\end{proof}


\setcounter{theorem}{2}
\begin{theorem}\label{thm:cur}
Let $X$ be the solution produced by Algorithm~1, then 
\[f(X) \geq \frac{1}{c_f}\left (1 - (1-\frac{c_f}{k})^{k}\right )OPT_{k, \theta} - A,\]
%and when $\ell=k$, then
%$f(X) \geq \frac{1}{c_f}\left (1 - e^{-c_f}\right ) OPT_{k, \theta} - A,$
where $A$ is the additive error  same as in Theorem~1.
\end{theorem}


\begin{proof}
We combine the ideas from the proof of Theorem~3 with that of Lemma 5.2 in ~\cite{ConfortiC84}. At iteration $t-1$ of the Greedy Algorithm, we extend an ordered set $X_{t-1} = \{j_1, j_2, .. j_{t-1}\}$ by adding element $j_t$ to obtain $X_{t} = \{j_1, j_2, .. j_{t}\}$. Define $\rho_i = f(j_i| \{j_1, j_2... j_{i-1}\})$. Let $X^*_{k,\theta}$ be an optimal solution. $l\leq k$ be the number of iterations of the Greedy Algorithm. From Lemma 2.1 in ~\cite{ConfortiC84}, it follows that for $t=1..l$:
\begin{IEEEeqnarray*}{lCr}
OPT_{k, \theta} &\leq& c_f \sum_{j_i\in X_t \setminus X^*_{k,\theta}} \rho_i + \sum_{j_i\in X_t \cap X^*_{k,\theta}} \rho_i + \sum_{j_i \in X^*_{k,\theta}\setminus X_t} \rho_i
\end{IEEEeqnarray*}
Recall that for $i=0..l-1$: 
\begin{IEEEeqnarray*}{lCr}
f(X_{i+1}) & = & f(X_i) + \MCG(X_i, \theta) \\
f(X'_{i+1}) & = & f(X_i) + \MCG(X_i, 2\theta)
\end{IEEEeqnarray*}

This leads to the following observation:
\begin{IEEEeqnarray*}{lCr}
f(X'_{i+1}) - f(X_i) \\ 
= \rho_{i+1} + \MCG(X_i, 2\theta) - \MCG(X_i, \theta)
\end{IEEEeqnarray*}
We define $\gamma_{i+1} = \MCG(X_i, 2\theta) - \MCG(X_i, \theta)$. Let $s=|X^*_{k,\theta}\setminus X_i|$. Thus, we have:
\[
\begin{array}{rcl}
OPT_{k, \theta} & \leq & c_f \sum_{j_i\in X_t \setminus X^*_{k,\theta}} \rho_i + \sum_{j_i\in X_t \cap X^*_{k,\theta}} \rho_i\\
& & + \sum_{j_i \in X^*_{k,\theta}\setminus X_t} f(X'_{t+1}|X_t) \\
& \leq  & c_f \sum_{j_i\in X_t \setminus X^*_{k,\theta}} \rho_i\\
& & + \sum_{j_i\in X_t \cap X^*_{k,\theta}} \rho_i + (O-s) \cdot f(X'_{t+1}|X_t) \\
&= &  c_f \sum_{j_i\in X_t \setminus X^*_{k,\theta}} \rho_i  \\
& & + \sum_{j_i\in X_t \cap X^*_{k,\theta}} \rho_i + (O-s) \cdot \left[\rho_{t+1} + \gamma_{t+1} \right]
\end{array}
\]
Fix $O$, $l$ and curvature $c_f$. Consider all problems $\mathcal{F}_{O, l, c_f}$ that has curvature $c_f$, optimal solution size $O$ and the greedy set size $l$. Denote $\mathcal{F}(i_1, i_2, ... i_s)\subseteq \mathcal{F}_{O, l, c_f}$ as the set of problems meeting the following two conditions

\begin{enumerate}
    \item The greedy algorithm selects the set $X = \{j_1, j_2, ... j_l\}$ where $l\leq O$.  
    \item $X\cap X^*_{k,\theta} = \{j_{i_1}, j_{i_2}, ... j_{i_s}\}$ for $0\leq s \leq l$. The greedy algorithm selects $s$ elements from the optimal solution within the first $l$ iterations. 
\end{enumerate}

The greedy algorithm produces $X$ such that $f(X)\geq \sum_{i=1}^{l}\rho_i\geq \sum_{i=1}^{l} \rho_i + \gamma_i$. Define $q_i = \rho_i+\gamma_i$ for $0\leq i\leq l$. 

Consider the ratio : $\frac{1}{O} \cdot\left(f(X) + \sum_{i=1}^{l} \gamma_i \right)$. We see that $\frac{1}{O} \cdot\left(f(X) + \sum_{i=1}^{l} \gamma_i \right)\geq R(\{i_1, i_2..., i_s\})$ where $R(\{i_1, i_2..., i_s\})$ is defined as:

$R(\{i_1, i_2..., i_s\})  = \min \sum_{i=1}^{l}q_i$ subject to
\[
\forall i, q_i \geq 0, \ OPT_{k, \theta} \leq c_f \sum_{j_i\in X_t \setminus X^*_{k,\theta}} q_i + \sum_{j_i\in X_t \cap X^*_{k,\theta}} q_i + (O-s) \cdot q_i \\
\]


From ~\cite{ConfortiC84}, it follows that $R(\{i_1, i_2..., i_s\}) \geq R(\phi) \geq \frac{1}{c_f}\left[1 - (1- \frac{c_f}{O})^l \right]$. Thus, we have:
\begin{IEEEeqnarray*}{lCr}
f(X) + \sum_{i=1}^{l} \gamma_i \geq \frac{1}{c_f}\left[1 - \left(1- \frac{c_f}{O}\right)^l \right] \cdot OPT_{k, \theta}
\end{IEEEeqnarray*}
Since $O \leq k$
\begin{IEEEeqnarray*}{lCr}
f(X)  \geq \frac{1}{c_f}\left[1 - \left(1- \frac{c_f}{k}\right)^l \right] \cdot OPT_{k, \theta} - \sum_{i=1}^{l} \gamma_i 
\end{IEEEeqnarray*}

The term $\sum_{i=1}^{l} \gamma_i $ is the additive error, which equals
\[\sum_{i=0}^{\ell-1} MCG(X_i, 2\theta) - \sum_{i=0}^{\ell-1}MCG(X_i, \theta)\]
Since $\sum_{i=0}^{\ell-1}MCG(X_i, \theta)$ equals $f(X)$, the additive error term is same as the one from Theorem~3. Finally, observe that when when $\ell = k$, the term $(1 - \frac{c_f}{k})^k$ tends to $e^{-c_f}$.
\end{proof}


\label{eqn:recur}



\setcounter{theorem}{4}
\begin{theorem}
Let $f$ and $g$ be two submodular functions and where $f$ is monotone, let $h = f-g$. Consider Algorithm $\mathcal{B}$.
If the subroutine $\mathcal{A}$ can solve \SCSKC exactly, then Algorithm $\mathcal{B}$ produces a set $S$ such that
$h(S) \geq h(OPT) - 1$.  Algorithm{B} makes by making $O(\lambda)$ calls to  $\mathcal{A}$, where $\lambda = k\cdot max_{e\in V} g(e)$.
\end{theorem}

\begin{proof}
Let us first assume that the range of $g$ is non-negative integers and let $OPT$ be the optimal solution for $h$.
We claim that this algorithm produces an optimal solution for \DiffC.  Let $\gamma' = g(S^*)$. Since the range of $g$ are non negative integers, Algorithm $\mathcal{B}$ will have queried $\mathcal{A}$ with paramaters $f,g,k,\gamma'$. Let the set produced at that iteration be $P^*$. Assume that $P^*$ is not an optimal solution to \DiffC i.e.  such that $f(OPT) - g(OPT) > f(P^*) - g(P^*)$. We know that $f(P^*) \geq f(OPT)$, since Algorithm $\mathcal{A}$ produces an optimal solution. In addition, $g(P^*) \leq \gamma' = g(S^*)$ leading to $-g(P^*) \geq -g(S^*)$. Therefore, $f(P^*) - g(P^*) \geq f(S^*) - g(S^*)$ which contradicts our assumption.  Now suppose that the range of $g$ is not an integer and let $g(OPT) = \gamma''$ and let $\gamma' = \lceil \gamma''\rceil$. Let $P^*$ be the set output by $A(f, g, k, \gamma'$. Note that $f(P^*) \geq f(OPT)$ and thus $h(P^*) \geq f(P^*) - \gamma' \geq f(OPT) - \gamma'' -1 = h(OPT) -1$.
\end{proof}



\section{Extensive Experimental Results}
\label{sec:expt}

% \input{experimentsCommand.tex}
% ---------------------------------------------------------------------
% SCSK-C figure settings
% ---------------------------------------------------------------------
\newcommand{\thetaVObjective}[2]{
\begin{tikzpicture}
    \begin{axis}[xlabel=\textbf{$\theta$}, ylabel=\textbf{\Large $f(X)$}, title=\textbf{#2}, legend columns=2, legend style={at={(0.5,-0.1)},anchor=north,draw=none}, transpose legend]
        \pgfplotstableread[col sep=comma]{datasets/#1}
        \datatable
        
        \addplot table[y = Greedy] from \datatable ;
        % \addplot table[y = dynamic] from \datatable ;
        \addplot table[y = Random] from \datatable;
        \addplot table[y = Equal] from \datatable;
        % \addplot table[y = 0.63OPTUpperBound] from \datatable;
        % \addplot table[y = maxsingle] from \datatable;
        % \addplot table[y = randomizedgreedy] from \datatable;
        % \addlegendentry{\Large Greedy}
        % \addlegendentry{\Large Dynamic Programming}
        % \addlegendentry{$0.63 OPT Bound$}
        % \addlegendentry{\Large MaxSingle}
        % \addlegendentry{\Large Random Part.}
        % \addlegendentry{\Large Equal Part.}
        % \addlegendentry{\Large Rand Greedy}
        
    \end{axis}
\end{tikzpicture}}

\newcommand{\thetaVError}[2]{
\begin{tikzpicture}
    \begin{axis}[xlabel=\textbf{$\theta$}, ylabel=\textbf{\Large Additive Error}, title=\textbf{#2}, legend columns=-1, legend style={at={(0.5,-0.1)},anchor=north,draw=none}]
        \pgfplotstableread[col sep=comma]{datasets/#1}
        \datatable
        
        \addplot table[y = Greedy] from \datatable ;
        % \addplot table[y = dpError] from \datatable ;
        \addplot table[y = Random] from \datatable ;
        \addplot table[y = Equal] from \datatable ;
        % \addlegendentry{\Large Greedy}
        % \addlegendentry{\Large Dynamic Programming}
        % \addlegendentry{\Large Random Part.}
        % \addlegendentry{\Large Equal Part.}
        
    \end{axis}
\end{tikzpicture}}

\newcommand{\thetaVTime}[2]{
\begin{tikzpicture}
    \begin{axis}[xlabel=\textbf{$\theta$}, ylabel=\textbf{\Large Runtime(s)}, title=\textbf{#2}, legend columns=-1, legend style={at={(0.5,-0.1)},anchor=north,draw=none}]
        \pgfplotstableread[col sep=comma]{datasets/#1}
        \datatable
        
        \addplot table[y = Greedy] from \datatable ;
        % \addplot table[y = dpError] from \datatable ;
        \addplot table[y = Random] from \datatable ;
        \addplot table[y = Equal] from \datatable ;
        % \addlegendentry{\Large Greedy}
        % \addlegendentry{\Large Dynamic Programming}
        % \addlegendentry{\Large Random Part.}
        % \addlegendentry{\Large Equal Part.}
        
    \end{axis}
\end{tikzpicture}}

% ---------------------------------------------------------------------
% DIFF-C figure settings
% ---------------------------------------------------------------------

\newcommand{\diffValuesSubmodularCost}[2]{
\begin{tikzpicture}
    \begin{axis}[xlabel=\textbf{$k$}, ylabel=\textbf{\Large $f(X) - g(X)$}, title=\textbf{#2}, legend columns=3, legend style={at={(0.5,-0.1)},anchor=north,draw=none}, transpose legend]
        \pgfplotstableread[col sep=comma]{datasets/#1}
        \datatable
        
        \addplot table[y = Exponential] from \datatable ;
        \addplot table[y = Linear] from \datatable ;
        \addplot table[y = supSub] from \datatable;
        % \addlegendentry{Algorithm $\mathcal{B}$ - Exponential Search}
        % \addlegendentry{Algorithm $\mathcal{B}$ - Linear Search}
        % \addlegendentry{SupSub}
        
    \end{axis}
\end{tikzpicture}}

\newcommand{\diffTimeSubmodularCost}[2]{
\begin{tikzpicture}
    \begin{axis}[xlabel=\textbf{$k$}, ylabel=\textbf{\Large $\log(runtime)$}, title=\textbf{#2}, legend columns=3, legend style={at={(0.5,-0.1)},anchor=north,draw=none}, transpose legend]
        \pgfplotstableread[col sep=comma]{datasets/#1}
        \datatable
        
        \addplot table[y = Exponential] from \datatable ;
        \addplot table[y = Linear] from \datatable ;
        \addplot table[y = supSub] from \datatable;
        % \addlegendentry{Algorithm $\mathcal{B}$ - Exponential Search}
        % \addlegendentry{Algorithm $\mathcal{B}$ - Linear Search}
        % \addlegendentry{SupSub}
        
    \end{axis}
\end{tikzpicture}}

\newcommand{\diffErrorsSubmodularCost}[2]{
\begin{tikzpicture}
    \begin{axis}[xlabel=\textbf{$k$}, ylabel=\textbf{\Large Additive Error}, title=\textbf{#2}, legend columns=2, legend style={at={(0.5,-0.1)},anchor=north,draw=none}, transpose legend]
        \pgfplotstableread[col sep=comma]{datasets/#1}
        \datatable
        \addplot table[y = Exponential] from \datatable ;
        \addplot table[y = Linear] from \datatable ;
        % \addlegendentry{Algorithm $\mathcal{B}$ - Exponential Search}
        % \addlegendentry{Algorithm $\mathcal{B}$ - Linear Search}
    \end{axis}
\end{tikzpicture}}
In this section, we present the full experimental results. We empirically examine the performance of \SCSKC and \DiffC on the application of Information Diffusion in social networks. 
%We design the computation method for the submodular cost of a seed set. Subsequently, we compare our proposed algorithms with respect to objective function value, additive error and runtime on six social networks. 
% All the algorithms are implemented in C++ and run on a Linux server with AMD Opteron 6320 CPU (8 cores and 2.8 GHz) and 64GB RAM. 

\textbf{Information Diffusion.\ }
The diffusion of information in a social
network under various probabilistic diffusion models is captured as a
submodular function~\cite{Kempe:kdd03}. %The problem input is a graph $G=(V,E)$ and a probability function $p(u,v), \forall (u,v)\in E$. The graph represents the users in the social network along with their connections (edges). The probability function represents the probability with which a user $u$ succeeds in influencing user $v$.
For a (seed) set $X \subseteq V$,  the submodulaer function $f(X)$ is the expected number of users influenced by $X$. 
%if information originates from $X$, the expected number of users in the network who receives (or potentially gets influenced by) the information is captured by the submodular function $f(X)$. The goal is to identify a set $X$ that maximizes $f(X)$. 
On the other hand, there is often some cost function $g$ associated with each seed set. Often cost functions are submodular in nature. The goal is to find a seed set of size $\leq k$ maximize $f$ while minimizing $g$. Clearly, this problem can be formulated either as \SCSKC or as \DiffC.


For our experiments, we  design the submodular function $g$ based on the reachability. For all nodes $u \in V$ in the network, we use $R_z(u)$ to denote the set of nodes reachable from $u$ using $\leq z$ steps/edges. For any $S\subseteq V$, we have $R_z(S) = \cup_{v\in S} R_z(v)$.  We define the function $g(X) = \alpha \cdot |R_z(S)|$ where $\alpha = \frac{c \cdot m}{n}$. The values $c, z$ are tunable parameters that can be adjusted to suit the cost function. In our experiments, we use $z=2, c = 0.02$. 

% Following the works of ~\cite{Crawford:ICML19}, we define a modular cost function. For each node $v$, we randomly generate a modular cost $c_v$ drawn from $\mathcal{N} (20, 10)$ such that $0\leq c_v \leq 2\cdot \mu$. The cost function $g(S) = \sum_{v\in S} c_v$. 

\textbf{Datasets.\ } For the application of information diffusion, we collect six directed networks to conduct experiments: NetHept \cite{NetGraph}, p2p-Gnutella31 \cite{ripeanu2002mapping}, Facebook \cite{leskovec2012learning}, Bitcoin \cite{kumar2016edge}, Wikipedia \cite{leskovec2010predicting} and DBLP \cite{yang2012defining}. The number of nodes of them ranges from 3,783 to 317,080.





\subsection{Experiments for \SCSKC}
\label{sec:exp:scsk}

The main objective we seek in these experiments is to demonstrate that the approximation factors can be computed efficiently, which helps to gain an understanding of the quality of the solution.  For the Natural greedy algorithm(Algorithm~2, we compute the additive error produced and also study how the additive error changes as the submodular budget $\theta$ increases.
% , and to experimentally establish that the dynamic programming algorithm produces better solutions.
%We use this to assess the quality of  assess the quality of the solutions produced by the greedy algorithm and the dynamic programming based algorithm. For the greedy algorithm, we compute the additive error produced and study how the additive error changes as the submodular budget $\theta$ increases. As claimed, the dynamic programming based algorithm seeks to minimize the additive error;  we empirically evaluate this by comparing the solutions produced by the greedy algorithm and the dynamic programming algorithm. 

%Recall that for the problem of maximizing any non-negative, non-decreasing submodular function under a cardinality constraint,  a greedy algorithm can produce a solution $X$ such that $f(X) \geq (1-1/e)\OPT$, which is approximately $0.63\OPT$.  Thus, there is no additive error when no submodular constraint is imposed.  As shown by our analysis, we suffer an additive error in the presence of the submodular constraint. 
%If the additive error were zero, then we would have produced a solution that is at least $0.63OPT$. 
%Thus, a way to empirically evaluate the performance of the greedy algorithm is to compare the solutions produced by taking $0.63\OPT$ as benchmark.
%Though we cannot hope to compute $0.63\OPT$  exactly,  we can upper bound this quantity using Theorem~\ref{thm:baseline}, and Theorem ~\ref{thm:ktheta}.

 %Recall that Theorem~\ref{thm:refined} states that the greedy algorithm has a $(1-1/e, D)$--multiplicative-additive approximation guarantee. We can compute the value of $D$ as we run the greedy algorithm. This leads to the following observation: $(1-1/e)OPT \leq f(X)+ D$. Note that this is dependent on the algorithm producing a solution of size $k$. However, this is not necessarily the case for all instances. We address this by applying Theorem ~\ref{thm:baseline} in conjunction with Theorem ~\ref{thm:ktheta}. Let $X$ be the output of the Basic greedy algorithm,  where $|X|=\ell\leq O\leq k$. 
 
% By Theorem~\ref{thm:baseline}, we have that 
%  $f(X) \geq (1- (1- 1/k)^\ell) \OPT - A$
%  where $A$ is the additive error. 
%  Let $UB_1 = ((1 - (1-1/k)^\ell)^{-1}(f(X) + A))(1-1/e)$. 
%  Now, we have that $(1-1/e)\OPT \leq UB_1$ and $UB_1$ can be efficiently computed. We next use the bi-criteria 
%  algorithm and Theorem~\ref{thm:bicrit} to obtain another upper bound. Let $Y$ be the output of the algorithm. If we denote $f(Y)$ with $UB_2$,  we have $(1-1/e)\OPT \leq UB_2$. Combining the two upper bounds, we obtained that $(1-1/e)\OPT \leq \min\{UB_1, UB_2\}$.  We call $\min\{UB_1, UB_2\}$ as {\em 0.63\OPT Bound}.
 
 
%By Theorem~\ref{thm:baseline}, we have that 
% $f(X) \geq (1- (1- 1/k)^\ell) \OPT - A$
% where $A$ is the additive error. 
 %Now, we have that $(1-1/e)\OPT \leq UB$ and $UB$ can be efficiently computed. We have $(1-1/e)\OPT \leq UB$, and we call $UB$ as { $0.63\OPT Bound$}.
 
 %We define $UB_1= \frac{(1 - (1-1/k)^l)^{-1}}{(1-1/e)}(f(X) + D) \geq (1-1/e)OPT$. For the same problem instance, we can run Algorithm ~\ref{algo:modgreedy} with the submodular constraint as $k\theta$. Define $UB_2$ as the output of Algorithm ~\ref{algo:modgreedy}. Thus, $(1-1/e)OPT\leq min\{UB_1, UB_2\}$. 

 


\textbf{Comparison Algorithms.\ } We compare the solutions produced by the Greedy algorithm (Algorithm~2) with two variants. Note that during each iteration of this algorithm, the entire submodular budget $\theta$ is made available. We obtain a {\em budget-conscious} variant of this algorithm that allows iteration $i$ to spend at most $\theta_i < \theta$ budget. 
Algorithm 4 describes this strategy. By following an analysis that is very similar to that of Theorem~1, we can show that this algorithm produces a set $X$ for such that $f(X)$ is at least $(1-1/e)f(OPT)-A$, and $A$ can be computed efficiently.
We use the following budget-conscious algorithms.
%\begin{itemize}
     \textbf{Equal Partition:} Use $\theta/k, 2\theta/k, \cdots \theta$ as input to the budget-conscious  Greedy algorithm. 
   \textbf{Random Partition:} Select a random sequence of thresholds to use in the budget-conscious Greedy Algorithms. 
   %We run Random Partition for five times and report the average objective function values, additive errors, and running time.
%\end{itemize}

% We also compare the above algorithms with two baseline algorithms: \textbf{Maximum Single Element} where we select an element with the largest value on $f$, and \textbf{Random Greedy}  where at each iteration, select a random element that satisfies the submodular constraint.

% \paragraph{Information Diffusion}

 % argument #1: any options
    \newenvironment{customlegend}[1][]{%
        \begingroup
        % inits/clears the lists (which might be populated from previous
        % axes):
        \csname pgfplots@init@cleared@structures\endcsname
        \pgfplotsset{#1}%
    }{%
        % draws the legend:
        \csname pgfplots@createlegend\endcsname
        \endgroup
    }%

    % makes \addlegendimage available (typically only available within an
    % axis environment):

    \def\addlegendimage{\csname pgfplots@addlegendimage\endcsname}
\pgfplotsset{
cycle list={%
% {draw=green,mark=star,solid}, % 
{draw=blue, mark=square,solid},%densely dashed}, % 
% {draw=black,mark=+,solid},%dashdotted}, %every mark/.append style={rotate=90}, % Random Partition
{draw=red,mark=o,solid}, % 
% {draw=red,mark=square,solid}, % 0.63OPT Upper Bound
{draw=green,mark=+,solid}, % 
% {draw=pink,mark=square,solid} % Random Greedy
}}

\begin{figure}[h]
\begin{tikzpicture}
        \begin{customlegend}[legend columns=3,legend style={align=center,draw=none,column sep=2ex},legend entries={Basic Greedy, Random Partition, Equal Partition}]
        % \addlegendimage{draw=green,mark=star,solid}
        \addlegendimage{draw=blue, mark=square,solid}
        % \addlegendimage{draw=black,mark=+,solid}
        \addlegendimage{draw=red,mark=o,solid}
        % \addlegendimage{draw=red,mark=square,solid}
        \addlegendimage{draw=green,mark=+,solid}
        % \addlegendimage{draw=pink,mark=square,solid}
        \end{customlegend}
     \end{tikzpicture}
\end{figure}

\begin{figure}[h]
\begin{tabular}{c c}
\resizebox {0.45\linewidth} {!} {
\thetaVObjective{SCSK-C/objective/nethept-obj-scsk-c.csv}{}
}
&
\resizebox {0.45\linewidth} {!} {
\thetaVError{SCSK-C/error/nethept-error-scsk-c.csv}{}
}
\end{tabular}
\caption{\SCSKC, NetHept; $k=50$, a) $\theta$ vs. $f(X)$; b) $\theta$ vs. Additive Error with submodular cost on Basic Greedy, Random Partition and Equal Partition}
\label{fig:nethept-scsk}
\end{figure}



\begin{figure}[h]
\begin{tabular}{c c}
\resizebox {0.45\linewidth} {!} {
\thetaVObjective{SCSK-C/objective/p2p-obj-scsk-c.csv}{}
}
&
\resizebox {0.45\linewidth} {!} {
\thetaVError{SCSK-C/error/p2p-error-scsk-c.csv}{}
}
\end{tabular}
\caption{\SCSKC, p2p-Gnutella31, $k=50$, a) $\theta$ vs. $f(X)$; b) $\theta$ vs. Additive Error with submodular cost on Basic Greedy, Random Partition and Equal Partition}
\label{fig:p2p-scsk}
\end{figure}


\begin{figure}[h]
\begin{tabular}{c c}
\resizebox {0.45\linewidth} {!} {
\thetaVObjective{SCSK-C/objective/facebook-obj-scsk-c.csv}{}
}
&
\resizebox {0.45\linewidth} {!} {
\thetaVError{SCSK-C/error/facebook-error-scsk-c.csv}{}
}
\end{tabular}
\caption{\SCSKC, Facebook, $k=50$, a) $\theta$ vs. $f(X)$; b) $\theta$ vs. Additive Error with submodular cost on Basic Greedy, Random Partition and Equal Partition}
\label{fig:facebook-scsk}
\end{figure}


\begin{figure}[h]
\begin{tabular}{c c}
\resizebox {0.45\linewidth} {!} {
\thetaVObjective{SCSK-C/objective/bitcoin-obj-scsk-c.csv}{}
}
&
\resizebox {0.45\linewidth} {!} {
\thetaVError{SCSK-C/error/bitcoin-error-scsk-c.csv}{}
}
\end{tabular}
\caption{\SCSKC, Bitcoin, $k=50$, a) $\theta$ vs. $f(X)$; b) $\theta$ vs. Additive Error with submodular cost on Basic Greedy, Random Partition and Equal Partition}
\label{fig:bitcoin-scsk}
\end{figure}


\begin{figure}[h]
\begin{tabular}{c c}
\resizebox {0.45\linewidth} {!} {
\thetaVObjective{SCSK-C/objective/wiki-obj-scsk-c.csv}{}
}
&
\resizebox {0.45\linewidth} {!} {
\thetaVError{SCSK-C/error/wiki-error-scsk-c.csv}{}
}
\end{tabular}
\caption{\SCSKC, Wikipedia, $k=50$, a) $\theta$ vs. $f(X)$; b) $\theta$ vs. Additive Error with submodular cost on Basic Greedy, Random Partition and Equal Partition}
\label{fig:wiki-scsk}
\end{figure}


\begin{figure}[h]
\begin{tabular}{c c}
\resizebox {0.45\linewidth} {!} {
\thetaVObjective{SCSK-C/objective/dblp-obj-scsk-c.csv}{}
}
&
\resizebox {0.45\linewidth} {!} {
\thetaVError{SCSK-C/error/dblp-error-scsk-c.csv}{}
}
\end{tabular}
\caption{\SCSKC, DBLP, $k=50$, a) $\theta$ vs. $f(X)$; b) $\theta$ vs. Additive Error with submodular cost on Basic Greedy, Random Partition and Equal Partition}
\label{fig:dblp-scsk}
\end{figure}


% \begin{figure}[h]
% \begin{tabular}{c c}
% \resizebox {0.45\linewidth} {!} {
% \thetaVTime{SCSK-C/runtime/nethept-time-scsk-c.csv}{\Large  NetHept}
% }
% &
% \resizebox {0.45\linewidth} {!} {
% \thetaVTime{SCSK-C/runtime/p2p-time-scsk-c.csv}{\Large  p2p-Gnutella31}
% }
% \end{tabular}

% \begin{tabular}{c c}
% \resizebox {0.45\linewidth} {!} {
% \thetaVTime{SCSK-C/runtime/facebook-time-scsk-c.csv}{\Large Facebook}
% }
% &
% \resizebox {0.45\linewidth} {!} {
% \thetaVTime{SCSK-C/runtime/dblp-time-scsk-c.csv}{\Large DBLP}
% }
% \end{tabular}

% \begin{tabular}{c c}
% \resizebox {0.45\linewidth} {!} {
% \thetaVTime{SCSK-C/runtime/wiki-time-scsk-c.csv}{\Large Wikipedia}
% }
% &
% \resizebox {0.45\linewidth} {!} {
% \thetaVTime{SCSK-C/runtime/bitcoin-time-scsk-c.csv}{\Large Bitcoin}
% }
% \end{tabular}

% \caption{\SCSKC; $\theta$ vs. Runtime(s) with Submodular Cost on Basic Greedy, Random Partition and Equal Partition}
% \label{fig:time-scsk}
% \end{figure}


\begin{figure}[H]
\begin{tabular}{c c c}
\resizebox {0.3\linewidth} {!} {
\thetaVTime{SCSK-C/runtime/nethept-time-scsk-c.csv}{\Large  NetHept}
}
&
\resizebox {0.3\linewidth} {!} {
\thetaVTime{SCSK-C/runtime/p2p-time-scsk-c.csv}{\Large  p2p-Gnutella31}
}
&
\resizebox {0.3\linewidth} {!} {
\thetaVTime{SCSK-C/runtime/facebook-time-scsk-c.csv}{\Large Facebook}
}
\end{tabular}

\begin{tabular}{c c c}


\resizebox {0.3\linewidth} {!} {
\thetaVTime{SCSK-C/runtime/dblp-time-scsk-c.csv}{\Large DBLP}
}
&
\resizebox {0.3\linewidth} {!} {
\thetaVTime{SCSK-C/runtime/wiki-time-scsk-c.csv}{\Large Wikipedia}
}
&
\resizebox {0.3\linewidth} {!} {
\thetaVTime{SCSK-C/runtime/bitcoin-time-scsk-c.csv}{\Large Bitcoin}
}
\end{tabular}

\caption{\SCSKC; $\theta$ vs. Runtime(s) with Submodular Cost on Basic Greedy, Random Partition and Equal Partition}
\label{fig:time-scsk}
\end{figure}













% The diffusion of information in a social
% network under various probabilistic diffusion models is captured as a
% submodular function~\cite{Kempe:kdd03}. The problem input is a graph $G=(V,E)$ and a probability function $p(u,v), \forall (u,v)\in E$. The graph represents the users in the social network along with their connections (edges). The probability function represents the probability with which a user $u$ succeeds in influencing user $v$.
% For a (seed) set $X$, if
% information originates from $X$, the expected number of users in the
% network who receives (or potentially gets influenced by) the
% information is captured by the submodular function $f(X)$. The goal is to identify a set $X$ that maximizes $f(X)$. 
% On the other hand, there
%  is often some cost function $g$ associated with each seed set. Often cost functions are submodular in nature. Therefore, the objective is to
% maximize the value of submodular function $f$ subject to  the budgetary constraints on the
% cost (submodular function) and number (cardinality) of the seed set 
% engaged in the process. Thus, the problem is an instance of SCSK-C.

% Following the works of ~\cite{Crawford:ICML19}, we randomly generate the cost of each user($c(\cdot)$) from a normal distribution. We define a modular cost function $c(S) = \sum_{x\in S}c(x)$. We also define a submodular cost function $g$. For any $u\in V$, we say $R(u)$ is the set of vertices such that $v$ in $R(u)$ iff there exists a path $u\to v$ containing at most $3$ edges. For any set $S\subseteq V$, $R(S) = \bigcup_{u\in S}R(u)$. $R(\cdot)$ is a monotone, non-negative, non-decreasing submodular set function. We calculate the cost function $g(S) = 20\alpha\frac{|R(S)|}{|V|}$ where $\alpha$ is the median reachability. 

% We implemented the algorithms on the NetHept graph~\cite{NetGraph} submodular cost function. This graph has around $15,000$ vertices and $62,000$ edges.

\textbf{Results Analyses.\ } We chose $k = 50$ and varied the submodularity budget $\theta$ from $10$ to $300$. The results are shown in Figure ~\ref{fig:nethept-scsk} to ~\ref{fig:dblp-scsk}. As can be seen, the Basic Greedy, Equal Partition and Random Partition algorithms produce very similar results, except for Facebook. It can be seen  from Figure~\ref{fig:nethept-scsk}b,~\ref{fig:p2p-scsk}b,~\ref{fig:dblp-scsk}b,  that as the submodular budget increases, the additive error decreases. Recall that the additive factor is approximately the difference between the quality of the seed sets produced with submodular constraints $\theta$ and $2\theta$. Thus all $\theta$ grows larges there may not be much difference between the constraints $g(X) \leq \theta$ and $g(X) \leq 2\theta$. It is likely that a set that satisfies the latter constraint will also satisfy the former constraint.

We now analyze the quality of the solutions produced. For NetHept, P2p-Gnutella31 and DBLP  additive error is less than $10\%$ of $f(X)$  most of the time and much smaller many times. When this happens we can conclude that for all these sets $f(X) \geq 0.53f(OPT)$.
For example, for NetHept, when $k = 50, \theta =200$, the greedy algorithm produced a solution $X$ of size $50$, and the additive error is $0$ and $f(X)  = 968.21$. This implies that $f(X) \geq 0.63f(OPT)$. Another example is DBLP, at $\theta - 20$, Basic Greedy produced a solution with value $13810$ and the additive error is $1044$. This implies that additive error is leass than  which $7.5\%$ of the optimal value. Thus we can be guaranteed that the value produced by the algorithm is at least $0.55f(OPT)$. For graphs such as Facebook, Bitcoin, and Wikipedia additive errors are higher. For example, for Bitcoin with $\theta = 160$, the Basic Greedy produced a solution with value $110$ whereas the additive error is $26$. This implies that the value of the solution is at least $0.4f(OPT)$. The density of the graphs could explain this phenomenon. The Average degrees of Facebook, Bitcoin and Wikipedia graphs are 43, 12, and 29 whereas for the other graphs, the average degree is less than 8.  For higher  average degree graphs there is a larger difference between the constraints $g(X) \leq \theta$ and $g(X) \leq 2\theta$.
 

In terms of running time, these three algorithms are very fast. The comparisons are shown in Fig. \ref{fig:time-scsk}. Comparing with Random Partition and Basic Greedy, Equal Partition is faster for the reason that it started from a small cost, which took a smaller number of iterations. In contrast, Random Partition can generate various cost sequences, and the submodular cost of each iteration for Basic Greedy is fixed.

%with $62586$ vertices and $147892$ edges~\cite{NutGraph}.
% We report the results in Figure ~\ref{fig:p2p-scsk} and observe similar results. 

% Experiments for the speech data subset selection are reported in the appendix.
%The dynamic programming algorithm  outperforms Greedy and $0.63OPTBound$ apart with the exception of $\theta=20$. For smaller values of $\theta$, we observe that the additive error is high(Figure ~\ref{fig:infGnuAndSpeech} b).

% \subsection{Speech Data Subset Selection}

% We consider the Speech Data Subset selection problem
% ~\cite{Lin:Interspeech09,Lin:Interspeech11,Iyer:NIPS13}, where the goal
% is to select utterances with maximal acoustic variability constrained
% by the number of utterances and the words covered by the
% utterances. For scalability, we use a subset of the TIMIT dataset ~\cite{timit:DARPA}, which
% contains utterances spoken by a multitude of speakers along with their
% transcriptions. Let $V, W$ be the set of utterances and words
% respectively. A bipartite graph $G=(V\cup W, E)$ over $V$ and $W$
% describes the following relationship: if an utterance $v\in V$
% contains a word $w\in W$, an edge $(v, w)$ is present in the graph.
% Next, we use $s_{ij}$ to capture the similarity between any two
% utterances by capturing the string similarity of their corresponding
% transcriptions using the \emph{String Subsequence Kernel} metric
% defined in ~\cite{Lodhi:JMLR02}. Given $X\subseteq V$, we use the
% \emph{facility location} function $f(X) = \sum_{i\in V} max_{j\in X}
% s_{ij}$, which is known to be submodular~\cite{Iyer:NIPS13}.  We
% impose a cardinality constraint on the number of utterances selected,
% and we add a submodular constraint on the number of words that the
% solution $X$ can cover. This is precisely the neighbors of $X$ in the
% bipartite graph, which we denote by $g(X)$.



% We run the the basic greedy algorithm
% (Algorithm~\ref{algo:algorithm1}) and the dynamic programming algorithm.  The results are reported in Figure ~\ref{fig:infGnuAndSpeech}(c). As expected, the
%   former is outperformed by the latter. The difference between the
%   value of $f$ corresponding to the the sets computed by the two
%   algorithms tends to increase with an increase in submodularity
%   budget $\theta$. Larger budget is likely to provide more
%   possibilities in selecting budget-expenses in each step of the
%   (budget-conscious) greedy algorithm, and hence can achieve less
%   additive error compared to the ones resulting from basic greedy
%   algorithm. For this dataset, the difference between the solutions of Dynamic programming and $0.63OPTBound$ is larger.

% We also run the basic greedy algorithm while keeping track of the
% Additive Error (Figure ~\ref{fig:infGnuAndSpeech}(d)). We observe that in our dataset, as $\theta$ increases, there is
% a steep decline in the additive error, which eventually reaches
% zero. This provides an important information about the quality of the
% solution.  In particular, for the choices of $k, \theta$ presented in
% the experiment, we were able to obtain a solution of size $k$ which
% implies that when the additive error reaches zero, the algorithm has
% obtained a solution within a constant factor of the optimal solution.


% \newcommand{\greedyVsROI}[2]{
% \begin{tikzpicture}
%     \begin{axis}[xlabel=\textbf{$k$}, ylabel=\textbf{\Large $f(X) - g(X)$}, title=\textbf{#2}, legend columns=2, legend style={at={(0.5,-0.1)},anchor=north,draw=none}, transpose legend]
%         \pgfplotstableread[col sep=comma]{data/#1}
%         \datatable
        
%         \addplot table[y = greedy] from \datatable ;
%         \addplot table[y = dp] from \datatable ;
%         \addplot table[y = roigreedyk] from \datatable;
%         \addlegendentry{Algorithm $\mathcal{B}$}
%         \addlegendentry{\Large Dynamic Programming}
%         \addlegendentry{ROI-Greedy-k}
        
%     \end{axis}
% \end{tikzpicture}}





\subsection{Experiments for \DiffC}
\label{sec:exp:diff}
 

% \begin{figure}[H]
% \vspace{-0.5em}
% \begin{tabular}{c c}
% \resizebox {0.45\linewidth} {!} {
% \greedyVsROI{diffc/netheptGreedyVsROI.csv}{Nethept}
% }
% &
% \resizebox {0.45\linewidth} {!} {
% \greedyVsROI{diffc/amazonGreedyVsROI.csv}{Amazon}
% }
% \end{tabular}
% \caption{Budget vs Difference for a) NetHept; b)Amazon}
% \label{fig:diffcModular}
% \vspace{-0.5em}
% \end{figure}

% \textbf{Modular Cost Function}
% We see that both Algorithm $\mathcal{B}$ and Dynamic Programming outperforms ROI-Greedy-k in terms of the quality of the solution for increasing values of $k$. Additionally, we see that the Dynamic Programming outperforms Algorithm $\mathcal{B}$. As $k$ is increased, we see that the difference between Dynamic Programming and Algorithm $\mathcal{B}$ tends to increase. For example, on NetHept with $k=20$, Algorithm $\mathcal{B}$ outputs a difference value of $249.35$ while DP yields $305.72$. With $k=100$, the algorithms produce $482.60$ and  $685.34$ respectively. Under the same parameters, the gap between Algorithm $\mathcal{B}$ and ROI-Greedy-k reduces, however the former still outperforms ROI-Greedy-k.

% \textbf{Submodular Cost Function}
We use the Basic Greedy algorithm of \SCSKC as a subroutine of  Algorithms \loga and \lineara.

\textbf{Baseline Algorithm.\ } We compare our methods  against the supSub method proposed by ~\cite{Iyer:CORR12}. 
This replaces the submodular function $g$ with a surrogate modular function $g'$ and attempts to maximize $f-g'$. In addition, this method iteratively updates the surrogate modular function $g'$ the seed set until convergence.  
The work of~\cite{jin2021unconstrained} presents the best know  algorithm (called ROI-Greedy)  to maximize  
$f-g'$, when $f$ is submodular and $g'$ is modular. 
In our  implementation  of supsub, we use this algorithm.
 We vary the cardinality constraint $k$ from $10$ to $100$ to compare our \loga and \lineara with supSub.


\textbf{Results Analyses.\ } As we see in Figure ~\ref{fig:nethept-diff} to \ref{fig:dblp-diff},  Algorithm \loga and \lineara perform better than the supSub method. Interestingly, we observe that \loga and \lineara produced similar results on NetHept, p2p-Gnutella31, Bitcoin and DBLP. This observation suggests that when the cost function is submodular, it may suffice to just use \loga since it is fast while sacrifices just a little bit of objective value. See Fig. \ref{fig:time-diff} for running time comparisons. We can also see that supSub performed well on Wikipedia. However, supSub needs more time to converge on this network. Nevertheless, in general, there is still a significant gap between \loga and SupSub. 


    \def\addlegendimage{\csname pgfplots@addlegendimage\endcsname}
\pgfplotsset{
cycle list={%
% {draw=green,mark=star,solid}, % 
{draw=blue, mark=square,solid},%densely dashed}, % 
% {draw=black,mark=+,solid},%dashdotted}, %every mark/.append style={rotate=90}, % Random Partition
{draw=brown,mark=o,solid}, % 
% {draw=red,mark=square,solid}, % 0.63OPT Upper Bound
{draw=black,mark=+,solid}, % 
% {draw=pink,mark=square,solid} % Random Greedy
}}

\begin{figure}[H]
\begin{tikzpicture}
        \begin{customlegend}[legend columns=3,legend style={align=center,draw=none,column sep=2ex},legend entries={\loga, \lineara, supSub}]
        % \addlegendimage{draw=green,mark=star,solid}
        \addlegendimage{draw=blue, mark=square,solid}
        % \addlegendimage{draw=black,mark=+,solid}
        \addlegendimage{draw=brown,mark=o,solid}
        % \addlegendimage{draw=red,mark=square,solid}
        \addlegendimage{draw=black,mark=+,solid}
        % \addlegendimage{draw=pink,mark=square,solid}
        \end{customlegend}
     \end{tikzpicture}
\end{figure} 

\begin{figure}[H]
\vspace{-0.5em}
\begin{tabular}{c c}
\resizebox {0.45\linewidth} {!} {
\diffValuesSubmodularCost{DIFF-C/objective/nethept-obj-diff-c.csv}{}
}
&
\resizebox {0.45\linewidth} {!} {
\diffErrorsSubmodularCost{DIFF-C/error/nethept-error-diff-c.csv}{}
}
\end{tabular}
\caption{\DiffC, NetHept a) Budget vs Difference on \loga, \lineara and supSub; b) Budget vs Additive error on \loga and \lineara}
\label{fig:nethept-diff}
\vspace{-0.5em}
\end{figure}


\begin{figure}[H]
\vspace{-0.5em}
\begin{tabular}{c c}
\resizebox {0.45\linewidth} {!} {
\diffValuesSubmodularCost{DIFF-C/objective/p2p-obj-diff-c.csv}{}
}
&
\resizebox {0.45\linewidth} {!} {
\diffErrorsSubmodularCost{DIFF-C/error/p2p-error-diff-c.csv}{}
}
\end{tabular}
\caption{\DiffC, p2p-Gnutella31; a) Budget vs Difference on \loga, \lineara and supSub; b) Budget vs Additive error on \loga and \lineara}
\label{fig:nethept-diff}
\vspace{-0.5em}
\end{figure}

\begin{figure}[H]
\vspace{-0.5em}
\begin{tabular}{c c}
\resizebox {0.45\linewidth} {!} {
\diffValuesSubmodularCost{DIFF-C/objective/facebook-obj-diff-c.csv}{}
}
&
\resizebox {0.45\linewidth} {!} {
\diffErrorsSubmodularCost{DIFF-C/error/facebook-error-diff-c.csv}{}
}
\end{tabular}
\caption{\DiffC, Facebook; a) Budget vs Difference on \loga, \lineara and supSub; b) Budget vs Additive error on \loga and \lineara}
\label{fig:facebook-diff}
\vspace{-0.5em}
\end{figure}


\begin{figure}[H]
\vspace{-0.5em}
\begin{tabular}{c c}
\resizebox {0.45\linewidth} {!} {
\diffValuesSubmodularCost{DIFF-C/objective/bitcoin-obj-diff-c.csv}{}
}
&
\resizebox {0.45\linewidth} {!} {
\diffErrorsSubmodularCost{DIFF-C/error/bitcoin-error-diff-c.csv}{}
}
\end{tabular}
\caption{\DiffC, Bitcoin; a) Budget vs Difference on \loga, \lineara and supSub; b) Budget vs Additive error on \loga and \lineara}
\label{fig:bitcoin-diff}
\vspace{-0.5em}
\end{figure}


\begin{figure}[H]
\vspace{-0.5em}
\begin{tabular}{c c}
\resizebox {0.45\linewidth} {!} {
\diffValuesSubmodularCost{DIFF-C/objective/wiki-obj-diff-c.csv}{}
}
&
\resizebox {0.45\linewidth} {!} {
\diffErrorsSubmodularCost{DIFF-C/error/wiki-error-diff-c.csv}{}
}
\end{tabular}
\caption{\DiffC, Wikipedia; a) Budget vs Difference on \loga, \lineara and supSub; b) Budget vs Additive error on \loga and \lineara}
\label{fig:wiki-diff}
\vspace{-0.5em}
\end{figure}


\begin{figure}[H]
\vspace{-0.5em}
\begin{tabular}{c c}
\resizebox {0.45\linewidth} {!} {
\diffValuesSubmodularCost{DIFF-C/objective/dblp-obj-diff-c.csv}{}
}
&
\resizebox {0.45\linewidth} {!} {
\diffErrorsSubmodularCost{DIFF-C/error/dblp-error-diff-c.csv}{}
}
\end{tabular}
\caption{\DiffC; DBLP a) Budget vs Difference on \loga, \lineara and supSub; b) Budget vs Additive error on \loga and \lineara}
\label{fig:dblp-diff}
\vspace{-0.5em}
\end{figure}


% \begin{figure}[h]
% \begin{tabular}{c c}
% \resizebox {0.45\linewidth} {!} { 
% \diffTimeSubmodularCost{DIFF-C/runtime/nethept-time-diff-c.csv}{\Large  NetHept}
% }
% &
% \resizebox {0.45\linewidth} {!} {
% \diffTimeSubmodularCost{DIFF-C/runtime/p2p-time-diff-c.csv}{\Large  p2p-Gnutella31}
% }
% \end{tabular}

% \begin{tabular}{c c}
% \resizebox {0.45\linewidth} {!} {
% \diffTimeSubmodularCost{DIFF-C/runtime/facebook-time-diff-c.csv}{\Large Facebook}
% }
% &
% \resizebox {0.45\linewidth} {!} {
% \diffTimeSubmodularCost{DIFF-C/runtime/dblp-time-diff-c.csv}{\Large DBLP}
% }
% \end{tabular}

% \begin{tabular}{c c}
% \resizebox {0.45\linewidth} {!} {
% \diffTimeSubmodularCost{DIFF-C/runtime/wiki-time-diff-c.csv}{\Large Wikipedia}
% }
% &
% \resizebox {0.45\linewidth} {!} {
% \diffTimeSubmodularCost{DIFF-C/runtime/bitcoin-time-diff-c.csv}{\Large Bitcoin}
% }
% \end{tabular}

% \caption{\DiffC; $k$ vs. Runtime(s) on \loga, \lineara and supSub with Submodular Cost}
% \label{fig:time-diff}
% \end{figure}


\begin{figure}[H]
\begin{tabular}{c c c}
\resizebox {0.3\linewidth} {!} { 
\diffTimeSubmodularCost{DIFF-C/runtime/nethept-time-diff-c.csv}{\Large  NetHept}
}
&
\resizebox {0.3\linewidth} {!} {
\diffTimeSubmodularCost{DIFF-C/runtime/p2p-time-diff-c.csv}{\Large  p2p-Gnutella31}
}
&
\resizebox {0.3\linewidth} {!} {
\diffTimeSubmodularCost{DIFF-C/runtime/facebook-time-diff-c.csv}{\Large Facebook}
}
\end{tabular}

\begin{tabular}{c c c}


\resizebox {0.3\linewidth} {!} {
\diffTimeSubmodularCost{DIFF-C/runtime/dblp-time-diff-c.csv}{\Large DBLP}
}
&
\resizebox {0.3\linewidth} {!} {
\diffTimeSubmodularCost{DIFF-C/runtime/wiki-time-diff-c.csv}{\Large Wikipedia}
}
&
\resizebox {0.3\linewidth} {!} {
\diffTimeSubmodularCost{DIFF-C/runtime/bitcoin-time-diff-c.csv}{\Large Bitcoin}
}
\end{tabular}

\caption{\DiffC; $k$ vs. Logarithm of Runtime(s) on \loga, \lineara and supSub with Submodular Cost}
\label{fig:time-diff}
\end{figure}



\bibliography{padmanabhan_530}

\end{document}
