\documentclass[accepted]{uai2023} % for initial submission
% \documentclass[accepted]{uai2023} % after acceptance, for a revised
                                    % version; also before submission to
                                    % see how the non-anonymous paper
                                    % would look like

%% There is a class option to choose the math font
% \documentclass[mathfont=ptmx]{uai2023} % ptmx math instead of Computer
% Modern (has noticable issues)
% \documentclass[mathfont=newtx]{uai2023} % newtx fonts (improves upon
 % ptmx; less tested, no support)
% NOTE: Only keep *one* line above as appropriate, as it will be replaced
%       automatically for papers to be published. Do not make any other
%       change above this note for an accepted version.

%% Choose your variant of English; be consistent
\usepackage[american]{babel}
% \usepackage[british]{babel}
% \alg: typesets the method name "kicn" in small caps; write \alg{} in running
% text so that the following space is not swallowed.
\newcommand{\alg}{{\scshape kicn}}
%% Some suggested packages, as needed:
\usepackage{natbib} % has a nice set of citation styles and commands
    \bibliographystyle{plainnat}
    \renewcommand{\bibsection}{\subsubsection*{References}}
\usepackage{mathtools} % amsmath with fixes and additions
% \usepackage{siunitx} % for proper typesetting of numbers and units
\usepackage{booktabs} % commands to create good-looking tables
 \usepackage{multirow}
\usepackage[dvipsnames]{xcolor}
\usepackage{tikz} % nice language for creating drawings and diagrams
\usetikzlibrary{arrows,positioning}
% for cross referencing the main text
% PLEASE ONLY USE xr IN THE SUPPLEMENTARY MATERIAL. 
% In the main paper, hard code any cross-reference to the supplementary material. 
\usepackage{xr} 


%\externaldocument{mathur_549}

%% Provided macros
% \smaller: Because the class footnote size is essentially LaTeX's \small,
%           redefining \footnotesize, we provide the original \footnotesize
%           using this macro.
%           (Use only sparingly, e.g., in drawings, as it is quite small.)

%% Self-defined macros
% \swap[<sep>]{<a>}{<b>}: typesets <b>, then <sep> (default "-"), then <a>.
\newcommand{\swap}[3][-]{#3#1#2} % just an example
% \eat{<text>}: discards its argument and produces no output.
\newcommand{\eat}[1]{}

\title{Knowledge Intensive Learning of Cutset Networks\\(Supplementary Material)}

% The standard author block has changed for UAI 2023 to provide
% more space for long author lists and allow for complex affiliations
%
% All author information is automatically removed by the class for the
% anonymous submission version of your paper, so you can already add your
% information below.
%
% Add authors
\author[1]{\href{mailto:<SaurabhSanjay.Mathur@utdallas.edu>?Subject=Your UAI 2023 paper}{Saurabh Mathur}{}}
\author[1]{Vibhav Gogate}
\author[1]{Sriraam Natarajan}

% Add affiliations after the authors
\affil[1]{%
    Erik Jonsson School of Engineering \& Computer Science\\
    University of Texas at Dallas\\
    Richardson, Texas, USA
}
  
  \begin{document}
  
%\onecolumn %% Turn this off if single column is desired for the supplement
\maketitle


\appendix

\section{Dataset Details}
Table~\ref{tab:data} shows the number of variables, the number of qualitative influences, and the number of examples in each of the data sets.
\section{Cutset Network structures}
Figure~\ref{fig:haberman} shows the CNs fit on the haberman data set using LearnCNet (left) and \alg{} (right). While the CN fit using LearnCNet selects the year of surgery (Year) as the top node, the CN fit using \alg{} selects the number of positive axillary nodes detected (Nodes) as the top node. This is in line with prior work that identifies the number of positive axillary nodes as the most important risk factor~\citep{fisher1983relation}.

Figure~\ref{fig:ppd} shows the CNs fit on the ppd data set using LearnCNet (left) and \alg{} (right). While the CN fit using LearnCNet selects PPD, Child care stress, and Employment status as the top variables after Age, the CN fit using \alg{} selects Maternity Blues and a History of Depression. Maternity Blues and a History of Depression are important risk factors for Post-partum depression~\citep{zanardo2020maternity, o1996rates}.

Figure~\ref{fig:adni} shows the CNs fit on the adni data set using LearnCNet (left) and \alg{} (right). While the CN fit using LearnCNet selects Education as the top variable, the CN fit using \alg{} selects Age as the top variable. Age is the most important risk factor in Alzheimer's Disease~\citep{knopman2021alzheimer}.



\section{Additional Results on Benchmark data sets}
Table~\ref{tab:structure} shows the number of edges and the number of free parameters in the CNs fit using LearnCNet and \alg{}.


% Figure fig:haberman: two side-by-side TikZ trees, each showing a root node,
% its children, and a number on every root-to-child edge (presumably the
% branch weight -- confirm against the main paper).
\begin{figure*}[!ht]
    \centering
    % Left panel (LearnCNet): root "Year" with five children.
    % NOTE: product_node and sum_node are defined but not used in this figure.
    \resizebox{0.4\linewidth}{!}{
    
        \tikzset{
  treenode/.style = {align=center, inner sep=0pt, text centered,
    font=\sffamily},
  or_node/.style = {treenode, circle, black, font=\sffamily\tiny, draw=black,
    fill=none, text width=1.5em},  
  product_node/.style = {treenode, circle, black, font=\sffamily\bfseries, draw=none,
    fill=blue!20, text width=1.5em},  
  sum_node/.style = {treenode, circle, black,  font=\sffamily\bfseries, draw=none, 
    fill=red!20, text width=1.5em},
  leaf_node/.style = {treenode, rectangle, ForestGreen, font=\tiny, draw=ForestGreen,dashed,
    fill=none, text width=2em, minimum height=2em}
}
% The coordinate c1 sits below the root and anchors the row of children;
% each edge label is drawn in a white \colorbox so the line does not cross it.
\begin{tikzpicture}[node distance=0.7cm]
\node[or_node, name=n1]{Year};
\coordinate[below of = n1,yshift=-0.5cm](c1);
\node[or_node,name=n11,left of = c1, xshift=-0.5cm]{Age};
\node[or_node,name=n12,right of = n11, xshift=0cm]{Nodes};
\node[or_node,name=n13,right of = n12, xshift=0cm]{Age};
\node[or_node,name=n14,right of = n13, xshift=0cm]{Age};
\node[or_node,name=n15,right of = n14, xshift=0cm]{Age};
\draw (n1) --  node[sloped,midway,align=center]{
    \setlength{\fboxsep}{1pt}\colorbox{white}{\tiny \sffamily 0.24}
}(n11);
\draw  (n1) --  node[sloped,midway,align=center]{
    \setlength{\fboxsep}{1pt}\colorbox{white}{\tiny \sffamily 0.12}
}(n12);
\draw   (n1) --  node[sloped,midway,align=center]{
    \setlength{\fboxsep}{1pt}\colorbox{white}{\tiny \sffamily 0.25}
}(n13);
\draw  (n1) --  node[sloped,midway,align=center]{
   \setlength{\fboxsep}{1pt}\colorbox{white}{\tiny \sffamily 0.19}
}(n14);
\draw  (n1) --  node[sloped,midway,align=center]{
    \setlength{\fboxsep}{1pt}\colorbox{white}{\tiny \sffamily 0.2}
}(n15);
\end{tikzpicture}
    }
    % Right panel (\alg{}): root "Nodes" with two OR-node children and one
    % dashed leaf node $T_1$. The styles are repeated because the previous
    % \tikzset was local to the left panel's box.
    \resizebox{0.25\linewidth}{!}{
        \tikzset{
  treenode/.style = {align=center, inner sep=0pt, text centered,
    font=\sffamily},
  or_node/.style = {treenode, circle, black, font=\sffamily\tiny, draw=black,
    fill=none, text width=1.5em},  
  product_node/.style = {treenode, circle, black, font=\sffamily\bfseries, draw=none,
    fill=blue!20, text width=1.5em},  
  sum_node/.style = {treenode, circle, black,  font=\sffamily\bfseries, draw=none, 
    fill=red!20, text width=1.5em},
  leaf_node/.style = {treenode, rectangle, ForestGreen, font=\tiny, draw=ForestGreen,dashed,
    fill=none, text width=2em, minimum height=2em}
}
\begin{tikzpicture}[node distance=0.7cm]
\node[or_node, name=n1]{Nodes};
\coordinate[below of = n1,yshift=-0.5cm](c1);
\node[or_node,name=n11,left of = c1, xshift=0cm]{Age};
\node[or_node,name=n12,right of = n11, xshift=0cm]{Age};
\node[leaf_node,name=n13,right of = n12, xshift=0cm]{$T_1$};
\draw (n1) --  node[sloped,midway,align=center]{
    \setlength{\fboxsep}{1pt}\colorbox{white}{\tiny \sffamily 0.82}
}(n11);
\draw  (n1) --  node[sloped,midway,align=center]{
    \setlength{\fboxsep}{1pt}\colorbox{white}{\tiny \sffamily 0.17}
}(n12);
\draw   (n1) --  node[sloped,midway,align=center]{
    \setlength{\fboxsep}{1pt}\colorbox{white}{\tiny \sffamily 0.01}
}(n13);
\end{tikzpicture}
    }
    \caption{First two levels of cutset networks fit on a sample of the haberman data set using LearnCNet (left) and \alg{} (right).}
    \label{fig:haberman}
\end{figure*}

% Figure fig:ppd: two side-by-side TikZ trees, each showing a root node, its
% children, and a number on every root-to-child edge (presumably the branch
% weight -- confirm against the main paper).
\begin{figure*}[!h]
    \centering
    % Left panel (LearnCNet): root "Age" with children PPD, Child Stress and
    % Employed.
    % NOTE: product_node, sum_node and leaf_node are defined but not used in
    % this figure.
    \resizebox{0.25\linewidth}{!}{
        
        \tikzset{
  treenode/.style = {align=center, inner sep=0pt, text centered,
    font=\sffamily},
  or_node/.style = {treenode, circle, black, font=\sffamily\tiny, draw=black,
    fill=none, text width=2em},  
  product_node/.style = {treenode, circle, black, font=\sffamily\bfseries, draw=none,
    fill=blue!20, text width=1.5em},  
  sum_node/.style = {treenode, circle, black,  font=\sffamily\bfseries, draw=none, 
    fill=red!20, text width=1.5em},
  leaf_node/.style = {treenode, rectangle, ForestGreen, font=\tiny, draw=ForestGreen,dashed,
    fill=none, text width=2em, minimum height=2em}
}
% The coordinate c1 sits below the root and anchors the row of children;
% each edge label is drawn in a white \colorbox so the line does not cross it.
\begin{tikzpicture}[node distance=1cm]
\node[or_node, name=n1]{Age};
\coordinate[below of = n1,yshift=-0.5cm](c1);
\node[or_node,name=n11,left of = c1, xshift=0cm]{PPD};
\node[or_node,name=n12,right of = n11, xshift=0cm]{Child\\Stress};
\node[or_node,name=n13,right of = n12, xshift=0cm]{Employed};
\draw (n1) --  node[sloped,midway,align=center]{
    \setlength{\fboxsep}{1pt}\colorbox{white}{\tiny \sffamily 0.43}
}(n11);
\draw  (n1) --  node[sloped,midway,align=center]{
    \setlength{\fboxsep}{1pt}\colorbox{white}{\tiny \sffamily 0.43}
}(n12);
\draw   (n1) --  node[sloped,midway,align=center]{
    \setlength{\fboxsep}{1pt}\colorbox{white}{\tiny \sffamily 0.15}
}(n13);
\end{tikzpicture}
    }
    % Right panel (\alg{}): root "Age" with children Maternity Blues,
    % Past Depres. and Maternity Blues. The edge labels match the left panel,
    % which also has "Age" at the root. The styles are repeated because the
    % previous \tikzset was local to the left panel's box.
    \resizebox{0.25\linewidth}{!}{
        
        \tikzset{
  treenode/.style = {align=center, inner sep=0pt, text centered,
    font=\sffamily},
  or_node/.style = {treenode, circle, black, font=\sffamily\tiny, draw=black,
    fill=none, text width=2em},  
  product_node/.style = {treenode, circle, black, font=\sffamily\bfseries, draw=none,
    fill=blue!20, text width=1.5em},  
  sum_node/.style = {treenode, circle, black,  font=\sffamily\bfseries, draw=none, 
    fill=red!20, text width=1.5em},
  leaf_node/.style = {treenode, rectangle, ForestGreen, font=\tiny, draw=ForestGreen,dashed,
    fill=none, text width=2em, minimum height=2em}
}
\begin{tikzpicture}[node distance=1cm]
\node[or_node, name=n1]{Age};
\coordinate[below of = n1,yshift=-0.5cm](c1);
\node[or_node,name=n11,left of = c1, xshift=0cm]{Maternity Blues};
\node[or_node,name=n12,right of = n11, xshift=0cm]{Past\\Depres.};
\node[or_node,name=n13,right of = n12, xshift=0cm]{Maternity Blues};
\draw (n1) --  node[sloped,midway,align=center]{
    \setlength{\fboxsep}{1pt}\colorbox{white}{\tiny \sffamily 0.43}
}(n11);
\draw  (n1) --  node[sloped,midway,align=center]{
    \setlength{\fboxsep}{1pt}\colorbox{white}{\tiny \sffamily 0.43}
}(n12);
\draw   (n1) --  node[sloped,midway,align=center]{
    \setlength{\fboxsep}{1pt}\colorbox{white}{\tiny \sffamily 0.15}
}(n13);
\end{tikzpicture}
    }
    \caption{First two levels of cutset networks fit on a sample of the ppd data set using LearnCNet (left) and \alg{} (right).}
    \label{fig:ppd}
\end{figure*}

% Figure fig:adni: two side-by-side TikZ trees, each showing a root node, its
% children, and a number on every root-to-child edge (presumably the branch
% weight -- confirm against the main paper).
\begin{figure*}[!h]
    \centering
    % Left panel (LearnCNet): root "Education" with five children.
    % NOTE: product_node, sum_node and leaf_node are defined but not used in
    % this figure.
    \resizebox{0.4\linewidth}{!}{
        
        \tikzset{
  treenode/.style = {align=center, inner sep=0pt, text centered,
    font=\sffamily},
  or_node/.style = {treenode, circle, black, font=\sffamily\tiny, draw=black,
    fill=none, text width=2.2em},  
  product_node/.style = {treenode, circle, black, font=\sffamily\bfseries, draw=none,
    fill=blue!20, text width=1.5em},  
  sum_node/.style = {treenode, circle, black,  font=\sffamily\bfseries, draw=none, 
    fill=red!20, text width=1.5em},
  leaf_node/.style = {treenode, rectangle, ForestGreen, font=\tiny, draw=ForestGreen,dashed,
    fill=none, text width=2em, minimum height=2em}
}
% The coordinate c1 sits below the root and anchors the row of children;
% each edge label is drawn in a white \colorbox so the line does not cross it.
\begin{tikzpicture}[node distance=1cm]
\node[or_node, name=n1]{Education};
\coordinate[below of = n1,yshift=-0.5cm](c1);
\node[or_node,name=n11,left of = c1, xshift=-0.5cm]{MMScore};
\node[or_node,name=n12,right of = n11, xshift=0cm]{Age};
\node[or_node,name=n13,right of = n12, xshift=0cm]{MMScore};
\node[or_node,name=n14,right of = n13, xshift=0cm]{MMScore};
\node[or_node,name=n15,right of = n14, xshift=0cm]{MMScore};
\draw (n1) --  node[sloped,midway,align=center]{
    \setlength{\fboxsep}{1pt}\colorbox{white}{\tiny \sffamily 0.23}
}(n11);
\draw  (n1) --  node[sloped,midway,align=center]{
    \setlength{\fboxsep}{1pt}\colorbox{white}{\tiny \sffamily 0.12}
}(n12);
\draw   (n1) --  node[sloped,midway,align=center]{
    \setlength{\fboxsep}{1pt}\colorbox{white}{\tiny \sffamily 0.23}
}(n13);
\draw   (n1) --  node[sloped,midway,align=center]{
    \setlength{\fboxsep}{1pt}\colorbox{white}{\tiny \sffamily 0.25}
}(n14);
\draw   (n1) --  node[sloped,midway,align=center]{
    \setlength{\fboxsep}{1pt}\colorbox{white}{\tiny \sffamily 0.16}
}(n15);
\end{tikzpicture}
    
    }
    % Right panel (\alg{}): root "Age" with four children (three Diagnosis
    % nodes and one Race node). The styles are repeated because the previous
    % \tikzset was local to the left panel's box.
    \resizebox{0.35\linewidth}{!}{
        
        \tikzset{
  treenode/.style = {align=center, inner sep=0pt, text centered,
    font=\sffamily},
  or_node/.style = {treenode, circle, black, font=\sffamily\tiny, draw=black,
    fill=none, text width=2.2em},  
  product_node/.style = {treenode, circle, black, font=\sffamily\bfseries, draw=none,
    fill=blue!20, text width=1.5em},  
  sum_node/.style = {treenode, circle, black,  font=\sffamily\bfseries, draw=none, 
    fill=red!20, text width=1.5em},
  leaf_node/.style = {treenode, rectangle, ForestGreen, font=\tiny, draw=ForestGreen,dashed,
    fill=none, text width=2em, minimum height=2em}
}
\begin{tikzpicture}[node distance=1cm]
\node[or_node, name=n1]{Age};
\coordinate[below of = n1,yshift=-0.5cm](c1);
\node[or_node,name=n11,left of = c1, xshift=-0.5cm]{Diagnosis};
\node[or_node,name=n12,right of = n11, xshift=0cm]{Diagnosis};
\node[or_node,name=n13,right of = n12, xshift=0cm]{Diagnosis};
\node[or_node,name=n14,right of = n13, xshift=0cm]{Race};
\draw (n1) --  node[sloped,midway,align=center]{
    \setlength{\fboxsep}{1pt}\colorbox{white}{\tiny \sffamily 0.09}
}(n11);
\draw  (n1) --  node[sloped,midway,align=center]{
    \setlength{\fboxsep}{1pt}\colorbox{white}{\tiny \sffamily 0.36}
}(n12);
\draw   (n1) --  node[sloped,midway,align=center]{
    \setlength{\fboxsep}{1pt}\colorbox{white}{\tiny \sffamily 0.47}
}(n13);
\draw   (n1) --  node[sloped,midway,align=center]{
    \setlength{\fboxsep}{1pt}\colorbox{white}{\tiny \sffamily 0.08}
}(n14);
\end{tikzpicture}
    
    }
    \caption{First two levels of cutset networks fit on a sample of the adni data set using LearnCNet (left) and \alg{} (right).}
    \label{fig:adni}
\end{figure*}

% Table tab:data: one row per data set, giving the number of variables, the
% number of qualitative influences, and the training/test set sizes.
\begin{table}[!t]
  \centering
  \begin{tabular}{lrrrr}
    \toprule
    \textbf{Data set} & $|\textbf{X}|$ & $|C|$ & $|\mathcal{D}_\text{train}|$ & $|\mathcal{D}_\text{test}|$ \\
    \midrule
    % First group: presumably the UCI benchmark data sets -- confirm.
    cpu        &  7 &  6 &   104 &   105 \\
    ljubljana  &  9 &  6 &   138 &   139 \\
    haberman   &  4 &  3 &   153 &   153 \\
    auto       &  8 &  5 &   196 &   196 \\
    yeast      &  9 &  7 &   742 &   742 \\
    car        &  7 &  2 &   864 &   864 \\
    redwine    & 12 & 19 &   799 &   800 \\
    whitewine  & 12 &  8 & 2,449 & 2,449 \\
    abalone    &  9 & 17 & 2,088 & 2,089 \\
    cleveland  & 12 &  6 &   148 &   149 \\
    diabetes   &  5 &  4 &   364 &   365 \\
    \midrule
    % Second group: presumably data sampled from Bayesian networks -- confirm.
    sachs      & 11 &  6 &   100 &   100 \\
    asia       &  8 &  5 &   100 &   100 \\
    earthquake &  5 &  3 &   100 &   100 \\
    survey     &  6 &  5 &   100 &   100 \\
    \midrule
    % Third group: remaining data sets (ppd, adni, numom2b).
    ppd        & 11 &  4 &    86 &    87 \\
    adni       &  7 &  3 &   168 &   168 \\
    numom2b-a  &  7 &  6 & 3,292 & 3,292 \\
    numom2b-b  &  8 &  7 & 1,828 & 1,829 \\
    \bottomrule
  \end{tabular}
  \caption{The number of datapoints in training ($|\mathcal{D}_\text{train}|$) and test sets ($|\mathcal{D}_\text{test}|$), number of variables ($|\textbf{X}|$) and the number of qualitative influences ($|C|$) for all the data sets used in evaluation.}
  \label{tab:data}
\end{table}



% Table tab:structure: edge counts and free-parameter counts of the cutset
% networks learned by LearnCNet and \alg{}, one row per data set.
% All values are written with one decimal place for consistency.
\begin{table*}[!t]
\centering
\begin{tabular}{lrrrr}
\toprule
& \multicolumn{2}{c}{\textbf{Edge count}} & \multicolumn{2}{c}{\textbf{Parameter count}} \\
\cmidrule(lr){2-3} \cmidrule(lr){4-5}
\textbf{Data set} & \textbf{LearnCNet} & \textbf{\alg{}} & \textbf{LearnCNet} & \textbf{\alg{}} \\
\midrule
% Rows 1--11: UCI data sets (see caption).
cpu        & 75.2  & 71.2  & 276.8   & 266.8   \\
ljubljana  & 155.7 & 171.9 & 441.5   & 439.5   \\
haberman   & 30.7  & 24.4  & 134.8   & 109.8   \\
auto       & 173.8 & 205.6 & 724.4   & 735.6   \\
car        & 178.7 & 187.6 & 1,115.7 & 1,070.7 \\
abalone    & 720.0 & 354.4 & 2,914.8 & 1,360.4 \\
redwine    & 635.4 & 674.8 & 1,006.1 & 978.4   \\
whitewine  & 801.5 & 933.1 & 1,172.5 & 1,240.7 \\
yeast      & 556.8 & 541.6 & 1,808.3 & 1,694.3 \\
cleveland  & 265.3 & 277.7 & 687.0   & 673.7   \\
diabetes   & 51.3  & 45.6  & 270.2   & 266.0   \\
\midrule
% Rows 12--15: data sampled from Bayesian networks (see caption).
sachs      & 193.4 & 208.6 & 888.0   & 843.2   \\
asia       & 47.4  & 49.4  & 73.3    & 72.9    \\
earthquake & 11.0  & 11.0  & 18.4    & 17.7    \\
survey     & 27.7  & 25.9  & 63.8    & 62.8    \\
\bottomrule
\end{tabular}
\caption{The number of edges and the number of free parameters for cutset networks fit using LearnCNet and \alg{} on UCI data sets with 30\% noise (rows 1--11) and data sampled from Bayesian Networks (rows 12--15). The counts are averaged over 10 bootstrap samples.}\label{tab:structure}
\end{table*}

\clearpage
\bibliography{mathur_549}

\end{document}
