\documentclass[accepted]{uai2023}


\usepackage{xr}
\makeatletter

\newcommand*{\addFileDependency}[1]{\typeout{(#1)}\@addtofilelist{#1}
\IfFileExists{#1}{}{\typeout{No file #1.}}
}\makeatother

\newcommand*{\myexternaldocument}[1]{\externaldocument{#1}\addFileDependency{#1.tex}\addFileDependency{#1.aux}}
\myexternaldocument{sharma_596}




\usepackage[american]{babel}


\usepackage{amsmath,amsfonts,bm}

\newcommand{\figleft}{{\em (Left)}}
\newcommand{\figcenter}{{\em (Center)}}
\newcommand{\figright}{{\em (Right)}}
\newcommand{\figtop}{{\em (Top)}}
\newcommand{\figbottom}{{\em (Bottom)}}
\newcommand{\captiona}{{\em (a)}}
\newcommand{\captionb}{{\em (b)}}
\newcommand{\captionc}{{\em (c)}}
\newcommand{\captiond}{{\em (d)}}

\newcommand{\newterm}[1]{{\bf #1}}


\def\figref#1{figure~\ref{#1}}
\def\Figref#1{Figure~\ref{#1}}
\def\twofigref#1#2{figures \ref{#1} and \ref{#2}}
\def\quadfigref#1#2#3#4{figures \ref{#1}, \ref{#2}, \ref{#3} and \ref{#4}}
\def\secref#1{section~\ref{#1}}
\def\Secref#1{Section~\ref{#1}}
\def\twosecrefs#1#2{sections \ref{#1} and \ref{#2}}
\def\secrefs#1#2#3{sections \ref{#1}, \ref{#2} and \ref{#3}}
\def\eqref#1{equation~\ref{#1}}
\def\Eqref#1{Equation~\ref{#1}}
\def\plaineqref#1{\ref{#1}}
\def\chapref#1{chapter~\ref{#1}}
\def\Chapref#1{Chapter~\ref{#1}}
\def\rangechapref#1#2{chapters\ref{#1}--\ref{#2}}
\def\algref#1{algorithm~\ref{#1}}
\def\Algref#1{Algorithm~\ref{#1}}
\def\twoalgref#1#2{algorithms \ref{#1} and \ref{#2}}
\def\Twoalgref#1#2{Algorithms \ref{#1} and \ref{#2}}
\def\partref#1{part~\ref{#1}}
\def\Partref#1{Part~\ref{#1}}
\def\twopartref#1#2{parts \ref{#1} and \ref{#2}}

\def\ceil#1{\lceil #1 \rceil}
\def\floor#1{\lfloor #1 \rfloor}
\def\1{\bm{1}}
\newcommand{\train}{\mathcal{D}}
\newcommand{\valid}{\mathcal{D_{\mathrm{valid}}}}
\newcommand{\test}{\mathcal{D_{\mathrm{test}}}}

\def\eps{{\epsilon}}


\def\reta{{\textnormal{$\eta$}}}
\def\ra{{\textnormal{a}}}
\def\rb{{\textnormal{b}}}
\def\rc{{\textnormal{c}}}
\def\rd{{\textnormal{d}}}
\def\re{{\textnormal{e}}}
\def\rf{{\textnormal{f}}}
\def\rg{{\textnormal{g}}}
\def\rh{{\textnormal{h}}}
\def\ri{{\textnormal{i}}}
\def\rj{{\textnormal{j}}}
\def\rk{{\textnormal{k}}}
\def\rl{{\textnormal{l}}}
\def\rn{{\textnormal{n}}}
\def\ro{{\textnormal{o}}}
\def\rp{{\textnormal{p}}}
\def\rq{{\textnormal{q}}}
\def\rr{{\textnormal{r}}}
\def\rs{{\textnormal{s}}}
\def\rt{{\textnormal{t}}}
\def\ru{{\textnormal{u}}}
\def\rv{{\textnormal{v}}}
\def\rw{{\textnormal{w}}}
\def\rx{{\textnormal{x}}}
\def\ry{{\textnormal{y}}}
\def\rz{{\textnormal{z}}}

\def\rvepsilon{{\mathbf{\epsilon}}}
\def\rvtheta{{\mathbf{\theta}}}
\def\rva{{\mathbf{a}}}
\def\rvb{{\mathbf{b}}}
\def\rvc{{\mathbf{c}}}
\def\rvd{{\mathbf{d}}}
\def\rve{{\mathbf{e}}}
\def\rvf{{\mathbf{f}}}
\def\rvg{{\mathbf{g}}}
\def\rvh{{\mathbf{h}}}
\def\rvu{{\mathbf{i}}}
\def\rvj{{\mathbf{j}}}
\def\rvk{{\mathbf{k}}}
\def\rvl{{\mathbf{l}}}
\def\rvm{{\mathbf{m}}}
\def\rvn{{\mathbf{n}}}
\def\rvo{{\mathbf{o}}}
\def\rvp{{\mathbf{p}}}
\def\rvq{{\mathbf{q}}}
\def\rvr{{\mathbf{r}}}
\def\rvs{{\mathbf{s}}}
\def\rvt{{\mathbf{t}}}
\def\rvu{{\mathbf{u}}}
\def\rvv{{\mathbf{v}}}
\def\rvw{{\mathbf{w}}}
\def\rvx{{\mathbf{x}}}
\def\rvy{{\mathbf{y}}}
\def\rvz{{\mathbf{z}}}

\def\erva{{\textnormal{a}}}
\def\ervb{{\textnormal{b}}}
\def\ervc{{\textnormal{c}}}
\def\ervd{{\textnormal{d}}}
\def\erve{{\textnormal{e}}}
\def\ervf{{\textnormal{f}}}
\def\ervg{{\textnormal{g}}}
\def\ervh{{\textnormal{h}}}
\def\ervi{{\textnormal{i}}}
\def\ervj{{\textnormal{j}}}
\def\ervk{{\textnormal{k}}}
\def\ervl{{\textnormal{l}}}
\def\ervm{{\textnormal{m}}}
\def\ervn{{\textnormal{n}}}
\def\ervo{{\textnormal{o}}}
\def\ervp{{\textnormal{p}}}
\def\ervq{{\textnormal{q}}}
\def\ervr{{\textnormal{r}}}
\def\ervs{{\textnormal{s}}}
\def\ervt{{\textnormal{t}}}
\def\ervu{{\textnormal{u}}}
\def\ervv{{\textnormal{v}}}
\def\ervw{{\textnormal{w}}}
\def\ervx{{\textnormal{x}}}
\def\ervy{{\textnormal{y}}}
\def\ervz{{\textnormal{z}}}

\def\rmA{{\mathbf{A}}}
\def\rmB{{\mathbf{B}}}
\def\rmC{{\mathbf{C}}}
\def\rmD{{\mathbf{D}}}
\def\rmE{{\mathbf{E}}}
\def\rmF{{\mathbf{F}}}
\def\rmG{{\mathbf{G}}}
\def\rmH{{\mathbf{H}}}
\def\rmI{{\mathbf{I}}}
\def\rmJ{{\mathbf{J}}}
\def\rmK{{\mathbf{K}}}
\def\rmL{{\mathbf{L}}}
\def\rmM{{\mathbf{M}}}
\def\rmN{{\mathbf{N}}}
\def\rmO{{\mathbf{O}}}
\def\rmP{{\mathbf{P}}}
\def\rmQ{{\mathbf{Q}}}
\def\rmR{{\mathbf{R}}}
\def\rmS{{\mathbf{S}}}
\def\rmT{{\mathbf{T}}}
\def\rmU{{\mathbf{U}}}
\def\rmV{{\mathbf{V}}}
\def\rmW{{\mathbf{W}}}
\def\rmX{{\mathbf{X}}}
\def\rmY{{\mathbf{Y}}}
\def\rmZ{{\mathbf{Z}}}

\def\ermA{{\textnormal{A}}}
\def\ermB{{\textnormal{B}}}
\def\ermC{{\textnormal{C}}}
\def\ermD{{\textnormal{D}}}
\def\ermE{{\textnormal{E}}}
\def\ermF{{\textnormal{F}}}
\def\ermG{{\textnormal{G}}}
\def\ermH{{\textnormal{H}}}
\def\ermI{{\textnormal{I}}}
\def\ermJ{{\textnormal{J}}}
\def\ermK{{\textnormal{K}}}
\def\ermL{{\textnormal{L}}}
\def\ermM{{\textnormal{M}}}
\def\ermN{{\textnormal{N}}}
\def\ermO{{\textnormal{O}}}
\def\ermP{{\textnormal{P}}}
\def\ermQ{{\textnormal{Q}}}
\def\ermR{{\textnormal{R}}}
\def\ermS{{\textnormal{S}}}
\def\ermT{{\textnormal{T}}}
\def\ermU{{\textnormal{U}}}
\def\ermV{{\textnormal{V}}}
\def\ermW{{\textnormal{W}}}
\def\ermX{{\textnormal{X}}}
\def\ermY{{\textnormal{Y}}}
\def\ermZ{{\textnormal{Z}}}

\def\vzero{{\bm{0}}}
\def\vone{{\bm{1}}}
\def\vmu{{\bm{\mu}}}
\def\vtheta{{\bm{\theta}}}
\def\va{{\bm{a}}}
\def\vb{{\bm{b}}}
\def\vc{{\bm{c}}}
\def\vd{{\bm{d}}}
\def\ve{{\bm{e}}}
\def\vf{{\bm{f}}}
\def\vg{{\bm{g}}}
\def\vh{{\bm{h}}}
\def\vi{{\bm{i}}}
\def\vj{{\bm{j}}}
\def\vk{{\bm{k}}}
\def\vl{{\bm{l}}}
\def\vm{{\bm{m}}}
\def\vn{{\bm{n}}}
\def\vo{{\bm{o}}}
\def\vp{{\bm{p}}}
\def\vq{{\bm{q}}}
\def\vr{{\bm{r}}}
\def\vs{{\bm{s}}}
\def\vt{{\bm{t}}}
\def\vu{{\bm{u}}}
\def\vv{{\bm{v}}}
\def\vw{{\bm{w}}}
\def\vx{{\bm{x}}}
\def\vy{{\bm{y}}}
\def\vz{{\bm{z}}}

\def\evalpha{{\alpha}}
\def\evbeta{{\beta}}
\def\evepsilon{{\epsilon}}
\def\evlambda{{\lambda}}
\def\evomega{{\omega}}
\def\evmu{{\mu}}
\def\evpsi{{\psi}}
\def\evsigma{{\sigma}}
\def\evtheta{{\theta}}
\def\eva{{a}}
\def\evb{{b}}
\def\evc{{c}}
\def\evd{{d}}
\def\eve{{e}}
\def\evf{{f}}
\def\evg{{g}}
\def\evh{{h}}
\def\evi{{i}}
\def\evj{{j}}
\def\evk{{k}}
\def\evl{{l}}
\def\evm{{m}}
\def\evn{{n}}
\def\evo{{o}}
\def\evp{{p}}
\def\evq{{q}}
\def\evr{{r}}
\def\evs{{s}}
\def\evt{{t}}
\def\evu{{u}}
\def\evv{{v}}
\def\evw{{w}}
\def\evx{{x}}
\def\evy{{y}}
\def\evz{{z}}

\def\mA{{\bm{A}}}
\def\mB{{\bm{B}}}
\def\mC{{\bm{C}}}
\def\mD{{\bm{D}}}
\def\mE{{\bm{E}}}
\def\mF{{\bm{F}}}
\def\mG{{\bm{G}}}
\def\mH{{\bm{H}}}
\def\mI{{\bm{I}}}
\def\mJ{{\bm{J}}}
\def\mK{{\bm{K}}}
\def\mL{{\bm{L}}}
\def\mM{{\bm{M}}}
\def\mN{{\bm{N}}}
\def\mO{{\bm{O}}}
\def\mP{{\bm{P}}}
\def\mQ{{\bm{Q}}}
\def\mR{{\bm{R}}}
\def\mS{{\bm{S}}}
\def\mT{{\bm{T}}}
\def\mU{{\bm{U}}}
\def\mV{{\bm{V}}}
\def\mW{{\bm{W}}}
\def\mX{{\bm{X}}}
\def\mY{{\bm{Y}}}
\def\mZ{{\bm{Z}}}
\def\mBeta{{\bm{\beta}}}
\def\mPhi{{\bm{\Phi}}}
\def\mLambda{{\bm{\Lambda}}}
\def\mSigma{{\bm{\Sigma}}}

\DeclareMathAlphabet{\mathsfit}{\encodingdefault}{\sfdefault}{m}{sl}
\SetMathAlphabet{\mathsfit}{bold}{\encodingdefault}{\sfdefault}{bx}{n}
\newcommand{\tens}[1]{\bm{\mathsfit{#1}}}
\def\tA{{\tens{A}}}
\def\tB{{\tens{B}}}
\def\tC{{\tens{C}}}
\def\tD{{\tens{D}}}
\def\tE{{\tens{E}}}
\def\tF{{\tens{F}}}
\def\tG{{\tens{G}}}
\def\tH{{\tens{H}}}
\def\tI{{\tens{I}}}
\def\tJ{{\tens{J}}}
\def\tK{{\tens{K}}}
\def\tL{{\tens{L}}}
\def\tM{{\tens{M}}}
\def\tN{{\tens{N}}}
\def\tO{{\tens{O}}}
\def\tP{{\tens{P}}}
\def\tQ{{\tens{Q}}}
\def\tR{{\tens{R}}}
\def\tS{{\tens{S}}}
\def\tT{{\tens{T}}}
\def\tU{{\tens{U}}}
\def\tV{{\tens{V}}}
\def\tW{{\tens{W}}}
\def\tX{{\tens{X}}}
\def\tY{{\tens{Y}}}
\def\tZ{{\tens{Z}}}


\def\gA{{\mathcal{A}}}
\def\gB{{\mathcal{B}}}
\def\gC{{\mathcal{C}}}
\def\gD{{\mathcal{D}}}
\def\gE{{\mathcal{E}}}
\def\gF{{\mathcal{F}}}
\def\gG{{\mathcal{G}}}
\def\gH{{\mathcal{H}}}
\def\gI{{\mathcal{I}}}
\def\gJ{{\mathcal{J}}}
\def\gK{{\mathcal{K}}}
\def\gL{{\mathcal{L}}}
\def\gM{{\mathcal{M}}}
\def\gN{{\mathcal{N}}}
\def\gO{{\mathcal{O}}}
\def\gP{{\mathcal{P}}}
\def\gQ{{\mathcal{Q}}}
\def\gR{{\mathcal{R}}}
\def\gS{{\mathcal{S}}}
\def\gT{{\mathcal{T}}}
\def\gU{{\mathcal{U}}}
\def\gV{{\mathcal{V}}}
\def\gW{{\mathcal{W}}}
\def\gX{{\mathcal{X}}}
\def\gY{{\mathcal{Y}}}
\def\gZ{{\mathcal{Z}}}

\def\sA{{\mathbb{A}}}
\def\sB{{\mathbb{B}}}
\def\sC{{\mathbb{C}}}
\def\sD{{\mathbb{D}}}
\def\sF{{\mathbb{F}}}
\def\sG{{\mathbb{G}}}
\def\sH{{\mathbb{H}}}
\def\sI{{\mathbb{I}}}
\def\sJ{{\mathbb{J}}}
\def\sK{{\mathbb{K}}}
\def\sL{{\mathbb{L}}}
\def\sM{{\mathbb{M}}}
\def\sN{{\mathbb{N}}}
\def\sO{{\mathbb{O}}}
\def\sP{{\mathbb{P}}}
\def\sQ{{\mathbb{Q}}}
\def\sR{{\mathbb{R}}}
\def\sS{{\mathbb{S}}}
\def\sT{{\mathbb{T}}}
\def\sU{{\mathbb{U}}}
\def\sV{{\mathbb{V}}}
\def\sW{{\mathbb{W}}}
\def\sX{{\mathbb{X}}}
\def\sY{{\mathbb{Y}}}
\def\sZ{{\mathbb{Z}}}

\def\emLambda{{\Lambda}}
\def\emA{{A}}
\def\emB{{B}}
\def\emC{{C}}
\def\emD{{D}}
\def\emE{{E}}
\def\emF{{F}}
\def\emG{{G}}
\def\emH{{H}}
\def\emI{{I}}
\def\emJ{{J}}
\def\emK{{K}}
\def\emL{{L}}
\def\emM{{M}}
\def\emN{{N}}
\def\emO{{O}}
\def\emP{{P}}
\def\emQ{{Q}}
\def\emR{{R}}
\def\emS{{S}}
\def\emT{{T}}
\def\emU{{U}}
\def\emV{{V}}
\def\emW{{W}}
\def\emX{{X}}
\def\emY{{Y}}
\def\emZ{{Z}}
\def\emSigma{{\Sigma}}

\newcommand{\etens}[1]{\mathsfit{#1}}
\def\etLambda{{\etens{\Lambda}}}
\def\etA{{\etens{A}}}
\def\etB{{\etens{B}}}
\def\etC{{\etens{C}}}
\def\etD{{\etens{D}}}
\def\etE{{\etens{E}}}
\def\etF{{\etens{F}}}
\def\etG{{\etens{G}}}
\def\etH{{\etens{H}}}
\def\etI{{\etens{I}}}
\def\etJ{{\etens{J}}}
\def\etK{{\etens{K}}}
\def\etL{{\etens{L}}}
\def\etM{{\etens{M}}}
\def\etN{{\etens{N}}}
\def\etO{{\etens{O}}}
\def\etP{{\etens{P}}}
\def\etQ{{\etens{Q}}}
\def\etR{{\etens{R}}}
\def\etS{{\etens{S}}}
\def\etT{{\etens{T}}}
\def\etU{{\etens{U}}}
\def\etV{{\etens{V}}}
\def\etW{{\etens{W}}}
\def\etX{{\etens{X}}}
\def\etY{{\etens{Y}}}
\def\etZ{{\etens{Z}}}

\newcommand{\pdata}{p_{\rm{data}}}
\newcommand{\ptrain}{\hat{p}_{\rm{data}}}
\newcommand{\Ptrain}{\hat{P}_{\rm{data}}}
\newcommand{\pmodel}{p_{\rm{model}}}
\newcommand{\Pmodel}{P_{\rm{model}}}
\newcommand{\ptildemodel}{\tilde{p}_{\rm{model}}}
\newcommand{\pencode}{p_{\rm{encoder}}}
\newcommand{\pdecode}{p_{\rm{decoder}}}
\newcommand{\precons}{p_{\rm{reconstruct}}}

\newcommand{\laplace}{\mathrm{Laplace}} 

\newcommand{\E}{\mathbb{E}}
\newcommand{\Ls}{\mathcal{L}}
\newcommand{\R}{\mathbb{R}}
\newcommand{\emp}{\tilde{p}}
\newcommand{\lr}{\alpha}
\newcommand{\reg}{\lambda}
\newcommand{\rect}{\mathrm{rectifier}}
\newcommand{\softmax}{\mathrm{softmax}}
\newcommand{\sigmoid}{\sigma}
\newcommand{\softplus}{\zeta}
\newcommand{\KL}{D_{\mathrm{KL}}}
\newcommand{\Var}{\mathrm{Var}}
\newcommand{\standarderror}{\mathrm{SE}}
\newcommand{\Cov}{\mathrm{Cov}}
\newcommand{\normlzero}{L^0}
\newcommand{\normlone}{L^1}
\newcommand{\normltwo}{L^2}
\newcommand{\normlp}{L^p}
\newcommand{\normmax}{L^\infty}

\newcommand{\parents}{Pa} 

\DeclareMathOperator*{\argmax}{arg\,max}
\DeclareMathOperator*{\argmin}{arg\,min}

\DeclareMathOperator{\sign}{sign}
\DeclareMathOperator{\Tr}{Tr}
\let\ab\allowbreak
 \usepackage{natbib} \bibliographystyle{plainnat}
\renewcommand{\bibsection}{\subsubsection*{References}}


\usepackage{url}
\usepackage[utf8]{inputenc}
\usepackage{etoolbox}
\usepackage{amsmath, amsthm}
\usepackage{amsfonts, amssymb}
\usepackage{bm}
\usepackage{ifthen}
\usepackage{letltxmacro}
\usepackage{nicefrac}
\usepackage{xstring}
\usepackage{pgf}
\usepackage{tikz}
\usetikzlibrary{arrows,automata}
\usetikzlibrary{er,positioning,bayesnet}
\usepackage[linesnumbered,ruled]{algorithm2e}
\renewcommand{\mathbf}[1]{\bm{#1}}
\usepackage{mathrsfs}
\usepackage{graphicx}
\usepackage{framed}
\newcommand{\todot}[1]{\textbf{\color{red!75!black}TODO: #1}}
\usepackage{todo}
\newcommand{\attention}[1]{{\color{blue!70!black} #1}}
\newcommand{\fixme}[1]{{\color{red!80!black} #1}}
\usepackage{booktabs,siunitx}
\usepackage{caption}
\usepackage{subcaption}
\usepackage{wrapfig}
\usepackage{cleveref}
\newcommand{\arxiv}[1]{\href{https://arxiv.org/abs/#1}{arXiv:#1}}
\newcommand{\biorxiv}[1]{\href{https://doi.org/10.1101/#1}{bioR$\chi{}$iv:#1}}
\newtheorem{theorem}{Theorem}[section]
\newtheorem{observation}[theorem]{Observation}
\newtheorem{claim}[theorem]{Claim}
\newtheorem{condition}[theorem]{Condition}
\newtheorem{example}[theorem]{Example}
\newtheorem{fact}[theorem]{Fact}
\newtheorem{lemma}[theorem]{Lemma}
\newtheorem{corollary}[theorem]{Corollary}
\newtheorem{proposition}[theorem]{Proposition}
\newtheorem{consequence}[theorem]{Consequence}
\newtheorem{question}[theorem]{Question}
\newtheorem{definition}[theorem]{Definition}
\newtheorem{remark}[theorem]{Remark}
\newtheorem{problem}[theorem]{Problem}
\crefname{theorem}{Theorem}{Theorems}
\crefname{observation}{Observation}{Observations}
\crefname{claim}{Claim}{Claims}
\crefname{algorithm}{Algorithm}{Algorithms}
\crefname{condition}{Condition}{Conditions}
\crefname{example}{Example}{Examples}
\crefname{fact}{Fact}{Facts}
\crefname{lemma}{Lemma}{Lemmas}
\crefname{corollary}{Corollary}{Corollaries}
\crefname{consequence}{Consequence}{Consequences}
\crefname{definition}{Definition}{Definitions}
\crefname{remark}{Remark}{Remarks}
\crefname{problem}{Problem}{Problems}
\crefname{proposition}{Proposition}{Propositions}
\crefname{section}{Section}{Sections}
\crefname{appendix}{Supplementary Material Section}{Supplementary Material Sections}

\newcommand{\abs}[1]{\ensuremath{\left|#1\right|}}
\newcommand{\norm}[2][]{\ensuremath{\Vert #2 \Vert_{#1}}}
\newcommand{\diff}[2]{\frac{\text{d}#1}{\text{d}#2}}
\newcommand{\pdiff}[2]{\frac{\partial #1}{\partial #2}}
\newcommand{\grad}[1]{\nabla\left(#1\right)}
\renewcommand{\Pr}[2][]{\ensuremath{\mathbb{P}_{#1}\insq{#2}}}
\newcommand{\Po}[0]{\ensuremath{\mathrm{Po}}}
\newcommand{\ina}[1]{\left<#1\right>}
\newcommand{\inb}[1]{\left\{#1\right\}}
\newcommand{\inp}[1]{\left(#1\right)}
\newcommand{\insq}[1]{\left[#1\right]}
\makeatletter
\newcommand*{\defeq}{\mathrel{\rlap{\raisebox{0.3ex}{$\m@th\cdot$}}\raisebox{-0.3ex}{$\m@th\cdot$}}=}
\newcommand*{\eqdef}{=
  \mathrel{\rlap{\raisebox{0.3ex}{$\m@th\cdot$}}\raisebox{-0.3ex}{$\m@th\cdot$}}}
\makeatother
\newcommand{\nfrac}[3][]{\nicefrac[#1]{#2}{#3}}
\newcommand{\xfrac}[3][]{\nicefrac[#1]{#2}{#3}}
\renewcommand{\deg}[1]{\ensuremath{\mathrm{deg}\inp{#1}}}
\newcommand{\Z}[0]{\ensuremath{\mathbb{Z}}}
\newcommand{\I}[1]{\ensuremath{\insq{#1}}}
\newcommand{\F}[1]{\ensuremath{\mathbb{F}_{#1}}}
\newcommand{\N}[0]{\mathbb{N}}
\renewcommand{\emptyset}[0]{\varnothing}
\newcommand{\comp}[1]{\overline{#1}}
\newcommand{\poly}[1]{\ensuremath{\mathop{\mathrm{poly}}\inp{#1}}}
\newcommand{\etal}[0]{\emph{et al.}}
\renewcommand{\vec}[1]{\mathbf{#1}}
\newcommand{\T}[0]{\ensuremath{\intercal}}
\newcommand{\skel}[0]{\ensuremath{\text{skeleton}}}
\newcommand{\countAMO}[1]{\ensuremath{\textup{\#AMO}\inp{#1}}}

\newcommand{\undir}[2]{\ensuremath{{#1} - {#2}}}

\hypersetup{hidelinks} 
\title{Counting Background Knowledge Consistent Markov Equivalent Directed  Acyclic Graphs \\ (Supplementary Material)}

\author[1]{Vidya Sagar Sharma}
\affil[1]{School of Technology and Computer Science\\
  Tata Institute of Fundamental Research, Mumbai\\
  Maharashtra, India
}







\begin{document}
\onecolumn \maketitle
\renewcommand\thesection{\Alph{section}}
\renewcommand\thesubsection{\thesection.\Alph{subsection}}
\section{Graph terminology}
\label{app:graph-terminology}
\textbf{Graphs and graph unions.} 
We mostly follow the graph theory terminology
of \cite{andersson1997characterization}.
A graph is \emph{undirected} if all its edges are
undirected, \emph{directed} if all its edges are \emph{directed}, and
\emph{partially directed} if it contains both directed and undirected edges. A
directed graph that has no directed cycle is called a \emph{directed acyclic
  graph} (DAG). A generalization of this idea is that of \emph{chain graphs}: a
partially directed graph is called a chain graph if it has no cycle which
contains (i) at least one directed edge, and (ii) in which all directed edges
are directed in the same direction as one moves  along the cycle. We denote the
neighbors of a vertex $v$ in a graph $G$ as $N_G(v)$, and an induced subgraph of
$G$ on a set $X\subseteq V$ is denoted as $G[X]$. 
The
\emph{graph union} (which we just call ``union'') $G_1\cup G_2$ includes
vertices and edges present in any one of $G_1$ or $G_2$, i.e., $V_{G_1\cup G_2} = V_{G_1} \cup V_{G_2}$, and $E_{G_1\cup G_2} = E_{G_1} \cup E_{G_2}$.  The \emph{skeleton} of
a partially directed graph $G$ is an undirected version of $G$ which we get by
ignoring the direction of all the edges: in particular, note that the {skeleton} of
a partially directed graph is also the graph union of \emph{all} the partially
directed graphs with the same skeleton as $G$.  A \emph{v-structure} (or
\emph{unshielded collider}) in a partially directed graph $G$ is an ordered
triple of vertices $(a,b,c)$ of $G$ which induce the subgraph
$a\rightarrow b \leftarrow c$ in $G$.

\textbf{Cliques, separators, chordal graphs, and UCCG.} A \emph{clique} is a set of pairwise adjacent vertices for a graph. For a graph $G$,  $u$ and $v$ are said to be pairwise adjacent to each other if $(u,v),(v,u) \in E_G$, i.e, $u-v\in E_G$.
For an undirected graph $G$, a set $S\subset V_G$ is an $x$-$y$ \emph{separator} for two non-adjacent vertices $x$ and $y$ if $x$ and $y$ are in two different undirected connected components of $G[V_G\setminus S]$.  $S$ is said to be a \emph{minimal $x$-$y$ separator} if no proper subset of $S$ separates $x$ and $y$.  A set $S$ is said to be a \emph{minimal vertex separator} if there exist vertices $x$ and $y$ for which $S$ is a minimal $x$-$y$ separator.\footnote{\citet{wienobst2020polynomial} refer to these objects as \emph{minimal separators}, but we follow here the terminology of \cite[Section 2.2]{blair1993introduction} for consistency.} An undirected graph $G$ is \emph{chordal} if, for any cycle of length $4$ or more of $G$, there exist two non-adjacent vertices of the cycle which are adjacent in
$G$.  We refer to an undirected connected chordal graph by the abbreviation
\emph{UCCG}.

\textbf{Clique trees.} A \emph{rooted clique tree} of a UCCG $G$ is a
tuple $\mathcal{T}=(T, R)$, where $T$ is a rooted tree (rooted at the node $R$) whose nodes are the maximal cliques of $G$, and which is such that the set $\{C: v\in C\}$ is connected in $T$, for all $v\in V_G$.
Clique trees satisfy the important \emph{clique-intersection property}: if $C_1,C_2,C\in V_T$ and $C$ is on the (unique) path between $C_1$ and $C_2$ in the tree $T$, then $C_1\cap C_2 \subset C$~(see, e.g., \citet{blair1993introduction}).  Further, a set $S\subset V_G$ is a minimal vertex separator in $G$ if, and only if, there are two adjacent nodes $C_1, C_2\in V_T$ such that $C_1 \cap C_2 = S$ \citep[Theorem 4.3]{blair1993introduction}.  A clique tree for a UCCG $G$ can be constructed in polynomial time.  For more details on the above results on chordal graphs and clique trees, we refer to the survey of \citet{blair1993introduction}. \section{Proofs omitted from Section~\ref{sec:main-result}}
\label{sec:app-main-result}
\begin{observation}
\label{obs:if-G-is-not-K-consistent}
If $G$ is not $\mathcal{K}$-consistent then $\#AMO(G,\mathcal{K})=0$. 
\end{observation}
\begin{proof}
   If $G$ is not $\mathcal{K}$-consistent then  there exists an edge $u\rightarrow v \in \mathcal{K}$ such that $v\rightarrow u \in E_G$, and all the AMOs of $G$ have the edge $v\rightarrow u$. This shows that no AMO of $G$ is $\mathcal{K}$-consistent.
\end{proof}
We can verify in polynomial time that $G$ is $\mathcal{K}$-consistent or not, by checking the existence of an edge $u\rightarrow v \in \mathcal{K}$ for which $v\rightarrow u$ is a directed edge in $G$. This is why for further discussion we assume that $G$ is $\mathcal{K}$-consistent.

\cref{lem:Counting-AMO-reduction} is a direct consequence of the following
lemma.

\begin{lemma}
\label{lem:AMO-reduction}
Let $G$ be an MEC consistent with a given background knowledge $\mathcal{K}$, and let $G_d$ be the directed subgraph of $G$. Then, $\alpha\in AMO(G,\mathcal{K})$ if, and only if, (i) for each undirected chordal component $H$ of $G$, $\alpha[V_H]$ is a $\mathcal{K}$-consistent AMO of $H$ and (ii) $\alpha$ is a union of $G_d$ and $\bigcup_{H}{\alpha[V_H]}$.
\end{lemma}

\begin{proof}
If $G$ is $\mathcal{K}$-consistent then each directed edge of $G$ is $\mathcal{K}$-consistent, i.e., $G_d$ is $\mathcal{K}$-consistent.
  \cite{andersson1997characterization} show that for an MEC $G$, an AMO of $G$ can be constructed by choosing an AMO from each one of the chordal components of  $G$ and taking the union of the directed subgraph of $G$ and the chosen AMOs of  the chordal components.  For every undirected connected chordal component $H$  of $G$, let us pick a $\mathcal{K}$-consistent AMO  of $H$. Then, the union of all the picked AMOs and $G_d$ is a $\mathcal{K}$-consistent AMO of  $G$.  Also if $\alpha$ is an AMO of $G$ then for all undirected connected chordal components $H$ of $G$, $\alpha[V_H]$ is $\mathcal{K}$-consistent. And $\alpha$ must be a union of $G_d$ and the union of all the $\alpha[V_H]$.  This proves \cref{lem:AMO-reduction}.
\end{proof}

 \section{Definition of $C_{\alpha}$}
\label{supplementary-sec:definition-C-alpha}
Here, we define $C_{\alpha}$.  We start with defining a few preliminary terms  flower, $<_{\mathcal{T}}$, and $<_{\alpha}$ that we use to define $C_{\alpha}$.

\begin{definition}[Flowers and bouquets, \cite{wienobst2020polynomial},
  Definition 4]
\label{def:flower}
Let $G$ be a UCCG. An \emph{$S$-flower} for a minimal vertex separator $S$ of
$G$ is a maximal subset $F$ of the set of maximal cliques of $G$ containing $S$
such that $\bigcup_{C\in F}C$ is connected in the induced subgraph
$G[V\setminus S]$. The \emph{bouquet} $B(S)$ of a minimal separator $S$ is the set of
all $S$-flowers.
\end{definition}

\begin{definition}[The $<_{\mathcal{T}}$ order for a rooted clique tree
  $\mathcal{T}$, Section 5 of \cite{wienobst2020polynomial}]
\label{def:ordering-of-flowers}
Let $G$ be a UCCG, $S$ be a minimal vertex separator of $G$, $F_1,F_2\in B(S)$, and $\mathcal{T}=(T,R)$ be a rooted clique tree of $G$. \emph{$F_1 <_{\mathcal{T}} F_2$} if $F_1$ contains a node on the unique path from $R$ to $F_2$. 
\end{definition}

\begin{definition}[The $<_{\alpha}$ order for an AMO
  $\alpha$, Section 5 of \cite{wienobst2020polynomial}]
\label{def:ordering-of-cliques}
Let $G$ be a UCCG, $\mathcal{T}=(T,R)$ be a rooted clique tree of $G$, and
$\alpha$ be an AMO of $G$.  We use $<_{\mathcal{T}}$ to define a partial order
\emph{$<_{\alpha}$} on the set of maximal cliques that represent $\alpha$, as
follows: $C_1 <_{\alpha} C_2$ if, and only if, $(i)$ $C_1\cap C_2 =S$ is a
minimal vertex separator, $(ii)$ $C_1$ and $C_2$ are elements of distinct
$S$-flowers $F_1,F_2\in B(S)$, respectively, and $(iii)$ $F_1 <_T F_2$.
\end{definition}

The following result of \cite{wienobst2020polynomial} establishes the requisite property of the ordering $<_{\alpha}$.
\begin{lemma}[\cite{wienobst2020polynomial}, Claim 1]
\label{lem:C-alpha}
  Let $G$ be a UCCG, $\alpha$ an AMO of $G$, and $\mathcal{T}=(T,R)$ a rooted
  clique tree of $G$.  Consider the order $<_{\alpha}$ defined on the maximal
  cliques $\mathcal{T}$. Then, there always exists a unique least maximal
  clique with respect to $<_{\alpha}$. 
\end{lemma} \section{Proofs omitted from Section~\ref{sec:reduction-of-the-problem}}
\label{sec:app-lbfs}

\begin{proof}[Proof of \cref{lem:partition-of-set-of-bkc-AMOs}]
  The claim follows from the fact that for each AMO $\alpha$ of $G$,
  $C_{\alpha}$ was canonically chosen from the set of maximal cliques representing
  $\alpha$.
\end{proof}





\begin{proof}[Proof of \cref{lem:direction of-edges-of-GC-in-alg}]
Proof of \cref{item-1-of-direction of-edges-of-G^C-in-alg}:
For any edge $u-v \in E_G$, if $u\in C$ and $v\notin C$ then for any AMO that is represented by an LBFS ordering that starts with $C$, $u\rightarrow v$ is a directed edge in the AMO (see ``Representation of an AMO'' of \cref{sec:preliminaries}). This further implies for any edge $u-v \in E_G$, if $u\in C$ and $v\notin C$ then $u\rightarrow v$ is a directed edge in $G^C$, as $G^C$ is the union of all the AMOs of $G$ that can be represented by an LBFS ordering that starts with $C$. This proves \cref{item-1-of-direction of-edges-of-G^C-in-alg}.

Proof of \cref{item-2-of-direction of-edges-of-G^C-in-alg}:
We prove \cref{item-2-of-direction of-edges-of-G^C-in-alg} of \cref{lem:direction of-edges-of-GC-in-alg} using induction on the size of $\mathcal{L}$. 

    \textbf{Base Case: $|\mathcal{L}|=0$.} In this case, \cref{item-2-of-direction of-edges-of-G^C-in-alg} of \cref{lem:direction of-edges-of-GC-in-alg} is vacuously true. 

    Let \cref{item-2-of-direction of-edges-of-G^C-in-alg} is true when $|\mathcal{L}|=l\geq 0$. We show that \cref{item-2-of-direction of-edges-of-G^C-in-alg} is true even for $|\mathcal{L}|=l+1$.

    Let at some iteration of \cref{alg:AMO-Union-K}, $\mathcal{L}=\{X_1,X_2,\ldots,X_l,X_{l+1}\}$. From the induction hypothesis, for an edge $u-v \in E_G$, if $u\in X_{i}$ and $v\notin C\cup X_1\cup X_2 \cup \ldots \cup X_i$ then $u\rightarrow v \in G^C$, when $i\leq l$. Let there exists an edge $u-v \in  E_G$ such that $u\in X_{l+1}$ and $v\notin C\cup X_1\cup X_2 \cup \ldots \cup X_{l+1}$. This means there must exist a vertex $x\in C\cup X_1\cup X_2 \cup \ldots \cup X_l$ for which $x-u\in E_G$ and $v-u \notin E_G$, due to which $u$ and $v$ moves to two different sets in $\mathcal{S}$, because initially $u$ and $v$ are in the same set $V\setminus C$. From the induction hypothesis, $x\rightarrow u \in G^C$. This implies all the AMOs that are represented by $C$ have edge $x\rightarrow u$. This further implies all the AMOs that are represented by $C$ have edge $u\rightarrow v$, as  $v\rightarrow u$ creates an immorality $x\rightarrow u \leftarrow v$ (from the definition of AMO, there cannot be a v-structure in an AMO of $G$). This proves \cref{item-2-of-direction of-edges-of-G^C-in-alg}.

Proof of \cref{item-3-of-direction-of-edges-of-G^C-in-alg}:
    Suppose $u,v \in X_{i}$, and $u-v\in E_G$. Let there exists an AMO $\alpha$ that is represented by $C$ and has the edge $u\rightarrow v$. Let $\tau_1$ be an LBFS ordering of $G$ that starts with $C$, and represents $\alpha$. We can construct another LBFS ordering $\tau_2$ that also starts with $C$ such that while picking the vertices of $X_{i}$, we pick $v$ before $u$. The AMO corresponding to this LBFS ordering has the edge $v\rightarrow u$. Since $G^C$ is the union of all the AMOs of $G$ that is represented by  $C$. This implies $G^C$ has the undirected edge $u-v$. This proves \cref{item-3-of-direction-of-edges-of-G^C-in-alg}.

Proof of \cref{item-3b-of-direction-of-edges-of-G^C-in-alg}:
If $u,v \in C$ then $u-v \in E_G$, because $C$ is a clique of $G$. Suppose an AMO $\alpha$ is represented by $C$ and has the  edge $u \rightarrow v$. Then, $\alpha$ must be  represented by an LBFS ordering $\tau_1$ that starts with a permutation $\pi_1(C)$ of $C$ such that $u$ comes before $v$ in $\pi_1(C)$. Let $\pi_2(C)$ be a permutation of $C$ such that $v$ comes before $u$ in $\pi_2(C)$. Let us construct an LBFS ordering $\tau_2$ by replacing $\pi_1(C)$ with $\pi_2(C)$ in $\tau_1$. Let $\beta$ be the AMO represented by the LBFS ordering $\tau_2$. $\beta$ also represented by $C$ and has the edge $v\rightarrow u$. Since $G^C$ is the union of all the AMOs of $G$ that is represented by $C$, this implies $u-v$ is an undirected edge in $G^C$, because $u\rightarrow v\in \alpha$, and $v\rightarrow u\in \beta$, and both are represented by $C$. This proves \cref{item-3b-of-direction-of-edges-of-G^C-in-alg}.  


    
Proof of \cref{item-4-of-direction-of-edges-of-G^C-in-alg}: From \cref{item-1-of-direction of-edges-of-G^C-in-alg,item-2-of-direction of-edges-of-G^C-in-alg}, all the edges with only one endpoint in $X_l$ are directed in $G^C$. And, from \cref{item-3-of-direction-of-edges-of-G^C-in-alg}, all the edges with both of the endpoints in $X_l$ are undirected in $G^C$. This further implies all the undirected connected components of $G[X_i]$ are undirected connected components of $G^C$.  
\end{proof}


 \begin{proof}[Proof of \cref{lem:output-of-Alg-1}]
 At first, we want to recall that
\cref{alg:AMO-Union-K} is background aware version of the modified LBFS algorithm of \cite{wienobst2020polynomial}. As discussed in the main paper, we do not change any line from the LBFS algorithm of \cite{wienobst2020polynomial}; the only modifications we do to their LBFS algorithm are (a) introduction of \texttt{flag}, at \cref{alg:flag-init}, which is used to check the $\mathcal{K}$-consistency of $G^C$, (b) lines \ref{alg:mod-if}-\ref{alg:mod-if-end}, which is used to update the value of \texttt{flag}, and (c) We also output the value of \texttt{flag} with $C_G(C)$. The output of \cref{alg:AMO-Union-K} has 2 components. The first component is the value of \texttt{flag}, and the second value is the value returned by the LBFS algorithm of \cite{wienobst2020polynomial}, which is $C_G(C)$. Thus, the only thing we need to verify is that the first component of our output, i.e., the value of \texttt{flag}, is  1 if $G^C$ is $\mathcal{K}$-consistent, and 0 if $G^C$ is not $\mathcal{K}$-consistent, which is equivalent to show that the value of \texttt{flag} returned by the algorithm is 0 if, and only if, $G^C$ is not $\mathcal{K}$-consistent (since the value of \texttt{flag} is either 0 or 1).

Suppose $G^C$ is not $\mathcal{K}$-consistent. Then, from the definition of $\mathcal{K}$-consistency of $G^C$ (\cref{def:bc-CGC}), there must exist an edge $v\rightarrow u$ in $G^C$ such that $u\rightarrow v \in \mathcal{K}$. From \cref{lem:direction of-edges-of-GC-in-alg}, if $v\rightarrow u \in G^C$ then either (a) $v\in C$ and $u\notin C$, or (b) at some iteration, when $\mathcal{L}=\{X_1, X_2, \ldots , X_l\}$, $v\in X_l$ and $u\notin C\cup X_1\cup X_2 \cup \ldots \cup X_l$. In both of the cases,  $v$ must be picked before $u$ at line-\ref{alg:mod1}, as $v$ is present in a set that comes before the set in which $u$ is present.  At the iteration when $v$ is picked,  the algorithm finds the edge $u\rightarrow v$  that obeys the condition stated in line-\ref{alg:mod-if}. This further sets the value of \texttt{flag} to 0. From the construction of the algorithm, once the value of \texttt{flag} sets to 0, it remains at 0. This shows that if $G^C$ is not $\mathcal{K}$-consistent then the value of \texttt{flag} is 0.

Now suppose the \texttt{flag} value returned by the algorithm is 0. At line-\ref{alg:flag-init}, the value of \texttt{flag} is initialized with 1. If 
\texttt{flag} value returned by the algorithm is 0 then there must exist an edge $u\rightarrow v \in \mathcal{K}$ (found at line-\ref{alg:mod-if}), which causes to change the value of \texttt{flag} to 0 at line-\ref{alg:mod-output-empty}. Since $u\rightarrow v$ obeys the condition state at line-\ref{alg:mod-if}, we can certainly say that the iteration when $v$ is picked at the line-\ref{alg:mod1}, $u$ must be neither in $C$ nor in any set of $\mathcal{L}$. And, $v$ must be either in $C$, if $\mathcal{L}=\emptyset$, or in $X_l$, if $\mathcal{L}=\{X_1, X_2, \ldots , X_l \}$ such that $l\geq 1$. From \cref{lem:direction of-edges-of-GC-in-alg}, $v\rightarrow u$ must be a directed edge in $G^C$. This makes $G^C$ inconsistent with $\mathcal{K}$, as $u\rightarrow v \in \mathcal{K}$ (\cref{def:bc-CGC}). This shows if the value of \texttt{flag} returned by the algorithm is 0 then  $G^C$ is not $\mathcal{K}$-consistent. This completes the proof.
\end{proof}

\begin{proof}[Proof of \cref{lem:uniqueness-of-permutation-of-clique}]
If $\alpha$ is a member of AMO$(G,\pi_1(C))$ and AMO$(G,\pi_2(C))$ both, for two different permutations $\pi_1(C)$ and $\pi_2(C)$, then there must exist two vertices $u,v\in C$ such that $u$ comes before $v$ in $\pi_1(C)$, and $v$ comes before $u$ in $\pi_2(C)$. Since $u$ and $v$ are members of the same clique, there exists an edge $u-v \in E_G$. And, since the AMO is a member of both AMO$(G,\pi_1(C))$, and AMO$(G,\pi_2(C))$ it should have both $u\rightarrow v$ and $v\rightarrow u$, which is not possible. This implies there exists a unique permutation $\pi(C)$ of $C$ that represents $\alpha$.
\end{proof}

\begin{proof}[Proof of \cref{lem:identification-of-C-alpha}]
Claims 1 and 2 of \cite{wienobst2020polynomial} translate into  the ``only if'' part of \cref{lem:identification-of-C-alpha}, while Claim 3 of \cite{wienobst2020polynomial} translates into the ``if'' part of \cref{lem:identification-of-C-alpha}.  We give details of the translation below.
{\newcommand{\pre}{<_{\alpha}}
Given an AMO $\alpha$, \cite{wienobst2020polynomial} define a partial order $\prec_\alpha$ (as described above) on the set of maximal cliques that represent $\alpha$.  Claim 1 of \cite{wienobst2020polynomial} shows that there exists a unique maximal clique representing $\alpha$ (which we name as $C_{\alpha}$) such that for any maximal clique $C \neq C_{\alpha}$ that represents $\alpha$, $C_{\alpha} \pre C$.  Claim 2 of \cite{wienobst2020polynomial} then translates immediately into the ``only if'' part of \cref{lem:identification-of-C-alpha}.

For the ``if'' part, we consider any maximal clique $C$ representing $\alpha$ and satisfying both the conditions of \cref{lem:identification-of-C-alpha}.  Suppose, if possible, that $C \neq C_{\alpha}$.  Then, from the above discussion, $C_\alpha \pre C$. The proof of Claim 3 (and the definition of $FP(C, \mathcal{T})$) then shows that if $\pi(C)$ is the permutation of $C$ representing $\alpha$, then there is a prefix $S$ of $\pi(C)$ of the form $C_i \cap C_j$ for some two adjacent cliques on the path from $R$ to $C$ in $T$.  This leads to a contradiction with item 2 of \cref{lem:identification-of-C-alpha}, and hense shows that $C \neq C_\alpha$ is not possible.
}
\end{proof}


For the proof of \cref{lem:formular-for-KT-consistent-permutaion}, we need the
 following observation of \citet{wienobst2020polynomial}.

\begin{observation}[{\citet{wienobst2020polynomial}, Proposition 1}]
  \label{lem:G-C-and-G-pi-C-is-same}
  For each permutation $\pi(C)$ of a maximal clique $C$ of $G$, all edges of $G^{\pi(C)}$ coincide with the edges of $G^{C}$, excluding the edges connecting the vertices in $C$.  In particular, $\mathcal{C}_G(\pi(C))=\mathcal{C}_G(C)$.
\end{observation}



\begin{proof}[Proof of \cref{lem:formular-for-KT-consistent-permutaion}]
    Let $G^C$ be $\mathcal{K}$-consistent, and $\pi(C)$ is a $(\mathcal{K}, \mathcal{T})$-consistent permutation of $C$. We show that the number of $\mathcal{K}$-consistent AMOs of $G$ that are canonically represented by $\pi(C)$, i.e., $|\{\alpha: \alpha \in \text{AMO}(G, \pi(C), \mathcal{K}) \text{ and } C = C_{\alpha} \}|$ equals $\Pi_{H\in \mathcal{C}_G(C)}{\#\text{AMO}(H, \mathcal{K}[H])}$. To prove this, we first show that if $\alpha$ is a $\mathcal{K}$-consistent AMO of $G$ that is canonically represented by $\pi(C)$ then  for any connected component $H$ of $\mathcal{C}_G(C)$, $\alpha[H]$ is $\mathcal{K}[H]$-consistent AMO of $H$. We also show that if we have a $\mathcal{K}[H]$-consistent AMO for each connected component $H$ of $\mathcal{C}_G(C)$ then we can construct a $\mathcal{K}$-consistent AMO of $G$ by combining them. This proves \cref{lem:formular-for-KT-consistent-permutaion}.

    We first show the first part.
    Let $\alpha$ be a $\mathcal{K}$-consistent AMO of $G$ that is canonically represented by $\pi(C)$. Then,  for any connected component $H$ of $\mathcal{C}_G(C)$, $\alpha[H]$ is $\mathcal{K}[H]$-consistent AMO of $H$. Otherwise, if for any connected component $H$ of $\mathcal{C}_G(C)$, $\alpha[H]$ is not $\mathcal{K}[H]$-consistent then there must exist an edge $u\rightarrow v \in \mathcal{K}[H]$ such that $v\rightarrow u \in \alpha[H]$. But, this implies $\alpha$ is not $\mathcal{K}$-consistent either, as if $u\rightarrow v \in \mathcal{K}[H]$ then $u\rightarrow v \in \mathcal{K}$, and if  $v \rightarrow u \in \alpha[H]$ then $v\rightarrow u \in \alpha$.

    We now show the other part. Let $H_1, H_2, \ldots, H_l$ are the undirected connected components of $\mathcal{C}_G(C)$, in the same order as we get as the output of \cref{alg:AMO-Union-K} for input $G, C$, and $\mathcal{K}$. For each $H_i \in \mathcal{C}_G(C)$, let we have a $\mathcal{K}[H_i]$-consistent AMO $D_i$, and ${\tau}_i$ be an LBFS ordering of $D_i$. Then, $\tau = \{\pi(C), {\tau}_1, {\tau}_2, \ldots , {\tau}_l\}$ is a $\mathcal{K}$-consistent LBFS ordering of $G$ starting with $\pi(C)$ that we can get from \cref{alg:AMO-Union-K}. The DAG $\alpha$ represented by $\tau$ is an AMO of $G$ represented by $\pi(C)$. And, since $\pi(C)$ is $(\mathcal{K}, \mathcal{T})$-consistent, from \cref{lem:identification-of-C-alpha}, $C = C_{\alpha}$. This implies $\alpha$ is a $\mathcal{K}$-consistent AMO of $G$ and is canonically represented by $\pi(C)$. This gives us a one-to-one mapping between the set of $\mathcal{K}$-consistent AMOs of $G$ that is canonically represented by $\pi(C)$, and the $\mathcal{K}[H]$-consistent AMOs of the connected components $H$ of $\mathcal{C}_G(C)$, which further implies the equality between the size of $\mathcal{K}$-consistent AMOs of $G$ that is canonically represented by $\pi(C)$ and $\Pi_{H\in \mathcal{C}_G(C)}{\#\text{AMO}(H, \mathcal{K}[H])}$.  This completes our proof.
\end{proof}

\begin{proof}[Proof of \cref{lem:final-counting-algorithm}]
    From \cref{lem:partition-of-set-of-bkc-AMOs}, $\#\text{AMO}(G,\mathcal{K}) = \sum_{C\in \Pi(G)}{|\{\alpha: \alpha \in \text{AMO}(G,\mathcal{K}) \text{ and } C=C_{\alpha}\}|}$. In \cref{sec:reduction-of-the-problem}, after defining $\mathcal{K}$-consistency of $G^C$ (\cref{def:bc-CGC}), we show that for any maximal clique $C$ of $G$, if $G^C$ is not $\mathcal{K}$-consistent then ${|\{\alpha: \alpha \in \text{AMO}(G,\mathcal{K}) \text{ and } C=C_{\alpha}\}|} = 0$. From \cref{lem:formular-for-KT-consistent-permutaion}, for any maximal clique $C$ of $G$, if $G^C$ is $\mathcal{K}$-consistent then for any $(\mathcal{K}, \mathcal{T})$-consistent permutation $\pi(C)$ of $C$, $|\{\alpha: \alpha \in \text{AMO}(G,\pi(C),\mathcal{K}) \text{ and }
C=C_{\alpha}\}|=\prod_{H\in \mathcal{C}_G(C)}{\#AMO(H,\mathcal{K}[H])}$. And, from \cref{lem:formular-for-non-KT-consistent-permutaion}, for any  permutation $\pi(C)$ of a maximal clique $C$ of $G$, if $\pi(C)$ is not a $(\mathcal{K}, \mathcal{T})$-consistent permutation of $C$ then $|\{\alpha: \alpha \in \text{AMO}(G,\pi(C),\mathcal{K}) \text{ and }
C=C_{\alpha}\}|=0$. This further implies for any maximal clique $C$ of $G$, if $G^C$ is $\mathcal{K}$-consistent then $|\{\alpha: \alpha \in \text{AMO}(G,\mathcal{K}) \text{ and } C=C_{\alpha}\}| = \Phi(C,FP(C,\mathcal{T}),\mathcal{K}[C]) \times
  {\prod_{H\in \mathcal{C}_G(C)}{\#AMO(H,\mathcal{K}[H])}}$, where  $\Phi(C,FP(C,\mathcal{T}),\mathcal{K}[C])$ is the number of $(\mathcal{K}, \mathcal{T})$-consistent permutations of a maximal clique $C$ of $G$ (from \cref{def:background-consistent-pi-C,def:phi-S-R-K}). All these things further imply 
$\#\text{AMO}(G,\mathcal{K}) = \sum_{C: G^C \text{ is } \mathcal{K}\text{-consistent}}
  {\Phi(C,FP(C,\mathcal{T}),\mathcal{K}[C]) \times
  {\prod_{H\in \mathcal{C}_G(C)}{\#AMO(H,\mathcal{K}[H])}}}$.
This proves the correctness of \cref{lem:final-counting-algorithm}.
\end{proof}

\begin{proof}[Proof of \cref{lem:phi-computaion}]
  Proof of \cref{item-3-of-phi-computaion}: If $R=\emptyset$, then a permutation
  $\pi(S)$ of $S$ is $\mathcal{K}$-consistent if ordering of $V_{\mathcal{K}}$
  in $\pi(S)$ is $\mathcal{K}$-consistent.
  $\Psi(V_{\mathcal{K}}, \mathcal{K})$ gives the number of
  $\mathcal{K}$-consistent permutations of $V_{\mathcal{K}}$. Number of
  permutations of $S$ that has the same ordering of $V_{\mathcal{K}}$ in it is
  $\frac{|S|!}{|V_{\mathcal{K}}|!}$. This completes the proof of
  \cref{item-3-of-phi-computaion}.

  Proof of \cref{item-1-of-phi-computaion}: If there exists an edge
  $u \rightarrow v\in \mathcal{K}$ such that $u\in S\setminus R_l$ and $v\in R_l$ then no
  $\mathcal{K}$-consistent permutation of $S$ exists that starts with $R_l$.

  Proof of \cref{item-2-of-phi-computaion}: If there does not exist an edge
  $u \rightarrow v\in \mathcal{K}$ such that $u\in S\setminus R_l$ and $v\in R_l$, then
  one way to compute $\Phi(S,R,\mathcal{K})$ is to first compute number of
  $\mathcal{K}$-consistent permutations of $S$ that do not start with
  $R_1,R_2,\ldots, R_{l-1}$, i.e.,
  $\Phi(S,R-\{R_l\},\mathcal{K})$. But, $\Phi(S,R-\{R_l\},\mathcal{K})$ also counts the $\mathcal{K}$-consistent permutations of $S$ that starts with $R_l$
  but not with any $R_i$, for $1\leq i<l$. We subtract such permutations from
  $\Phi(S,R-R_l,\mathcal{K})$. To construct a $\mathcal{K}$-consistent
  permutation of $S$ that starts with $R_l$ but does not start with any $R_i$, $1\leq i<l$, we have to first construct a permutation of $R_l$ that does
  not start with any $R_i$, $1\leq i<l$, and then we have to construct a
  $\mathcal{K}$-consistent permutation of the remaining vertices of $S$. This
  implies the number of $\mathcal{K}$-consistent permutations of $S$ that start
  with $R_l$ and not with any $R_i$, $1\leq i<l$, is
  $\Phi(R_l, R-\{R_l\},\mathcal{K})\times \Phi(S\setminus
  R_l,\emptyset,\mathcal{K})$.
\end{proof}

\begin{proof}[Proof of \cref{lem:alg-valid-perm-correctness}]
    If $R=\emptyset$ then from \cref{item-3-of-phi-computaion} of \cref{lem:phi-computaion}, $\Phi(S,R,\mathcal{K})= \frac{|S|!}{|V_{\mathcal{K}}|!} \times \Psi(V_{\mathcal{K}}, \mathcal{K})$. Line \ref{alg-vp:return-K-empty} of \cref{alg:valid-permutaion-of-clique} returns the same. 


    If $R=\{R_1,R_2,\ldots, R_l\} \neq \emptyset$, and there exist an edge $u\rightarrow v \in \mathcal{K}$ such that $u\in S\setminus R_l$ and $v\in R_l$, then from \cref{item-1-of-phi-computaion} of \cref{lem:phi-computaion}, $\Phi(S,R,\mathcal{K})=\Phi(S,R-R_l,\mathcal{K})$. Line \ref{alg-vp:return2} of \cref{alg:valid-permutaion-of-clique} returns the same.

    If $R=\{R_1,R_2,\ldots, R_l\} \neq \emptyset$, and there does not exist an edge $u\rightarrow v \in \mathcal{K}$ such that $u\in S\setminus R_l$ and $v\in R_l$, then from \cref{item-2-of-phi-computaion} of \cref{lem:phi-computaion}, $\Phi(S,R,\mathcal{K})=\Phi(S,R-R_l,\mathcal{K})-{\Phi(R_l,R-\{R_l\},\mathcal{K}[R_l])\times \Phi(S\setminus R_l,\emptyset,\mathcal{K}[S\setminus R_l])}$. The line \ref{alg-vp:final-return} of \cref{alg:valid-permutaion-of-clique} returns the same. 
\end{proof} 

\begin{proof}[Proof of \cref{lem:main-algorithm-correct}]
  At line \ref{alg-count:clique-tree-construction}, \cref{alg:Count-AMO}
  constructs a rooted clique tree of $G$. Lines
  \ref{alg:count:G-is-a-clique}-\ref{alg-count:if-G-is-a-clique-end} deals with
  a special case when $G$ is a clique. If $R=V$ (at line
  \ref{alg:count:G-is-a-clique}) then $G$ is a clique. In this case, the number
  of $\mathcal{K}$-consistent AMOs of $G$ equals the number of
  $\mathcal{K}$-consistent permutation of $V$. Lines
  \ref{alg:count:G-is-a-clique}-\ref{alg-count:if-G-is-a-clique-end} do the
  same. For the general case (when $G$ is not a clique), we implement \cref{lem:final-counting-algorithm}. We create a queue $Q$
  at line \ref{alg-count:Queue-construction}, that stores maximal cliques of
  $G$. For each maximal clique  $C$ of $G$, we run lines \ref{alg-count:while-queue-is-not-empty}-\ref{alg-count:while-end}. 
  At line \ref{alg-count:LBFS}, we call
  \cref{alg:AMO-Union-K} (our LBFS-algorithm) for input $G,C$ and
  $\mathcal{K}$. If the first component of the output of \cref{alg:AMO-Union-K}
  is 0 then $G^C$ is not $\mathcal{K}$-consistent (from
  \cref{lem:output-of-Alg-1}). This further implies
  $|\{\alpha: \alpha\in \text{AMO}(G,\pi(C),\mathcal{K}) \text{ and }
  C=C_{\alpha}\}|=0$. This is why we skip lines
  \ref{alg-count:prod-init}-\ref{alg-count:if-end} if the first component of
  LBFS$(G,C,\mathcal{K})$ (\cref{alg:AMO-Union-K}) is 0. If the first component
  LBFS$(G,C,\mathcal{K})$ is 1 then $G^C$ is $\mathcal{K}$-consistent. In this
  case, at lines \ref{alg-count:foreach-start}-\ref{alg-count:foreach-end}, we
  compute $\prod_{H\in C_G(C)}{\#AMO(H,\mathcal{K}[H])}$, by recursively calling
  \cref{alg:Count-AMO}. At line \ref{alg-count:sum-update}, we compute
  $|\{\alpha: \alpha\in \text{AMO}(G,\mathcal{K}) \text{ and } C=C_{\alpha}\}|$
  using the discussion following \cref{lem:formular-for-KT-consistent-permutaion}. At the end of
  line-\ref{alg-count:while-end},  the variable \texttt{sum} has the value $\sum_{C : \text{$G^C$
      is $\mathcal{K}$-consistent}} {\Phi(C,FP(C,\mathcal{T}),\mathcal{K}[C])
    \times} {\prod_{H\in C_G(C)}{\#AMO(H,\mathcal{K}[H])}}$, i.e., \texttt{sum}
  equals $\#AMO(G,\mathcal{K})$ (from \cref{lem:final-counting-algorithm}). $\mathtt{memo}[G]$ stores the number of $\mathcal{K}$-consistent AMOs of $G$, once it is computed.
  This completes the proof.
  
  


\end{proof}



 \section{Proofs omitted from Section~\ref{sec:time-complexity}}
\label{appendix:time-complexity}

\begin{proof}[Proof of \cref{thm:LBFS-alg}]
  The ``While'' loop on lines \ref{alg:loop}-\ref{alg:while-end} runs at most $|V_G|$ times. Using two additional arrays (one for checking whether $v$ is in $C$ or not, and another for checking whether $v$ is in $\mathcal{L}$ or not) we can run lines \ref{alg:if-1-start}-\ref{alg:if-1-end} in $O(1)$ time. Checking the existence of edge $u\rightarrow v \in \mathcal{K}$ at line \ref{alg:mod-if} takes  $O(|\mathcal{K}|)$ time cumulatively, for all $v \in V_G$. Finding neighbors of $v$ at line \ref{alg:neighbour-v} takes $O(E_G)$ time cumulatively, for all $v\in V_G$. Partitioning each set at line \ref{alg:refine}, also takes $O(E_G)$ time cumulatively. 
Since the size of $\mathcal{K}$ can be at most $E_G$, this implies the overall time complexity of \cref{alg:AMO-Union-K} is $O(|V_G|+|E_G|)$ (with the same technique that is used to implement the standard LBFS of \cite{rose1976algorithmic}).
\end{proof}


\begin{proof}[Proof of \cref{prop:number-of-times-alg-2-called}]
\Cref{alg:Count-AMO} calls itself at line \ref{alg-count:prod-multiplication}, for each $H\in \mathcal{L}$, when $\texttt{flag} =1$. The value of \texttt{flag} is always 1 when $\mathcal{K} = \emptyset$, and $\mathcal{L} = \mathcal{C}_G(C)$ (from \cref{alg:AMO-Union-K}) does not depend on $\mathcal{K}$. This further implies that the \texttt{count} function has the maximum number of distinct recursive calls to itself when $\mathcal{K}=\emptyset$. But, for $\mathcal{K}=\emptyset$, \cref{alg:Count-AMO} is the same as the Clique-Picking algorithm of \cite{wienobst2020polynomial}, who showed that the number of these distinct recursive calls is at most $2|\Pi(G)|-1$ times. This completes the proof.
\end{proof}

\begin{proof}[Proof of \cref{lem:time-complexity-of-Phi}]
Let us denote $\mathcal{R}_i=\{R_1,R_2, \ldots , R_i\}$. For the computation of $\Phi(S, \mathcal{R}_l, \mathcal{K})$, from \cref{item-1-of-phi-computaion,item-2-of-phi-computaion} of \cref{lem:phi-computaion}, we need to compute $\Phi(S,\emptyset, \mathcal{K})$, $\Phi(S\setminus R_1,\emptyset, \mathcal{K}[S\setminus R_1])$, $\Phi(S\setminus R_2,\emptyset,\mathcal{K}[S\setminus R_2]), \ldots, \Phi(S\setminus R_l,\emptyset, \mathcal{K}[S\setminus R_l])$, $\Phi(S,\mathcal{R}_1, \mathcal{K})$, $\Phi(S,\mathcal{R}_2, \mathcal{K}), \ldots, \Phi(S,\mathcal{R}_{l-1}, \mathcal{K})$, and for each $1\leq i \leq l$,  $\Phi(R_i,\emptyset, \mathcal{K}[R_i])$, $\Phi(R_i\setminus R_1,\emptyset,\mathcal{K}[R_i\setminus R_1])$, $\ldots$ , $\Phi(R_i\setminus R_{i-1},\emptyset,\mathcal{K}[R_i\setminus R_{i-1}])$, $\Phi(R_i,\mathcal{R}_1,\mathcal{K}[R_i])$, $\Phi(R_i,\mathcal{R}_2,\mathcal{K}[R_i])$, $\ldots$ , $\Phi(R_i,\mathcal{R}_{i-1},\mathcal{K}[R_i])$.


Computation of each $\Phi(X,\phi,\mathcal{K}' = \mathcal{K}[X])$ takes $O(k!\cdot k^2)$ arithmetic operations. To see this, note that \cref{item-3-of-phi-computaion} of \cref{lem:phi-computaion} gives $\Phi(X,\phi,\mathcal{K}') = \frac{|X|!}{|V_{\mathcal{K}'}|} \times \Psi(V_{\mathcal{K}'}, \mathcal{K}')$. From our assumption, the factorials are already pre-computed. On the other hand, to compute $\Psi(V_{\mathcal{K}'},\mathcal{K}')$ we can check one-by-one the $\mathcal{K}'$-consistency of each permutation of $V_{\mathcal{K}'}$.  The number of permutations of $V_{\mathcal{K}'}$ is $O(k!)$, since $|V_{\mathcal{K}'}|\leq k$ (max-clique knowledge), while the verification of whether a permutation of $V_{\mathcal{K}'}$ is $\mathcal{K}'$-consistent or not takes $O(|\mathcal{K}'|)$ time. Since $V_{\mathcal{K}'} \leq k$, we have $|\mathcal{K}'| \leq k^2$.  Thus, the computation of $\Psi(V_{\mathcal{K}'},\mathcal{K}')$ takes $O(k^2\cdot k!)$ arithmetic operations.

Since the number of required computations of the type $\Phi(X,\phi,\mathcal{K}' = \mathcal{K}[X])$ (as already listed above) is $O(l^2)$, their total cost is $O(k!\cdot k^2 \cdot l^2)$.  After all the values listed above of the type $\Phi(X,\phi,\mathcal{K}' = \mathcal{K}[X])$ have been computed, we can implement a dynamic programming procedure using \cref{item-1-of-phi-computaion,item-2-of-phi-computaion} of \cref{lem:phi-computaion} (or, alternatively, a memoized version of \cref{alg:valid-permutaion-of-clique}) to compute all the required values of type $\Phi(X, Y\neq \emptyset, \mathcal{K}[X])$ (as listed above) using $O(1)$ arithmetic operations each.  Since the number of required computations of the type $\Phi(X, Y\neq \emptyset, \mathcal{K}[X])$ (again, as already listed above) is also $O(l^2)$, it follows that the total cost of these computations is $O(l^2)$.  Adding the computational costs for both types of computations, we see that the total cost is $O(k!\cdot k^2 \cdot l^2)$ arithmetic operations.

As the value of $l$ can be at most $|\Pi(G)|$ (the number of nodes in the clique tree $\mathcal{T}$), the overall number of arithmetic operations we need to compute $\Phi(S, \mathcal{R}_l, \mathcal{K})$ is
$O(k! \cdot k^2\cdot |\Pi(G)|^2)$.

\end{proof}

\begin{proof}[Proof of \cref{thm:ACMO-Counting-BK}]
\cref{alg:Count-AMO} is analogous to Clique-Picking Algorithm of \cite{wienobst2020polynomial}. We can also say that \cref{alg:Count-AMO} is the background knowledge version of the  Clique-Picking Algorithm of \cite{wienobst2020polynomial}. At line \ref{alg-count:clique-tree-construction}, we construct a clique tree of $G$, which takes $O(|V_G|+|E_G|)$ time.
Computing $\Phi$ function at line \ref{alg-count:memo-update}, for a clique $C$, takes $O(|\Pi(G)|^2\cdot k^2 \cdot k!)$ time (from \cref{lem:time-complexity-of-Phi}). While loop (at lines \ref{alg-count:while-queue-is-not-empty}-\ref{alg-count:while-end}) runs for $O(|\Pi(G)|)$ times, as the number of maximal cliques of $G$ is $|\Pi(G)|$. Running LBFS-algorithm (\cref{alg:AMO-Union-K}) at line \ref{alg-count:LBFS} takes $O(|V|+|E|)$ time (from \cref{thm:LBFS-alg}). Computation of function $\Phi$ at line \ref{alg-count:sum-update} takes $O({k! \cdot k^2\cdot |\Pi(G)|}^2)$ time (from \cref{lem:time-complexity-of-Phi}).

Note that it was assumed in \cref{alg:valid-permutaion-of-clique} that factorials of integers from $1$ to $\abs{V_G}$ are pre-computed.  The pre-computation of this table can be done using $O(|V_G|)$ arithmetic operations.  From \cref{prop:number-of-times-alg-2-called}, the number of distinct calls to \texttt{count} function of \cref{alg:Count-AMO} is $O(|\Pi(G)|)$.  Together, the above calculations show that the running time of \cref{alg:Count-AMO} is at most $O({k! \cdot k^2\cdot |\Pi(G)|}^4)$ or $O(k! \cdot k^2\cdot |V_G|^4)$, as for a chordal graph $G$, $|\Pi(G)|$ can be at most $|V_G|$. 
\end{proof}
 \section{Detailed explanation of Experimental Results}
\label{sec:appendix-detailed-explanation-of-experimental-results}
\textbf{Construction of chordal graphs with $n$ vertices}:  We first construct a connected \emph{Erd\H{o}s-R\'{e}nyi graph} $G$ with $n$ vertices such that each of its edges is picked with probability $p$, where $p$ is a random value in [0.1, 0.3). We give a unique rank to each node of the graph. We then process the vertices in decreasing order of rank. For each vertex $x$ of the graph, if $u$ and $v$ are two neighbors of $x$ such that $u$ and $v$ are not connected, and $u$ and $v$ both have lesser rank than the rank of $x$,  then we put an edge between $u$ and $v$ in $G$. This makes $G$ an undirected chordal graph, because, by construction, the decreasing order of ranks is a perfect elimination ordering. After this, we use rejection sampling to get an undirected connected chordal graph, i.e., if $G$ is not a connected graph then we reject $G$, and repeat the above process until we get an undirected connected chordal graph $G$.

\textbf{Construction of background knowledge edges:} For each chordal graph constructed above, and for each
  $k \in \{5,6,\ldots, 13\}$, we construct a set of background knowledge edges
  such that (i) for any maximal clique $C$ of size greater than or equal to $k$, the number of vertices of the clique that are part of an edge of the background knowledge with both endpoint in $C$ is $k$; and (ii) for any maximal clique of size less than $k$, the number of vertices of the clique that are part of an edge of background knowledge equals to the size of the clique.  To do this,  we pick one by one  each maximal clique of $G$, and select the edges of the clique such that at most $k$ vertices are involved in the set of selected edges with both of its endpoints in that clique. For this, we construct a rooted clique tree $\mathcal{T}=(T, R)$ of $G$.  We start with $R$ and then do a depth-first search (DFS) on $T$ to cover all the maximal cliques of $G$. At the iteration when we are at a maximal clique $C$, we first compute the set of vertices of the picked edges having both of their endpoints in $C$. If the size of the set is $k$ (or $|C|$, if $|C| < k$) we move to the next maximal clique. Otherwise, we one by one pick edges of $C$ and add to the selected set of edges until the set of vertices of the picked edges having both of their endpoints in $C$  reaches $k$ (or $|C|$, if $|C| < k$). 
We won't get into a situation where the set of vertices of the picked edges having both of their endpoints in $C$ exceeds $k$ (due to the clique intersection property of the clique-tree).



We write a python program for the construction of chordal graphs, background knowledge edges, and implementation of  \cref{alg:Count-AMO}.  The experiments use the open source \texttt{networkx} (\cite{SciPyProceedings_11}) package.

\paragraph{Effect of changing the size of the background knowledge while keeping
  $k$ fixed} Here we describe the construction of the background knowledge edge
sets $\mathcal{K}_1$ and $\mathcal{K}_2$ used in \cref{tab:1}.  We first
construct $\mathcal{K}_1$ as above.  We then construct $\mathcal{K}_2$ by adding
a few edges to $\mathcal{K}_1$ in such a way that the value of $k$ does not
change.  We do this experiment for different $n$ and $k$, where $n$ is the
number of nodes of the chordal graph, and $k$ is the maximum number of vertices
of any clique of the chordal graph that is part
of a background knowledge edge that lies completely inside that clique, as
defined earlier also.  \Cref{tab:2} gives a more detailed version of
\cref{tab:1} (given in the main section of the paper) with more dataset points.

\begin{table}[t]
  \centering
  \begin{tabular}{ |c|c|c|c|c|c| } 
    \hline
    $n$ & $k$ &$|\mathcal{K}_1|$ & $|\mathcal{K}_2|$ & $T_1$ & $T_2$ \\ 
    \hline
    600 & 6 & 58 & 73 & 95 & 92 \\  
    \hline
    600 & 6 & 52 & 65 & 192 & 190 \\  
    \hline
    700 & 7 & 47 & 67 & 144 & 144 \\  
    \hline
    700 & 7 & 49 & 74 & 132 & 128 \\  
    \hline
    800 & 8 & 56 & 83 & 199 & 195 \\  
    \hline
    800 & 8 & 55 & 85 & 200 & 195\\  
    \hline
    900 & 9 & 46 & 89 & 258 & 256 \\  
    \hline
    900 & 9 & 39 & 68 & 257 & 252 \\  
    \hline
    1000 & 10 & 65 & 116 & 370 & 353 \\  
    \hline
    1000 & 10 & 75 & 137 & 346 & 338 \\ 
    \hline
    1100 & 11 & 55 & 121 & 467 & 455 \\ 
    \hline
    1100 & 11 & 51 & 104 & 460 & 453 \\
    \hline
  \end{tabular}
  \caption{Exploring runtime dependence on number of background knowledge edges: detailed table}
  \label{tab:2}
\end{table}

We can also see from the table that the running time decreases slightly by
increasing the size of background knowledge edges. This is because as the number
of background knowledge increases the number of background consistent
permutations of any clique decreases.

 

\begin{thebibliography}{5}
\providecommand{\natexlab}[1]{#1}
\providecommand{\url}[1]{\texttt{#1}}
\expandafter\ifx\csname urlstyle\endcsname\relax
  \providecommand{\doi}[1]{doi: #1}\else
  \providecommand{\doi}{doi: \begingroup \urlstyle{rm}\Url}\fi

\bibitem[Andersson et~al.(1997)Andersson, Madigan, and
  Perlman]{andersson1997characterization}
Steen~A. Andersson, David Madigan, and Michael~D. Perlman.
\newblock {A} {Characterization} of {Markov} {Equivalence} {Classes} for
  {Acyclic} {Digraphs}.
\newblock \emph{Annals of Statistics}, 25\penalty0 (2):\penalty0 505--541,
  1997.

\bibitem[Blair and Peyton(1993)]{blair1993introduction}
Jean R.~S. Blair and Barry Peyton.
\newblock An {introduction} to {Chordal} {Graphs} and {Clique} {Trees}.
\newblock In \emph{Graph Theory and Sparse Matrix Computation}, pages 1--29.
  Springer, 1993.

\bibitem[Hagberg et~al.(2008)Hagberg, Schult, and Swart]{SciPyProceedings_11}
Aric~A. Hagberg, Daniel~A. Schult, and Pieter~J. Swart.
\newblock Exploring network structure, dynamics, and function using networkx.
\newblock In Ga\"el Varoquaux, Travis Vaught, and Jarrod Millman, editors,
  \emph{Proceedings of the 7th Python in Science Conference}, pages 11 -- 15,
  Pasadena, CA USA, 2008.

\bibitem[Rose et~al.(1976)Rose, Tarjan, and Lueker]{rose1976algorithmic}
Donald~J. Rose, R.~Endre Tarjan, and George~S. Lueker.
\newblock {Algorithmic} {Aspects} of {Vertex} {Elimination} on {Graphs}.
\newblock \emph{SIAM Journal on Computing}, 5\penalty0 (2):\penalty0 266--283,
  1976.

\bibitem[Wien{\"o}bst et~al.(2021)Wien{\"o}bst, Bannach, and
  Li{\'s}kiewicz]{wienobst2020polynomial}
Marcel Wien{\"o}bst, Max Bannach, and Maciej Li{\'s}kiewicz.
\newblock Polynomial-{Time} {Algorithms} for {Counting} and {Sampling} {Markov}
  {Equivalent} {DAGs}.
\newblock In \emph{Proceedings of the 35th AAAI Conference on Artificial
  Intelligence (AAAI 2021)}, pages 12198--12206, 2021.

\end{thebibliography}


\end{document}
