\section{Background: Causal Graphical Models}
\label{sec:CausalGMs}
Let $G$ be a directed graph with nodes $\nodes(G)$ and edges $\edges(G)$. As in the undirected case, given a set of vertices $Z \subseteq \nodes(G)$, we denote by $G[Z]$ the directed subgraph induced by $Z$. Formally, $\edges(G[Z])=\set{(u,v)\in \edges(G): \set{u,v}\subseteq Z}$.
A \e{path} between $u$ and $v$ is a sequence of adjacent vertices $(v_1,\dots,v_j)$ such that $u=v_1$ and $v=v_j$. 
A vertex $w$ is a \e{collider} on a path if the path contains the subpath $u\shortrightarrow w \shortleftarrow v$.
The path is directed, or \e{causal}, if $v_i\rightarrow v_{i+1}$ for all $i\in \set{1,2,\dots,j-1}$. 
A directed cycle is a directed path from $u$ to $v$, combined with the directed edge $v\shortrightarrow u$. 
A directed acyclic graph (DAG) is a directed graph without directed cycles. The \e{moral graph} of a DAG $G$ is an undirected graph $G^m$ with the same vertex set as $G$, and where $(u,v)\in \edges(G^m)$ if and only if there is a directed edge between $u$ and $v$ in $G$, or if there exists a vertex $w\in \nodes(G)$ such that $u\shortrightarrow w \shortleftarrow v$ is an induced subgraph of $G$. 

If $u{\shortrightarrow} w{\in} \edges(G)$, then $u$ is a \e{parent} of $w$. If there is a directed path from $u$ to $w$, then $u$ is an \e{ancestor} of $w$ and $w$ a \e{descendant} of $u$. We follow the convention that a vertex is an ancestor and descendant of itself. The parents, ancestors and descendants of $w\in \nodes(G)$ are denoted by $\pa{G}(w)$, $\an{G}(w)$ and $\de{G}(w)$, respectively. For $Z{\subseteq} \nodes(G)$, we define $\an{G}(Z){\eqdef} \cup_{z\in Z}\an{G}(z)$, $\de{G}(Z){\eqdef} \cup_{z\in Z}\de{G}(z)$, and $\pa{G}(Z){\eqdef}\cup_{z\in Z}\pa{G}(z)$.
We denote by $\nd{G}(Z)\eqdef \nodes(G){\setminus}\de{G}(Z)$ the nondescendants of $Z$.

Let $G$ be a DAG, and $x,y{\in} \nodes(G)$. The set of \e{causal vertices} between $x$ and $y$, denoted $\cv{G}(x,y)$, consists of those vertices that lie on a directed $x,y$-path in $G$. The set of \e{forbidden vertices} in $G$ with respect to $x,y\in \nodes(G)$ is defined to be $\forb{G}(x,y)\eqdef \set{x}\cup \de{G}(\cv{G}(x,y))$. Accordingly, for $X,Y\subseteq \nodes(G)$, we define $\cv{G}(X,Y)$ as the set of vertices that lie on a directed $x,y$-path in $G$ for some $x\in X$ and $y\in Y$.
Given $X,Y\subseteq \nodes(G)$, the \e{proper back-door graph} $\Gpbd{G}(X,Y)$~\citep{DBLP:journals/ai/ZanderLT19} is defined as the graph that results from $G$ by removing the first edge of every directed $X,Y$-path. Formally, 
\begin{equation}
	\label{eq:Gpbd}
\edges(\Gpbd{G}(X,Y))\eqdef \edges(G){\setminus}\set{x{\shortrightarrow} u: x{\in} X,  u{\in} \cv{G}(X,Y)}
\end{equation}
\eat{
Let $G$ be a DAG, and let $\bx$, $\by$ and $\bZ$ be distinct subsets of $\nodes(G)$. A path $q$ in $G$ between $X\in \bx$ and $Y\in \by$ is \e{blocked} by $\bZ$ if at least one of the following holds: (i) there is a vertex $Z\in \nodes(q) \cap \bZ$ that is not a collider on $q$, or (ii) there exists a vertex $W\in \nodes(G)$ that is a collider on $q$ such that neither $W$ nor its descendants belong to $\bZ$. We say that $\bx$ and $\by$ are \e{d-separated} by $\bZ$ if, for any $X\in \bx$ and $Y\in \by$, all paths between $X$ and $Y$ are blocked by $\bZ$.
}

\subsubsection*{Identification via Covariate Adjustment}
A \e{Bayesian Network} (BN) for a set of variables $V{=}\set{v_1,\dots,v_n}$ is a pair $\B{\eqdef}(G,P)$ where $G$ is a DAG, and $P$ a joint probability distribution for $V$ that factorizes as $P(V)=\prod_{i=1}^nP(v_i|\pa{G}(v_i))$. For a variable $u\in V$, we denote by $\bu$ an assignment to $u$, and for a subset of variables $X\subseteq V$, we denote by $\bx$ an assignment to all variables in $X$.
We say that the BN $\B$ is \e{causal} if every edge $v_i\shortrightarrow v_j \in \edges(G)$ represents a direct causal effect of $v_i$ on $v_j$. Given a causal BN $\B{=}(G,P)$ and a subset $X \subseteq V$, the \e{post intervention} distribution in $X$ is:
\begin{equation}
	\label{eq:postIntervention}
	P(\bV | do(\bx))\eqdef\begin{cases}
			\prod_{v_i\in V{\setminus}X} P(\boldsymbol{v}_i | \pa{G}(v_i)) & \substack{ \bV \text{ is consistent} \\ \text{ with } \bx }\\
			0 & \text{otherwise}
		\end{cases}
\end{equation}
where  $\bV$ is consistent with $\bx$ if $\bV$ and $\bx$ assign the same values to the variables in $X\cap V$, and $do(\bx)$ represents an intervention that sets $X=\bx$. 
In a DAG, this intervention corresponds to removing all edges into $X$ (i.e., all edges between $X$ and $\pa{G}(X)$). 
The term $P(Y | do(X{=}\bx))$ is called the \e{causal effect} of $X$ on $Y$.

 When all variables $\nodes(G)$ in the DAG $G$ are observed, the causal effect $P(Y | do(X{=}\bx))$ of $X$ on $Y$ in $G$ can be determined directly from $P$ using~\eqref{eq:postIntervention}. When some variables are unobserved, then $P(Y | do(X{=}\bx))$ cannot necessarily be computed directly from $P$. When it can, then it is said that the causal effect of $X$ on $Y$ is \e{identifiable}~\citep{Pearl09}.
 
 \begin{citeddefinitionAAAI}{\citep{Pearl09}}
 	\label{def:covAdj}
 	Given a DAG $G$, and pairwise disjoint $X,Y,Z \subseteq \nodes(G)$, $Z$ is called an \e{adjustment} for estimating the causal effect of $X$ on $Y$ if, for every distribution $P$ that factorizes according to $G$, it holds:
 	\begin{equation}
 		\label{eq:covAdj}
 		P(\by| do(\bx))=\begin{cases}
 			P(\by|\bx) & \text{if }Z=\emptyset\\
 			\sum_{\bZ}P(\by| \bx,\bZ)P(\bZ) & \text{otherwise}
 		\end{cases}
 	\end{equation}
 \end{citeddefinitionAAAI}
 \eat{
Observe that computing $P(\by| do(\bx))$ depends, exponentially, on the domain-size of $Z$, which can be incorporated into weights assigned to the variables $Z$, thus motivating the search for low-weight adjustment sets.}
Let $R \subseteq \nodes(G)$ denote the set of observable variables in $\nodes(G)$. We say that an adjustment set $Z$ is \e{valid} if $Z \subseteq R$.
There exist graphs for which $P(Y | do(X{=}\bx))$  is identifiable but for which no valid adjustment set $Z \subseteq R$ exists.
Smucler et al.~\citeyearpar{10.1093/biomet/asab018}, and van der Zander et al.~\citeyearpar{DBLP:journals/ai/ZanderLT19} established a 
graphical criterion that determines whether $P(Y | do(X{=}\bx))$ has a valid adjustment set.

Let $I \subseteq R \subseteq \nodes(G)$. We denote by $\AdjSet{X,Y}{I}{R}$ all of the adjustment sets $Z$ for $X,Y$ in $G$ according to~\eqref{eq:covAdj}, where $I\subseteq Z \subseteq R$. We call the set $\AdjSet{X,Y}{I}{R}$ the $I,R$ adjustment sets for $X,Y$ in $G$.
We say that $Z \in \AdjSet{X,Y}{I}{R}$ is a \e{minimal $I,R$ adjustment set for $X,Y$} if no proper subset of $Z$ is an $I,R$ adjustment set for $X,Y$.
We denote by $\MinlAdjSet{X,Y}{I}{R}$ the minimal $I,R$ adjustment sets for $X,Y$ in $G$.
\subsection{Characterizing Adjustment Sets as Separators in an Undirected Graph}
\label{sec:characterizingAdjSetsViaUndirectedGraphs}
In this section, we consider BNs with DAG $G$, where $R \subseteq \nodes(G)$ is the set of observable variables. We assume that $\emptyset \subset R$ since otherwise, no valid adjustment set exists.
Next, we describe the results of van der Zander et al.~\citeyearpar{DBLP:journals/ai/ZanderLT19}, and Smucler et al.~\citeyearpar{10.1093/biomet/asab018}, which showed that $\AdjSet{X,Y}{I}{R}$, the $I,R$ adjustment sets for $X,Y$ in $G$, 
are represented as separators in a certain undirected graph that we describe next.
Given a DAG $G$, two distinguished vertex-sets $X,Y\subseteq \nodes(G)$, a subset of observable variables $R \subseteq \nodes(G)$, and a subset $I \subseteq R$, we define the undirected graph: % $\adjSetGraph{\bx,\by}{\bI}{0}$ as follows: %$\H^0_{\bx,\by}(\bI,G)$ as follows:
\begin{align}
	\label{eq:HUndirected}
	\adjSetGraph{X,Y}{I}{0} \eqdef \left(\Gpbd{G}(X,Y)[\an{G}(I \cup X \cup Y)] \right)^m
\end{align} 
where $\Gpbd{G}$ is the proper back-door graph (see~\eqref{eq:Gpbd}), and $(\cdots)^m$ refers to the undirected moral graph.
\begin{definition}[$\adjSetGraph{X,Y}{I}{1}$]
	$\adjSetGraph{X,Y}{I}{1}$ is the undirected graph that results from $\adjSetGraph{X,Y}{I}{0}$ by: (1) adding all edges between $X{\cup}Y$ and $I$, and (2) saturating (see~\eqref{eq:ESatG}) all vertices of $\adjSetGraph{X,Y}{I}{0}$ that belong to $(\nodes(G){\setminus}R) {\cup} \forb{G}(X,Y)$, and removing them from the graph. 
\end{definition}
The following is the key result, which relates $(X,Y)$-separators in $\adjSetGraph{X,Y}{I}{1}$ to the valid adjustment sets $\AdjSet{X,Y}{I}{R}$.
\begin{citedtheoremAAAI}{\citep{DBLP:journals/ai/ZanderLT19,10.1093/biomet/asab018}}
	\label{thm:adjSetToSep}
	\begin{enumerate}
		\item $\AdjSet{X,Y}{I}{R}\neq \emptyset$ if and only if $X$ and $Y$ are not adjacent in $\adjSetGraph{X,Y}{I}{1}$.
		\item Let $S \subseteq \an{G}(X\cup Y \cup I)$. Then $S\in \AdjSet{X,Y}{I}{R}$ if and only if $S$ is an $X,Y$-separator in $\adjSetGraph{X,Y}{I}{1}$.
		\item $S{\in} \MinlAdjSet{X,Y}{I}{R}$ iff $S{\in} \minlsep{X,Y}{\adjSetGraph{X,Y}{I}{1}}$.
	\end{enumerate}
\end{citedtheoremAAAI}
In Theorem~\ref{thm:simpABthm} we characterized separators between vertex sets as separators between singleton vertices in a modified undirected graph. Let $x\in X$, $y \in Y$. Let $\H \eqdef \adjSetGraph{X,Y}{I}{}$ be the graph that results from $\adjSetGraph{X,Y}{I}{1}$ by adding all edges between $x$ and $N_{\adjSetGraph{X,Y}{I}{1}}(X)$, and all edges between $y$ and $N_{\adjSetGraph{X,Y}{I}{1}}(Y)$. By Theorem~\ref{thm:simpABthm}: 
\begin{align}
	\label{eq:minAdjToMinlSeps}
\MinlAdjSet{X,Y}{I}{R} {\overbrace{=}^{\text{Thm.~\ref{thm:adjSetToSep}}}}\minlsep{X,Y}{\adjSetGraph{X,Y}{I}{1}}{\overbrace{=}^{\text{Thm.~\ref{thm:simpABthm}}}}\minlsep{x,y}{\H} 
\end{align}
In addition, if $S\subseteq \an{G}(I\cup X \cup Y)$ then:
\begin{align}
S{\in} \AdjSet{X,Y}{I}{R}&~\Leftrightarrow~S\text{ an }X,Y{\sminus}\text{separator in }\adjSetGraph{X,Y}{I}{1} \nonumber \\
&~\Leftrightarrow~S\text{ an }x,y{\sminus}\text{separator in }\H 	\label{eq:AdjToSeps}
\end{align}
Eqs.~\eqref{eq:minAdjToMinlSeps} and~\eqref{eq:AdjToSeps} allow us to reduce the problem of finding adjustment sets for $X,Y$ in the DAG $G$ to that of finding $x,y$-separators in the undirected graph $\H$. 
%From~\eqref{eq:minAdjToMinlSeps} and~\eqref{eq:AdjToSeps}, we have a characterization of valid adjustment sets for $X,Y$ in the DAG $G$, as $x,y$-separators in $\H$. 
\section{Ordering Adjustment Sets by Efficiency}
\label{sec:OrderingAdjSets}
Let $\B{=}(G,P)$ be a causal BN with observable variables $R \subseteq \nodes(G)$, and let $X,Y,I \subseteq R$. 
We aim to estimate the interventional mean $\mathbb{E}_P(Y | do(\bx), \bI)$.
Using the method of covariate adjustment, the non-parametric estimator for the interventional mean depends on the adjustment set $Z$. 
Following previous work~\citep{10.1093/biomet/asab018,DBLP:journals/corr/abs-2201-02037}, 
we consider unbiased estimators that converge, in distribution, to a normal distribution. 
We denote by $\sigma^2_{Z}(P)$ the variance of the normally-distributed estimator when computed using the adjustment set $Z$ (see~\eqref{eq:covAdj}).
Different adjustment sets $Z$ may yield estimators with varying levels of variance, making the choice of $Z$ crucial for obtaining reliable and accurate estimates.

Let $Z_1,Z_2 \in \AdjSet{X,Y}{I}{R}$ be two valid adjustment sets for estimating the causal effect of $X$ on $Y$ in $G$. We say that $Z_1$ is \e{more efficient} than $Z_2$, in notation $Z_1 \adjEff{G}Z_2$, if and only if $\sigma^2_{Z_1}(P)\leq \sigma^2_{Z_2}(P)$ for every joint probability distribution $P$ that factorizes according to $G$. It has been established that $\adjEff{G}$ does not, in general, induce a total order over the set of valid adjustment sets $\AdjSet{X,Y}{I}{R}$. In other words, there may exist two distinct adjustment sets $Z_1,Z_2 \in \AdjSet{X,Y}{I}{R}$ such that $\sigma^2_{Z_1}(P)< \sigma^2_{Z_2}(P)$ and $\sigma^2_{Z_1}(P')> \sigma^2_{Z_2}(P')$, where $P$, $P'$ are two distinct joint probability distributions that factorize according to $G$~\citep{DBLP:journals/jmlr/RotnitzkyS20}. That is, there may be pairs of $X,Y$-adjustment sets in $G$ that are incomparable with respect to efficiency.
\begin{definition}
	\label{def:dominates}
Let $Z_1,Z_2 \in \AdjSet{X,Y}{I}{R}$. We say that $Z_1$ \e{dominates} $Z_2$ if $Z_1 \adjEff{G}Z_2$ and $|Z_1|\leq |Z_2|$, and that $Z_1$ \e{strictly dominates} $Z_2$ if $Z_1$ dominates $Z_2$ and at least one of these inequalities is strict.
\end{definition}
The Pareto-Optimal frontier of adjustment sets is the subset of sets in $\AdjSet{X,Y}{I}{R}$ that are not strictly dominated by any other set in $\AdjSet{X,Y}{I}{R}$.
\eat{\batya{In previous work, \citeauthor{10.1093/biomet/asab018} established a relationship between adjustment sets $Z_1,Z_2 \in \AdjSet{X,Y}{I}{R}$ that guarantees $Z_1 \adjEff{G}Z_2$.}}

Let $H$ be an undirected graph, $A,B \subseteq  \nodes(H)$, and $S_1,S_2$ two (not necessarily minimal) $A,B$-separators in $H$. We denote by $S_1 \trianglelefteq_{_H} S_2$ that $S_1$ separates $A$ from $S_2{\setminus}S_1$, and $S_2$ separates $B$ from $S_1{\setminus}S_2$ in $H$.
\begin{citedtheoremAAAI}{\citep{10.1093/biomet/asab018}}
	\label{thm:orderAdjSets}
	Let $Z_1,Z_2 \in  \AdjSet{X,Y}{I}{R}$, such that $Z_1,Z_2 \subseteq \nodes(\adjSetGraph{X,Y}{I}{1})$. If $Z_1  \trianglelefteq_{_{\adjSetGraph{X,Y}{I}{1}}} Z_2$, then $Z_1\adjEff{G} Z_2$.
\end{citedtheoremAAAI}
\def\propTriangle{	Let $S_1,S_2$ be two $s,t$-separators in $H$. Then $S_1 \trianglelefteq_{_H} S_2$ if and only if $C_s(H\sminus S_1)\subseteq C_s(H\sminus S_2)$ and $C_t(H\sminus S_2)\subseteq C_t(H \sminus S_1)$.}
In Section~\ref{sec:minsepsvertexsets} of the Appendix, we prove the following result, which translates the efficiency criterion of Theorem~\ref{thm:orderAdjSets} into a structural property of separators that is crucial for ranked enumeration.
\begin{proposition}
	\label{prop:triangle}
\propTriangle
\end{proposition}
\eat{
\begin{proof}
	If $C_s(H\sminus S_1)\subseteq C_s(H\sminus S_2)$, then $\emptyset=C_s(H\sminus S_2)\cap S_2 \supseteq C_s(H\sminus S_1)\cap S_2$, and hence  $C_s(H\sminus S_1)\cap S_2=\emptyset$. By definition, every vertex connected to $s$ in $H\sminus S_1$ must belong to $C_s(H\sminus S_1)\cup S_1$. Since $(S_2{\setminus}S_1)\cap(C_s(H\sminus S_1)\cup S_1)=\emptyset$, then $S_1$ separates $s$ from $S_2{\setminus}S_1$. Symmetrically, we have that if $C_t(H\sminus S_2)\subseteq C_t(H\sminus S_1)$, then $(S_1{\setminus}S_2)\cap(C_t(H\sminus S_2)\cup S_2)=\emptyset$, thus $S_2$ separates $t$ from $S_1{\setminus}S_2$.
	
	If $S_1$ separates $s$ from $S_2{\setminus}S_1$, then $(S_2{\setminus}S_1)\cap C_s(H\sminus S_1)=\emptyset$. By definition, $S_1\cap C_s(H\sminus S_1)=\emptyset$, and hence $S_2 \cap  C_s(H\sminus S_1)=\emptyset$. This, in turn, means that $C_s(H\sminus S_1)$ is contained in the connected component of $H\sminus S_2$ that contains $s$. By definition, $C_s(H\sminus S_1)\subseteq C_s(H\sminus S_2)$. Symmetrically, if  $S_2$ separates $t$ from $S_1{\setminus}S_2$, then  $C_t(H\sminus S_2)\subseteq C_t(H\sminus S_1)$. So, if $S_1 \trianglelefteq_{_H} S_2$ then $C_s(H\sminus S_1)\subseteq C_s(H\sminus S_2)$ and $C_t(H\sminus S_2)\subseteq C_t(H\sminus S_1)$.
\end{proof}
}

\subsection{Proof of Theorem~\ref{thm:ParetoFrontier}}
We show how Proposition~\ref{prop:containmentCs}, Proposition~\ref{prop:triangle}, Theorem~\ref{thm:importantSepsEnum}, and Theorem~\ref{thm:orderAdjSets} are combined to prove Theorem~\ref{thm:ParetoFrontier}.

Let $x{\in} X$, $y{\in} Y$, and $\H$ the graph that results from $\adjSetGraph{X,Y}{I}{1}$  by adding all edges between $x$ and $N_{\adjSetGraph{X,Y}{I}{1}}(X)$, and between $y$ and $N_{\adjSetGraph{X,Y}{I}{1}}(Y)$. By Theorem~\ref{thm:simpABthm}, we have that $\minlsep{X,Y}{\adjSetGraph{X,Y}{I}{1}}=\minlsep{x,y}{\H}$.
Let $S_1,S_2$ be $X,Y$-separators in $\adjSetGraph{X,Y}{I}{1}$. From~\eqref{eq:AdjToSeps}, we have that $S_1 \trianglelefteq_{\adjSetGraph{X,Y}{I}{1}} S_2$ if and only if $S_1 \trianglelefteq_{\H} S_2$.
If, in addition, we have that $S_1,S_2$ are minimal $X,Y$-separators in $\adjSetGraph{X,Y}{I}{1}$, then by Proposition~\ref{prop:containmentCs},
we have that $C_y(\H \sminus S_1)\subseteq C_y(\H \sminus S_2)$ if and only if $C_x(\H \sminus S_2)\subseteq C_x(\H \sminus S_1)$. 
Consequently, if $C_y(\H \sminus S_1)\subseteq C_y(\H \sminus S_2)$, then Proposition~\ref{prop:triangle} gives $S_1 \trianglelefteq_{_\H} S_2$, and Theorem~\ref{thm:orderAdjSets} in turn yields:
\begin{align}
	\label{eq:fromAdjSetsToCloseMinlseps}
\text{If }C_y(\H\sminus S_1)\subseteq C_y(\H\sminus S_2)\text{, then }S_1  \adjEff{G} S_2.
\end{align}
Essentially,~\eqref{eq:fromAdjSetsToCloseMinlseps} translates the quality of adjustment sets in causal BNs with unobserved variables to a simple graphical property of minimal $x,y$-separators in an undirected graph. Therefore, the set of Pareto-Optimal adjustment sets in $\MinlAdjSet{X,Y}{I}{R}$ corresponds precisely to the set of important minimal $x,y$-separators in $\H$ (Definition~\ref{def:importantSeps}).
By Theorem~\ref{thm:importantSepsEnum}, the set of Pareto-Optimal adjustment sets whose size is at most $k$ can be listed in time $O(k(n+m)4^k)$.


Proposition~\ref{prop:triangle}, and its consequence Eq.~\eqref{eq:fromAdjSetsToCloseMinlseps}, also generalize previous results of Smucler et al.~\citeyearpar{10.1093/biomet/asab018}.
By Lemma~\ref{lem:closeTos}, there exists a unique minimal $x,y$-separator $S$ that is closest to $y$. That is, $C_y(\H\sminus S)\subseteq C_y(\H\sminus S')$ for every $S'\in \minlsep{x,y}{\H}$. From~\eqref{eq:fromAdjSetsToCloseMinlseps}, this immediately translates to a unique, minimal, optimal, valid $X,Y$-adjustment set that can be found in polynomial time, thereby recovering the result of Smucler et al.~\citeyearpar{10.1093/biomet/asab018}.
Theorem~\ref{thm:uniqueMinClosest} established that there exists a unique, minimum $x,y$-separator $S$ that is closest to $y$. From~\eqref{eq:fromAdjSetsToCloseMinlseps}, this immediately translates to a unique, minimum, optimal, valid $X,Y$-adjustment set in the causal BN that can be found in polynomial time, thereby recovering the result of Smucler et al.~\citeyearpar{10.1093/biomet/asab018}.