\interfootnotelinepenalty=10000

\subsection{Partition Correctness of Algorithm \ref{alg:method}} \label{sec:partition_correctness}


Per Theorem \ref{theorem:z4_z8_latent}, LDP correctly labels partitions $\z_4$, $\z_7$, and $\z_8$ without conditions \ref{cond:sufficient_2} and \ref{cond:sufficient_3}, even in the presence of latent confounding. To correctly label every member of partitions $\z_1$, $\z_2$, $\z_3$, and $\z_5$, we assume the following sufficient (but not necessary) conditions: \ref{cond:sufficient_2}, \ref{cond:sufficient_3}, \ref{cond:sufficient_1}, and \ref{cond:sufficient_4}.

\rebuttal{
\begin{enumerate}[noitemsep,topsep=0pt, label=C\arabic*]
\setcounter{enumi}{2}
\item\label{cond:sufficient_1} The absence of inter-partition active paths (Definition \ref{def:inter_paths}). 
\item\label{cond:sufficient_4} Causal sufficiency in $\g$. 
\end{enumerate}
}

\rebuttal{Note that \ref{cond:sufficient_1} and \ref{cond:sufficient_4} are not needed for VAS discovery.} Given \ref{cond:sufficient_1}, all of $\z_2$ (if any exist) will be marginally dependent on $\z_4$ and will be identifiable by LDP. The second statement of \ref{cond:sufficient_3} is trivially satisfied when \ref{cond:sufficient_1} is satisfied (as $\z_5$ shares no active paths with $\z_1$ in this setting) but is significant when \ref{cond:sufficient_1} is violated. We demonstrate robustness of partition label correctness to specific violations of \ref{cond:sufficient_1} in Tables \ref{tab:results_m_butterfly} and \ref{tab:latents}. Correctness under violations of \ref{cond:sufficient_4} is described in Section \ref{sec:results:latent}, Appendix \ref{append:z4_z8_latent}, and Appendix \ref{sec:adjustment_correctness}.

Given these sufficient (but not necessary) conditions, we obtain Theorem \ref{theorem:correctness}. 

\begin{theorem} [Partition correctness of Algorithm \ref{alg:method}] Given the sufficient conditions described above, Algorithm \ref{alg:method} is guaranteed to output a correct partition of $\z$ as defined in Table~\ref{tab:partitions}.
\label{theorem:correctness}
\end{theorem}

Proof of Theorem \ref{theorem:correctness} follows from proofs of Lemmas \ref{proof:step_1}–\ref{proof:step_7}, which prove correctness for each step of Algorithm \ref{alg:method} sequentially. In footnotes, we acknowledge certain partitioning behaviors that occur when condition \ref{cond:sufficient_1} is violated. However, these acknowledgements are non-exhaustive. \\

\begin{lemma}
    [Step 1 of Algorithm \ref{alg:method}]  $X \ind Z \land Y \ind Z \iff Z \in \z_8$. \label{proof:step_1}
\end{lemma} 

\vspace{-3mm}

\begin{proof} 
    \textit{Step 1 of Algorithm \ref{alg:method} correctly identifies $\z_8$.} This subset of $\z$ is the most trivial to identify, as it does not share an active path with either exposure or outcome in $\g$. By definition, any $Z_8 \in \z_8$ is marginally independent of $X$ and marginally independent of $Y$. Additionally, no candidate $Z \in \z \setminus \z_8$ is marginally independent of both $X$ and $Y$. Thus, any $Z \in \z$ satisfying $X \ind Z \land Y \ind Z$ belongs to $\z_8$ and can be removed from further consideration.
\end{proof}

\begin{lemma} 
    [Step 2 of Algorithm \ref{alg:method}] $X \ind Z \land X \nind Z | Y \iff Z \in \z_4$. \label{proof:step_2}
\end{lemma} 

\vspace{-3mm}

\begin{proof} 
    \textit{Step 2 of Algorithm \ref{alg:method} correctly identifies $\z_4$.\footnote{See Appendix \ref{append:z4_z8_latent} for proof of the identifiability of $\z_4$ under latent confounding.}} Variables in $\z_4$ share an active path with outcome $Y$ in $\g$ but not exposure $X$. For any $Z_4 \in \z_4$, this results in a $v$-structure $X \cdots \rightarrow Y \leftarrow \cdots Z_4$.\footnote{Note that this requires $X$ and $Y$ to be marginally dependent, an assumption made in Section \ref{sec:identifiability}. $X \nind Y$ is true when at least one of the following conditions is true: 1) $X$ is a direct cause of $Y$, 2) $X$ is an indirect cause of $Y$ through mediators in $\z_3$, and/or 3) $X$ and $Y$ share confounders in $\z_1$.} By definition, all such $v$-structures entail $X \ind Z_4 \land X \nind Z_4 | Y$. Besides $\z_4$, only $\z_8$ is marginally independent of $X$. However, $\z_8$ is not conditionally dependent on $X$ given $Y$. Thus, no subset of $\z$ entails $X \ind Z \land X \nind Z | Y$ except $\z_4$. Any variable passing the test in Step 2 is unambiguously a member of $\z_4$. Further, $\z_4$ is correctly identified for downstream use in Step 4 to identify $\z_{\textsc{Post}}$.
\end{proof}

\begin{lemma} 
    [Step 3 of Algorithm \ref{alg:method}] $Y \nind Z \land Y \ind Z | X \iff Z \in \z_{5,7}$. \label{proof:step_3}
\end{lemma} 

\vspace{-3mm}

\begin{proof} 
    \textit{Step 3 of Algorithm \ref{alg:method} correctly identifies $\z_{5,7}$.} We prove both directions of the bidirectional statement by direct proof. This test will be passed under two conditions: 1) $Z \in \z_7$ for any arbitrary $\g$ and 2) $Z \in \z_5$ when $\g$ is such that $\z_1$ is the empty set (i.e., there are no backdoor paths for $X$ and $Y$). Thus, this test will capture all $\z_7$ under any circumstances but will additionally capture $\z_5$ only when $\g$ is structured such that exposure $X$ blocks all backdoor paths from $\z_{5}$ to outcome $Y$. Further, no subset of $\z$ will pass the test in Step 3 but $\z_{5,7}$. Partitions $\z_1$, $\z_2$, $\z_3$, $\z_4$, and $\z_6$ are parents or effects of $Y$ and thus $X$ cannot block the flow of association between these partitions and $Y$. $\z_8$ will not pass this test either, as it is not marginally dependent on $Y$. Therefore, $Y \nind Z \land Y \ind Z | X$ if and only if $Z$ is in $\z_{5,7}$. Further, if $\z_1$ is nonempty when LDP terminates, it can be concluded that variables passing this test are only $\z_7$ (Line 24, Algorithm \ref{alg:method}).
\end{proof}

\begin{lemma} 
    [Step 4 of Algorithm \ref{alg:method}] Given execution of prior steps in Algorithm \ref{alg:method}, $\exists \; Z_4 \in \z_4$  : $Z \nind Z_4$ or $Z \ind Z_4 | X \cup Y \iff Z \in \z_{2,3,6} \in \z_{\textsc{Post}}$. \label{proof:step_4}
\end{lemma}

\vspace{-3mm}

\begin{proof} 
    \textit{Step 4 of Algorithm \ref{alg:method} correctly identifies $\z_{2,3,6} \in \z_{\textsc{Post}}$.}
        This test exploits prior knowledge of $\z_4$ to identify all of $\z_2$ and $\z_6$ in any arbitrary $\g$ meeting sufficient conditions \ref{cond:sufficient_1}–\ref{cond:sufficient_4}. Under condition \ref{cond:sufficient_1}, no $\z_3$ will pass this test by the same logic that $\{\z_1,\z_5\}$ will not (as proven below).\footnote{If sufficient condition \ref{cond:sufficient_1} is violated, a $Z_3$ may be captured at this step if it is marginally dependent on any $Z_4$. Further, this violation can cause Step 4 to miss members of $\z_2$ that are not descendants of $Y$ (as discussed throughout Section \ref{sec:adjustment_correctness}).}  Note that $\z_4$, $\z_7$, and $\z_8$ have already been identified and removed from further consideration. Thus, this test must correctly identify $\z_2$ and $\z_6$ and must not incorrectly label these partitions as $\z_1$ or $\z_5$. We demonstrate correctness by direct proof of both directions of the bidirectional statement. 
        
        Under the assumption that $X$ and $Y$ are marginally dependent (Section \ref{sec:identifiability}), any $Z \in \z_1 \cup \z_5$ will form a $v$-structure $Z_4 \cdots \rightarrow Y \leftarrow \cdots  Z$, but members of $\z_2 \cup \z_6$ will not (Figure \ref{fig:ten_node_dag}). Such a $v$-structure implies that $Z \ind Z_4$ and $Z \nind Z_4 | X \cup Y$. As we seek to identify candidates $Z$ that do not induce such a $v$-structure, we logically negate these independence statements to test for $\z_2$ and $\z_6$. According to De Morgan's Laws, the negation of a conjunction is the disjunction of the negations. This yields the logical equivalence
        \begin{align}
             \lnot \left[(Z \ind Z_4) \land (Z \nind Z_4 | X \cup Y)\right] & \equiv (Z \nind Z_4) \lor (Z \ind Z_4 | X \cup Y). & \text{Per De Morgan's Laws.}
        \end{align}
        Thus, when $Z \nind Z_4$ or $Z \ind Z_4 | X \cup Y$ is true, we will identify $\z_2 \cup \z_6$ but not $\z_1 \cup \z_5$. Likewise, when $Z \in \z_{2} \cup \z_6$, a $v$-structure $Z_4 \rightarrow Y \leftarrow Z$ will never arise and thus $Z \nind Z_4$ or $Z \ind Z_4 | X \cup Y$. 
\end{proof}

To support Lemmas \ref{proof:step_5}--\ref{proof:step_7}, we introduce Proposition \ref{prop:indirect}.

\begin{proposition} \label{prop:indirect}
    For any $Z_1 \in \z_1$ that has an indirect active path to outcome $Y$, there must exist another $Z_{1}$ that is directly adjacent to $Y$. This extends analogously to indirect active paths between $\z_1$ and $X$. 
\end{proposition}

\begin{lemma} 
    [Step 5 of Algorithm \ref{alg:method}] Given execution of prior steps in Algorithm \ref{alg:method}, if $Y \nind Z \; \land \; Y \ind Z | X \cup \mathbf{Z}' \setminus Z$ then $Z \in \z_{1,2,3,5} \in \z_{\textsc{Mix}}$, and all backdoor paths between $\z_{\textsc{Mix}}$ and $Y$ are blocked by $X$ and the members of $\z$ that have not yet been labeled. \label{proof:step_5}
\end{lemma} 

\vspace{-3mm}

\begin{proof} 
    \textit{Step 5 of Algorithm \ref{alg:method} correctly identifies $\z_{\textsc{Mix}}$.} %This proof follows from the proof provided for Step 3. 
    Here, we will assume that $\z_5$ was not yet discovered at Step 3.
    We will prove that the conditioning set used in Step 5 correctly blocks all backdoor paths between $\z_{\textsc{Mix}}$ and $Y$. Given sufficient conditions \ref{cond:sufficient_2}–\ref{cond:sufficient_4}, $\z_2$, $\z_4$, $\z_6$, and $\z_8$ have been previously identified and removed from further consideration.\footnote{If sufficient condition \ref{cond:sufficient_1} is violated, members of $\z_2$ that were not marginally dependent on any $Z_4 \in \z_4$ (and thus not identified at Step 4) could be placed in $\z_{\textsc{Mix}}$ at Step 5 instead. We prove in Section \ref{sec:adjustment_correctness} that the presence of $\z_{2}$ in $\z_{\textsc{Mix}}$ does not undermine the validity of the adjustment set returned by Algorithm \ref{alg:method}.} Thus, we assume that only $\z_1$, $\z_3$, and $\z_5$ are remaining in $\z'$. By conditioning on $X \cup \z' \setminus Z$, backdoor paths for $\{X,Y\}$ are blocked due to the inclusion of all $\z_1 \in \z'$. 
    %Including members of $\z_3$ and $\z_5$ in the conditioning set does not influence the independence test, as these variables cannot block backdoor paths. 
    Thus, conditioning on $X \cup \z' \setminus Z$ blocks all causal and non-causal association between $Z$ and $Y$. For all $Z \in \z_5$, $Y \ind Z | X \cup \mathbf{Z}' \setminus Z$. For any $Z \in \z_1$ or $Z \in \z_3$ that is not directly adjacent to $Y$, $Y \ind Z | X \cup \mathbf{Z}' \setminus Z$. All members of $\z_1$ and $\z_3$ that are adjacent to $Y$ will proceed to be identified at Step 6. Thus, $\z_{\textsc{Mix}}$ will consist of $\z_5$, a fraction of $\z_1$ (which may be the empty set), and a fraction of $\z_3$ (which may be the empty set).
\end{proof}

\begin{lemma} 
    [Step 6 of Algorithm \ref{alg:method}] Let $\z_{\textsc{Mix}} = \z_{\textsc{Mix}} \cup \z_{5,7}$. Given execution of prior steps in Algorithm \ref{alg:method}, if $\exists \; Z_{\textsc{Mix}} \in \z_{\textsc{Mix}}$ such that $Z_{\textsc{Mix}} \ind Z$ and $Z_{\textsc{Mix}} \nind Z | X$ then $Z \in \z_{1}$ and $Z_{\textsc{Mix}} \in \z_{1,5}$. Else,  $Z \in \z_{\textsc{Post}}$. After execution of these tests, we loop through the remaining $\z_{\textsc{Mix}}$ again. If $\exists \; Z_{1,5} \in \z_{1,5}$ such that $Z_{1,5} \ind Z_{\textsc{Mix}}$ and $Z_{1,5} \nind Z_{\textsc{Mix}} | X$, then $Z_{\textsc{Mix}} \in \z_{1}$. Else, $Z_{\textsc{Mix}} \in \z_{\textsc{Post}}$. \label{proof:step_6}
\end{lemma}

\vspace{-3mm}

\begin{proof} 
    \textit{Step 6 of Algorithm \ref{alg:method} correctly differentiates $\z_{1}$, $\z_{1,5}$, $\z_{7}$, and $\z_{\textsc{Post}}$.} This step relies on prior knowledge of $\z_{\textsc{Mix}}$, which is gained programmatically through Steps 3 and 5. Under sufficient conditions \ref{cond:sufficient_2}–\ref{cond:sufficient_4}, $\z_{\textsc{Mix}}$ initially contains $\z_5$ and the members of $\z_1$ and $\z_3$ that are not adjacent to $Y$. At Step 6, we begin by unioning $\z_{\textsc{Mix}}$ with $\z_{5,7}$ as a safeguard in case any member of $\z_5$ was lumped with $\z_7$ at Step 3.
    
    Step 6 exploits the presence of $v$-structures $Z \cdots \rightarrow X \leftarrow \cdots Z_1$ in $\g$. For any $\g$ (even when sufficient conditions are not met), the variables that can form such a $v$-structure with a $Z_1 \in \z_1$ are 1) a $Z_5 \in \z_5$ or 2) another $Z_1 \in \z_1$ that does not share an active path with the first. %The only other variables that are marginally independent of $\z_1$ are $\z_4$ and $\z_8$, both of which were previously identified. 
    
    First, we prove the first phase of Step 6. Under sufficient condition \ref{cond:sufficient_1}, $\z_5 \cdots \rightarrow X \leftarrow \cdots \z_1$ for all $\{\z_1,\z_5\}$. This means that all of $\z_5$ is marginally independent of $\z_1$, but is conditionally dependent on $\z_1$ given $X$. As described in sufficient condition \ref{cond:sufficient_3}, the existence of at least two non-overlapping backdoor paths in $\g$ can also enable some $Z_1$ to form a $v$-structure at $X$ with another member of $\z_1$. Thus, when a $v$-structure $Z_{\textsc{Mix}} \cdots \rightarrow X \leftarrow \cdots Z$ is detected, then $Z$ must be in $\z_1$ and $Z_{\textsc{Mix}}$ must be in $\z_{1,5}$. By extension, $Z_{\textsc{Mix}}$ is in neither $\z_{\textsc{Post}}$ nor $\z_7$, and can be removed from the latter if it had been placed there at Step 3. Else, $Z$ must be in $\z_{\textsc{Post}}$.

    Finally, we prove the second phase of Step 6. 
    Variables still in $\z_{\textsc{Mix}}$ must be tested to distinguish the remaining members in $\z_1$ from those in $\z_{\textsc{Post}}$. Any ground truth member of $\z_1$ that remains in $\z_{\textsc{Mix}}$ at this point must be marginally dependent on all previously discovered members of $\z_1$, otherwise these would have already been placed in $\z_{1,5}$. By this point, all of $\z_5$ is now contained in $\z_{1,5}$. Under sufficient condition \ref{cond:sufficient_1}, $\z_1 \ind \z_5$ but $\z_{\textsc{Post}} \nind \z_5$. Thus, testing $\z_{\textsc{Mix}}$ against $\z_{1,5}$ for marginal independence will differentiate the remaining $\z_1 \in \z_{\textsc{Mix}}$ from the remaining $\z_{\textsc{Post}} \in \z_{\textsc{Mix}}$.%\footnote{Per the footnote above, some members of $\z_2$ could eventually be placed in $\z_1$ when sufficient condition \ref{cond:sufficient_1} is violated. In Section \ref{sec:adjustment_correctness}, we prove that this occurrence does not negate the validity of the adjustment set returned by LDP.}
\end{proof}


\begin{lemma} 
    [Step 7 of Algorithm \ref{alg:method}] Given execution of prior steps in Algorithm \ref{alg:method}, if $\exists \; Z_{1} \in \z_1$ and $Z_{1,5} \in \z_{1,5}$ such that $Z_{1,5} \nind Z_{1}$, then $Z_{1,5} \in \z_{1}$. Else, $Z_{1,5} \in \z_{5}$. \label{proof:step_7}
\end{lemma} 

\vspace{-3mm}

\begin{proof} 
    \textit{Step 7 of Algorithm \ref{alg:method} correctly differentiates $\z_{1}$ from $\z_{5}$.} This step handles cases exemplified by node $B_1$ in the butterfly structure of Figure \ref{fig:m_butterfly}, which can have  arbitrarily long, indirect, yet active paths to $Y$. During Step 5, the conditioning set $X \cup \z' \setminus Z$ contains all $\z_1$, among other variables. For a $B_1$-type confounder, this conditioning set blocks all backdoor paths to $Y$, triggering the test to label the node as a member of $\z_{\textsc{Mix}}$. To detect such a case, observe that $B_1$-type confounders have marginal dependence on the subset of $\z_1$ that was discovered at Step 6. All $Z_1 \in \z_1$ previously discovered at Step 6 are directly adjacent to $Y$. Under sufficient condition \ref{cond:sufficient_1}, all of $\z_5$ is marginally independent of $\z_{1}$. Even when sufficient condition \ref{cond:sufficient_1} is violated, no member of $\z_5$ will ever be dependent on a $Z_1$ that is directly adjacent to $Y$.
    Therefore, any member of $\z_{1,5}$ that is marginally dependent on at least one member of $\z_{1}$ discovered at Step 6 must be in $\z_1$. If such marginal dependence is not detected between a given $Z_{1,5}$ and any member of $\z_{1}$ discovered at Step 6, then $Z_{1,5} \in \z_5$ instead.
\end{proof}
