% \documentclass{uai2023} % for initial submission
\documentclass[accepted]{uai2023} % after acceptance, for a revised
% version; also before submission to
% see how the non-anonymous paper
% would look like

%% There is a class option to choose the math font
% \documentclass[mathfont=ptmx]{uai2023} % ptmx math instead of Computer
% Modern (has noticable issues)
% \documentclass[mathfont=newtx]{uai2023} % newtx fonts (improves upon
 % ptmx; less tested, no support)
% NOTE: Only keep *one* line above as appropriate, as it will be replaced
%       automatically for papers to be published. Do not make any other
%       change above this note for an accepted version.

%% Choose your variant of English; be consistent
\usepackage[american]{babel}
% \usepackage[british]{babel}
\usepackage{dsfont, amsfonts}

%% Some suggested packages, as needed:
\usepackage{natbib} % has a nice set of citation styles and commands
    \bibliographystyle{plainnat}
    \renewcommand{\bibsection}{\subsubsection*{References}}
\usepackage{mathtools} % amsmath with fixes and additions
% \usepackage{siunitx} % for proper typesetting of numbers and units
\usepackage{booktabs} % commands to create good-looking tables
\usepackage{tikz} % nice language for creating drawings and diagrams
\usepackage{enumitem}
\usepackage{mathabx}

\usepackage{amssymb}
\usepackage{amsthm}
\usepackage[capitalize,noabbrev]{cleveref}


\usepackage{subfiles}
\usepackage{tikz, subcaption}
\usetikzlibrary{positioning}
\usepackage{algorithm}
\usepackage{algpseudocode}
% \usepackage{algorithmic}
% \usepackage[ruled,vlined,linesnumbered]{algorithm2e}
\usepackage{todonotes}
\usepackage{bbm}
\usepackage{centernot}


\newtheorem{theorem}{Theorem}%[section]
\newenvironment{customthm}[1]{\renewcommand\thetheorem{#1}\theorem}{\endtheorem}    
\newtheorem{corollary}{Corollary}%[theorem]
\newtheorem{lemma}{Lemma}
\newtheorem{assumption}{Assumption}
\newenvironment{customlem}[1]{\renewcommand\thelemma{#1}\lemma}{\endlemma}
  
\newenvironment{customtheorem}[1]{\renewcommand\thetheorem{#1}\theorem}{\endtheorem}
  
\newtheorem{proposition}{Proposition}
\newenvironment{customprp}[1]{\renewcommand\theproposition{#1}\proposition}{\endproposition}
\newtheorem{definition}{Definition}
\newtheorem{remark}{Remark}
\newtheorem{claim}{Claim}
\newtheorem{conjecture}{Conjecture}
\newenvironment{myproof}[1][\proofname]{%
  \begin{proof}[#1]$ $\nobreak\ignorespaces
}{%
  \end{proof}
}
\newcommand{\V}[0]{\mathbf{V}}
\newcommand{\C}[0]{\mathbf{C}}
\newcommand{\W}[0]{\mathbf{W}}
\newcommand{\U}[0]{\mathbf{U}}
\newcommand{\E}[0]{\mathbf{E}}
\newcommand{\X}[0]{\mathbf{X}}
\newcommand{\R}[0]{\mathbf{R}}
\newcommand{\Y}[0]{\mathbf{Y}}
\newcommand{\Z}[0]{\mathbf{Z}}
\newcommand{\OO}[0]{\mathbf{O}}
\newcommand{\A}[0]{\mathbf{A}}
\newcommand{\B}[0]{\mathbf{B}}
\newcommand{\T}[0]{\mathbf{T}}
\newcommand{\D}[0]{\mathbf{D}}
\newcommand{\Pa}[2]{\textit{Pa}_{#2}(#1)}
\newcommand{\Ch}[2]{\textit{Ch}_{#2}(#1)}
\newcommand{\Anc}[2]{\textit{Anc}_{#2}(#1)}
\newcommand{\De}[2]{\textit{De}_{#2}(#1)}

\newcommand{\x}[0]{\mathbf{x}}
\newcommand{\y}[0]{\mathbf{y}}
\newcommand{\z}[0]{\mathbf{z}}
\newcommand{\w}[0]{\mathbf{w}}
\newcommand{\dd}[0]{\mathbf{d}}

\newcommand{\G}[0]{\mathcal{G}}
\newcommand{\M}[0]{\mathcal{M}}
\newcommand{\F}[0]{\mathcal{F}}
\newcommand{\dom}[2]{\mathfrak{X}_{#2}(#1)}


\newcommand{\independent}{\perp\!\!\!\perp}
\newcommand{\notindependent}{\centernot{\independent}}

% for cross referencing the main text
% PLEASE ONLY USE xr IN THE SUPPLEMENTARY MATERIAL. 
% In the main paper, hard code any cross-reference to the supplementary material. 
\usepackage{xr}
\makeatletter

\newcommand*{\addFileDependency}[1]{% argument=file name and extension
\typeout{(#1)}% latexmk will find this if $recorder=0
% however, in that case, it will ignore #1 if it is a .aux or 
% .pdf file etc and it exists! If it doesn't exist, it will appear 
% in the list of dependents regardless)
%
% Write the following if you want it to appear in \listfiles 
% --- although not really necessary and latexmk doesn't use this
%
\@addtofilelist{#1}
%
% latexmk will find this message if #1 doesn't exist (yet)
\IfFileExists{#1}{}{\typeout{No file #1.}}
}\makeatother

\newcommand*{\myexternaldocument}[1]{%
\externaldocument{#1}%
\addFileDependency{#1.tex}%
\addFileDependency{#1.aux}%
}
%------------End of helper code--------------

% put all the external documents here!
\myexternaldocument{kivva_47}

%% Provided macros
% \smaller: Because the class footnote size is essentially LaTeX's \small,
%           redefining \footnotesize, we provide the original \footnotesize
%           using this macro.
%           (Use only sparingly, e.g., in drawings, as it is quite small.)

%% Self-defined macros
\newcommand{\swap}[3][-]{#3#1#2} % just an example

\title{On Identifiability of Conditional Causal Effects\\(Supplementary Material)}

% The standard author block has changed for UAI 2023 to provide
% more space for long author lists and allow for complex affiliations
%
% All author information is authomatically removed by the class for the
% anonymous submission version of your paper, so you can already add your
% information below.
%
% Add authors
\author[1]{\href{mailto:<yaroslav.kivva@epfl.ch>?Subject=Your UAI 2023 paper}{Yaroslav Kivva}{}}
\author[1, 3]{Jalal Etesami}
\author[1,2]{Negar Kiyavash}
% % Add affiliations after the authors
\affil[1]{%
    School of Computer and Communication Sciences\\
    EPFL\\
    Lausanne, Switzerland
}
\affil[2]{%
     College of Management of Technology\\
    EPFL\\
    Lausanne, Switzerland
}
\affil[3]{%
   TUM School of Computation, Information and Technology\\
   Technical University of Munich
}
  
\begin{document}
  
\onecolumn %% Turn this off if single column is desired for the supplement

\maketitle
\section{TECHNICAL PROOFS} \label{sec:app}

\subsection{NON c-gID CAUSAL EFFECTS}


For proving Lemma \ref{lemma: construct models subcase 1}, Lemma \ref{lemma: construct models subcase 2} and Lemma \ref{lemma: construct models subcase 3}, it suffices to introduce two models  that agree on the known distributions but disagree:
\begin{itemize}
    \item on the causal effect $Q[\mathbf{L}'|\mathbf{L}'']$ (for Lemma \ref{lemma: construct models subcase 1}),
    
    \item on the causal effect $P_{\x'}(\mathbf{d}|\mathbf{s}\setminus \mathbf{d})$ (for Lemma \ref{lemma: construct models subcase 2}),
    
    \item on the causal effect $P_{\x'}(\widetilde{\mathbf{d}}|\mathbf{s}\setminus \widetilde{\mathbf{d}})$ (for Lemma \ref{lemma: construct models subcase 3}).
\end{itemize}
To do so, we require a result from \citet{kivva2022revisiting} and a couple of definitions and notations, which we present in the next section. 

\subsubsection{Baseline Models} \label{sec: baseline}
In this section, we present two models which we use as our baseline models for proving the non-identifiability parts. 

\begin{theorem}[Theorem 1, \cite{kivva2022revisiting}]\label{th: gid main}
    Suppose $\widecheck{\mathbf{S}} \subseteq \V$ is a single c-component. 
    $Q[\widecheck{\mathbf{S}}]$ is gID from $(\mathbb{A}, \G)$ if and only if there exists $\A \in \mathbb{A}$ such that $\widecheck{\mathbf{S}} \subseteq \A$ and $Q[\widecheck{\mathbf{S}}]$ is ID in $\G[\A]$.
\end{theorem}

To introduce the baseline models, we use the models from the proof of Theorem 1 in \citep{kivva2022revisiting}.
Note that in the proof of Lemma \ref{lemma: construct models subcase 2} and \ref{lemma: construct models subcase 3}, we use $\mathbf{S}_1$ and $\widecheck{\mathbf{S}}$ interchangeably, i.e., $\widecheck{\mathbf{S}} = \mathbf{S}_1$. 

Suppose that $Q[\widecheck{\mathbf{S}}]$ is not gID from $(\mathbb{A}, \G)$ and there exists $i \in [0, m]$, such that $\widecheck{\mathbf{S}} \subset \mathbf{A}_i$. Without loss of generality, let $\widecheck{\mathbf{S}} \subset \mathbf{A}_i$ for $i \in [0, \widecheck{k}]$ and $\widecheck{\mathbf{S}}\nsubseteq 
\mathbf{A}_i$ for $i \in [\widecheck{k}+1, m]$.
This allows us to define a particular graph which we use throughout our proof. 
More precisely, under these assumptions, Lemma \ref{lemma: Q ID} and the above theorem guarantee that for each $i \in [0, \widecheck{k}]$, there exists a $\widecheck{\mathbf{S}}$-rooted c-forest $\F_i$ over a subset of observed variables $\B_i$ ($\widecheck{\mathbf{S}} \subsetneq \B_i \subseteq \A_i$) such that $\F_{0}[\widecheck{\mathbf{S}}]=\F_{j}[\widecheck{\mathbf{S}}]$ for $j\in[1,\widecheck{k}]$.
 In words, induced subgraphs of $\F_{i}$s over the set $\widecheck{\mathbf{S}}$ are the same. 
 We define graph $\G'$ as the union of all the subgraphs in $\{\F_{i}\}_{i=0}^{\widecheck{k}}$ with the observed variables $\widecheck{\V}:=\bigcup_{i=0}^{\widecheck{k}}\B_{i}$ and the  unobserved variables which we denoted by $\widecheck{\U}$. 


To properly define a SEM $\M$ over a causal graph $\G$, it suffices to define the domain set of each node $X$ in $\G$ with its associated conditional distribution $P(X|\Pa{X}{\G})$. 
Note that if for some variable $X$ in $\G$, its domain $\dom{X}{}$ or $P(X|\Pa{X}{\G})$ are not specified, then by default, we assume \mbox{$\dom{X}{} := \{0\}$} and $P(X=0|\Pa{X}{\G})=1$. 

\renewcommand{\V}{\widecheck{\mathbf{V}}}
\renewcommand{\U}{\widecheck{\mathbf{U}}}
\renewcommand{\T}{\widecheck{\mathbf{T}}}
\renewcommand{\u}{\widecheck{\mathbf{u}}}
\renewcommand{\k}{\widecheck{k}}

Let $U_0$ be an unobserved variable from subgraph $\F_0$ that has one child in $\widecheck{\mathbf{S}}$ and one child in $\T:=\V\setminus \widecheck{\mathbf{S}}$.
At a high level, our baseline models $\M_1$ and $\M_2$ have the same distributions over all variables in graph $\G$ except for the variable $U_0$. Specifically,
\begin{align}
    & P^{\M_1}(V|\Pa{V}{\G}) = P^{\M_2}(V|\Pa{V}{\G}),\quad \forall V \in \mathbf{V}, \label{eq: M_1(V) = M_2(V)}\\
    & P^{\M_1}(U) = P^{\M_2}(U) = \frac{1}{|\dom{U}{}|}, \quad \forall U \in \mathbf{U}\setminus \{U_0\}, \label{eq: M_1(U) = M_2(U)}
\end{align}
where $|\cdot|$ denotes the cardinality of a given set. For the sake of brevity, we drop the superscripts $\M_1$ and $\M_2$ for the distributions in Equations (\ref{eq: M_1(V) = M_2(V)}) and (\ref{eq: M_1(U) = M_2(U)}). 
We denote the domain of variable $U_0$ to be $\dom{U_0}{} := \{ \gamma_1, \dots, \gamma_d\}$, where $\gamma_j$s are vectors and $d$ is an integer number to be defined later.  
In model $\M_1$, we define $U_0$ to have uniform distribution over $\dom{U_0}{}$, i.e., $P^{\M_1}(U_0 = \gamma_j) = 1/d$. 
In model $\M_2$, we define $P^{\M_2}(U_0 = \gamma_j) := p_j$, where $j \in [1:d]$ and 
\begin{align*}
    & \sum_{j=1}^d p_j = 1, \\
    & p_j > 0 \quad \forall j \in [1:d].
\end{align*}

For $i \in [0:m]$, $j \in [1:d]$, $u_0 = \gamma_j$ and any $\mathbf{v} \in \dom{\mathbf{V}}{}$, we define:
\begin{equation} \label{eq: theta and eta}
\begin{gathered}
    \theta_{i, j}(\mathbf{v}) := \sum_{\mathbf{U} \setminus \{U_0\}} \prod_{X \in \A_i} P(x \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}} P(u), \\
    \eta_j(\mathbf{v}) := \sum_{\mathbf{U}\setminus \{U_0\}} \prod_{X \in \widecheck{\mathbf{S}}} P(x \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U}\setminus \{U_0\}} P(u).
\end{gathered}
\end{equation}


Note that in the above equations, $u_0=\gamma_j$ may appear as a parent of an observed variable. 
Using the above definitions, we can re-write the $Q$-notation in Equation (\ref{eq: Q}) as follows
\begin{align}\label{eq: M1 Q[A_i] through thetha}
    & Q^{\M_1}[\mathbf{A}_i](\mathbf{v}) 
    = \sum_{j=1}^d \frac{1}{d} \theta_{i,j}(\mathbf{v}), \\ \label{eq: M_2 Q[A_i] through thetha}
    & Q^{\M_2}[\mathbf{A}_i](\mathbf{v}) 
    = \sum_{j=1}^d p_j \theta_{i,j}(\mathbf{v}), \\
    \label{eq: M_1 Q[S_1] through eta}
    & Q^{\M_1}[\widecheck{\mathbf{S}}](\mathbf{v}) 
    = \sum_{j=1}^d \frac{1}{d} \eta_j(\mathbf{v}), \\
    \label{eq: M_2 Q[S_1] through eta}
    & Q^{\M_2}[\widecheck{\mathbf{S}}](\mathbf{v}) 
    = \sum_{j=1}^d p_j \eta_j(\mathbf{v}).
\end{align}

Denote the set of unobserved variables in $\G'[\widecheck{\mathbf{S}}]$ by $\U^{\widecheck{\mathbf{S}}}$ and the set of remaining unobserved variables, $\U \setminus (\U^{\widecheck{\mathbf{S}}} \cup \{U_0\})$, by $\U^{\T}$. 
For each $i \in [0:\k]$, let $\widecheck{T}_i$ be a node in $\B_i\setminus \widecheck{\mathbf{S}}$ such that $\Ch{\widecheck{T}_i}{\F_i}\neq \emptyset$. Node $\widecheck{T}_i$ exists because $\F_i$ is a $\widecheck{\mathbf{S}}$-rooted c-forest. 
Figure \ref{fig:van} illustrates an example of the above definitions. 
\begin{figure}
    \centering
    \includegraphics[scale=0.2]{baseline_notation.png}
    \caption{An illustration of the definitions $\B_i,U_0,\A_i,\widecheck{\mathbf{S}}$, and $\widecheck{T}_i$.}
    \label{fig:van}
\end{figure}

We define the domains of $X\in\V\cup \U$ as follows.
Note that $\V = \widecheck{\mathbf{S}} \cup \T$ and $\U = \U^{\widecheck{\mathbf{S}}}\cup \U^{\T}\cup \{ U_0\}$.
\begin{align*}
    &\dom{X}{} := [0:\kappa], \quad \forall X \in \widecheck{\mathbf{S}},\\
    &\dom{X}{} := [0:\kappa], \quad \forall X \in \U^{\widecheck{\mathbf{S}}},\\
    &\dom{X}{} := \{0, 1\}^{\alpha(T)}, \quad \forall X \in \T,\\
    &\dom{X}{} := \{0, 1\}^{\alpha(U)}, \quad \forall X \in \mathbf{U}^{\T},\\
    &\dom{X}{} := [0:\kappa]\times\{0, 1\}^{\alpha(U_0)-1}, \quad X=U_0,
\end{align*}
where $\kappa$ is an odd number greater than 4. 
Function $\alpha(X)$ is only defined for $X \in \T\cup\U^{\T}\cup \{U_0\}$ and it denotes the number of subgraphs in $\{\F_j\}_{j=0}^{\k}$ that contains $X$.
From the above definition, it is clear that $d$, the domain size of $U_0$ is equal to $(\kappa+1)2^{\alpha(U_0)-1}$. 
 %Note that each of the variables from $\mathbf{V}\cup \mathbf{U}$ we can represent as a vector of random variables.


Suppose that $X\in \T\cup\U^{\T}\cup\{U_0\}$ and $X$ belongs to $\F_{i_1}, \F_{i_2}, \cdots, \F_{i_{\alpha(X)}}$, where $i_1 < i_2 < \dots < i_{\alpha(X)}$. 
We use $(X[i_1], X[i_2], \dots, X[i_{\alpha(X)}])$ to represent $X$. Note that the length of this vector depends on the number of subgraphs that contain $X$.
%Further, we define the distributions $P(X|\Pa{X}{\G})$ for each variable $X$ in the set $(\V \cup \U) \setminus \{U_0\}$.- Where do you define $P(X|\Pa{X}{\G})$? If you define it by considering where $X$ comes from , then you have to mention it. like if $X\in \T$ then ... 
If $X\in\U^{\T}\cup\{U_0\}$, both its distribution and its domain are specified above. 
If $X\in\T$, we define the entries of its corresponding vector as
\begin{equation*}
    X[i_j] \equiv \left(\sum_{Y \in \Pa{X}{\F_{i_j}}} Y[i_j]\right) \pmod{2},
\end{equation*}
where $j\in[1:\alpha(X)]$. This specifies the distribution of $P(X|\Pa{X}{\G})$ for $X\in\T$.
What is left to specify is the domains and the distributions of variables in $\widecheck{\mathbf{S}}$. 
     
Recall that $U_0$ has one child in $\widecheck{\mathbf{S}}$ and one child in $\T$. We denote the child in $\widecheck{\mathbf{S}}$ by $S_0$.
For each $S \in \widecheck{\mathbf{S}}\setminus \{S_0\}$ and any realization of $\Pa{S}{\G'}$, 
we define $\mathbb{I}(S)$ to be one if there exists $i\in [0:\k]$ such that
\begin{enumerate}
    \item $\widecheck{T}_i \in \Pa{S}{\G'}$ and $\widecheck{T}_i[i]=0$, or
    \item there exists $X \in \Pa{S}{\G'} \setminus (\U^{\widecheck{\mathbf{S}}}\cup \{\widecheck{T}_i\})$ such that $\F_i$ contains $X$ and $X[i]=1$,
\end{enumerate}
and zero, otherwise.
It is noteworthy that according to the definition of $\widecheck{T}_i$, it belongs to $\B_i\setminus\widecheck{\mathbf{S}}\subseteq\T$ which means $\widecheck{T}_i[i]$ is well-defined according to the above definition. 
Note that the above definition holds for all $S \in \widecheck{\mathbf{S}}\setminus \{S_0\}$. When $S=S_0$, we define $\mathbb{I}(S_0)$
to be one if there exists $i\in [0:\k]$, such that
\begin{enumerate}
    \item $\widecheck{T}_i \in \Pa{S}{\G'}$ and $\widecheck{T}_i[i]=0$, or
    \item $i\neq0$, $\mathcal{F}_i$ contains $U_0$, and $U_0[i]=1$, or
    \item there exists $X \in \Pa{S}{\G'} \setminus (\U^{\widecheck{\mathbf{S}}}\cup \{\widecheck{T}_i,U_0\})$ such that $\F_i$ contains $X$ and $X[i]=1$.
\end{enumerate}

For each $S\in \widecheck{\mathbf{S}}$, we define $\dom{S}{}:=\{0,...,\kappa\}$ and for $s \in \dom{S}{}$,
\begin{equation} \label{eq: def P(S|Pa(S)) gid}
P(S=s \mid \Pa{S}{\G}):=\begin{cases} 
    \frac{1}{\kappa+1} & \text{ if } \mathbb{I}(S)=1\\
    1-\kappa\epsilon &  \text{ if } \mathbb{I}(S)=0  \text{ and } s \equiv M(S) \pmod{\kappa+1}, \\
    \epsilon &  \text{ if }  \mathbb{I}(S)=0  \text{ and } s\not\equiv M(S) \pmod{\kappa+1},
\end{cases}
\end{equation}
where $0<\epsilon<\frac{1}{\kappa}$ and 
\begin{equation}
M(S):=
\begin{cases} \label{eq: M(S)}
    \sum_{x\in \Pa{S}{\G'[\widecheck{\mathbf{S}}]}}x & \text{, if } S\in \widecheck{\mathbf{S}}\setminus \{S_0\}, \\
    u_0[0]+\sum_{x\in \Pa{S}{\G'[\widecheck{\mathbf{S}}]}}x & \text{, if $S=S_0$ }.
\end{cases}
\end{equation}
Note that $M(S)$ is an integer number because $\Pa{S}{\G'[\widecheck{\mathbf{S}}]}\subseteq \U^{\widecheck{\mathbf{S}}}$ and thus all terms in the summations in \eqref{eq: M(S)} belong to $[0:\kappa]$. With this, we finish defining the models and now we are ready to present some of their properties.

%Note that the models introduced in this section are identical to the ones introduced in the \cite[Theorem 1]{kivva2022revisiting}. 



Let $\mathbf{\Gamma}$ denote a subset of $\dom{U_0}{}=\{\gamma_1,...,\gamma_d\}$ with $\frac{\kappa+1}{2}$ elements that is given by
\begin{equation*}% module is redundant here
    \mathbf{\Gamma} := \Big\{(2x,0,\cdots,0)\!:\: x\in [0:\frac{\kappa-1}{2}]\Big\}.
\end{equation*}
Recall that for $\mathbf{v}\in \dom{\mathbf{V}}{}$ and $i\in[0:m]$, $\theta_i(\mathbf{v})$ and $\eta(\mathbf{v})$ are two vectors in $\mathbb{R}^d$ with $j$-th entry corresponding to $U_0=\gamma_j$. 
Suppose that $\mathbf{\Gamma}=\{\gamma_{j_1},...,\gamma_{j_{\frac{\kappa+1}{2}}}\}$. The next result shows that in the constructed models, all entries of $\theta_i(\mathbf{v})$ with indices in $\{j_1,...,j_{\frac{\kappa+1}{2}}\}$ are equal.

\begin{lemma}[\cite{kivva2022revisiting}]
    \label{lemma: gid equal indices}
    For any $\mathbf{v} \in \dom{\mathbf{V}}{}$,  $i\in[0:m]$, and both models, we have
    \begin{equation*}
        \theta_{i,j_1}(\mathbf{v}) = \theta_{i,j_2}(\mathbf{v}) = \cdots= \theta_{i,j_{\frac{\kappa+1}{2}}}(\mathbf{v}).
    \end{equation*}
\end{lemma}


The next two lemmas are used to prove the existence of parameters $\epsilon$ and $\{p_j\}_{j=1}^d$ such that the constructed models $\M_1$ and $\M_2$ agree on the known distributions but disagree on the target causal effect.
\begin{lemma}[\cite{kivva2022revisiting}]
    \label{lemma: gid not equal indices}
    There exists $0<\epsilon<\frac{1}{\kappa}$ such that there exists $\mathbf{v}_0 \in \dom{\mathbf{V}}{}$ and $1\leq r <t\leq \frac{\kappa+1}{2}$ such that 
    \begin{equation*}
        \eta_{j_r}(\mathbf{v}_0) \neq \eta_{j_t}(\mathbf{v}_0).
    \end{equation*}
\end{lemma}

\begin{lemma}[\cite{kivva2022revisiting}]
    \label{lemma: lin indep formal}
    Consider a set of vectors $\{c_i\}_{i=1}^{n}$, where $c_i \in \mathbb{R}^d$. Assume $c\in \mathbb{R}^d$ is a vector that is linearly independent of $\{c_i\}_{i=1}^{n}$, then there is a vector $b\in \mathbb{R}^d$ such that
    \begin{align*}
        & \langle c_i, b \rangle = 0, \quad \forall i \in [1:n],\\
        & \langle c, b \rangle \neq 0.
    \end{align*}
\end{lemma}


\subsection{Proof of Lemma \ref{lemma: construct models subcase 1}}

\let\oldS\S
\renewcommand{\S}{\widecheck{\mathbf{S}}}
\newcommand{\s}{\widecheck{\mathbf{s}}}


Herein, we present the proof of our first lemma. But first, we need the following technical lemmas.
Assume that $\S'$ and $\S''$ are two disjoint non-empty subsets of $\S$, such that $\S = \S' \cup \S''$. 
% {\color{blue}
% what do you mean here?
% $u_0$ is changes for different $j$? or there exists a $j$ such that $u_0 = \gamma_j$ .
% }

% {
% \color{red} We make $u_0$ equal to $\gamma_j$ and after we define $\phi_j(\cdot)$. We do it because $\phi_j(\cdot)$ implicitly depends on the value of $u_0$, i.e. . 
% }
Let $\S^{\dagger}:=\mathbf{V} \setminus \S'$ and $\s^{\dagger} \in \dom{\S^{\dagger}}{}$. For $u_0=\gamma_j$, where $j \in [1:d]$, we define
 \begin{equation} \label{eq: phi subcase 1}
    \phi_j(\s^{\dagger}) := \sum_{\S'} \sum_{\U\setminus\{U_0\}} \prod_{X\in \S} P(x | \Pa{X}{\G}) \prod_{U \in \U\setminus \{U_0\}}P(u).
\end{equation}
Note that $U_0$ may appear as a parent of some observed variables in the above equation. 
Recall that $\mathbf{\Gamma}=\{\gamma_{j_1},...,\gamma_{j_{\frac{\kappa+1}{2}}}\}$. 

%First, we prove the following lemma.
\begin{lemma} \label{lemma: equal indices summation subcase 1}
    For any $\s^{\dagger} \in \dom{\S^{\dagger}}{}$ and both models,  we have
    \begin{equation*}
        \phi_{j_1}(\s^{\dagger}) = \phi_{j_2}(\s^{\dagger})=\dots = \phi_{j_{\frac{\kappa+1}{2}}}(\s^{\dagger}).
    \end{equation*}
\end{lemma}
\begin{proof}
    We fix a realization $\s^{\dagger}$ of $\S^{\dagger}$.
    Suppose that $l_1$ and $l_2$ are two integers, such that
    \begin{equation*}
    \begin{split}
        & \gamma_{l_1} = (2x, 0, \dots, 0),\\
        & \gamma_{l_2} = (2x+2 \pmod{\kappa+1}, 0, \dots, 0),
    \end{split}
    \end{equation*}
    and $x$ is an integer in $[0 : \frac{\kappa-1}{2}]$.
   % Furthermore,  we show that $\phi_{ l_1}(\s'')=\phi_{l_2}(\s'')$.
    Recall that 
    \begin{equation*}
        \phi_j(\s^{\dagger}) := \sum_{\S'} \sum_{\U\setminus\{U_0\}} \prod_{X\in \S} P(x | \Pa{X}{\G}) \prod_{U \in \U\setminus \{U_0\}}P(u).
    \end{equation*}
    We consider two cases:
    \begin{enumerate}
        \item Suppose that there exists a variable $S \in \S$ such that $\mathbb{I}(S)=1$. Then, there is a sequence of variables $U_0, \hat{S}_1, \hat{U}_1, \hat{S}_2, \hat{U}_2, \dots, \hat{U}_l, S$, such that $U_0$ is a parent of $\hat{S}_1$, $S\in \S$ is a child of $\hat{U}_l \in \U^{\S}$ and $\hat{U}_j \in \U^{\S}$ is a parent of variables $\hat{S}_j$ and  $\hat{S}_{j+1}$ for $j \in [1:l-1]$. 
    Let $\hat{\mathbf{U}}:=\{\hat{U}_1, \dots, \hat{U}_l\}$. 
    For a given realization $\mathbf{u}_{1}$ of $\U^{\S}$,  we define $\mathbf{u}_{2} \in \dom{\U^{\S}}{}$ by
    \begin{equation}
        \begin{split}
            & \mathbf{u}_{2}[\hat{U}_j] := \mathbf{u}_{1}[\hat{U}_j] + 2(-1)^{j} \pmod{\kappa+1}, \quad j\in[1:l],\\
            & \mathbf{u}_{2}[U] := \mathbf{u}_{1}[U], \quad \forall U\in \U^{\S} \setminus \hat{\mathbf{U}}.
        \end{split}
    \end{equation}
    This implies
    \begin{equation*}
    P(\hat{s}|\Pa{\hat{S}}{\G})\Big|_{(\U^{\S},U_0)=(\mathbf{u}_1,\gamma_{l_1})}=P(\hat{s}|\Pa{\hat{S}}{\G})\Big|_{(\U^{\S},U_0)=(\mathbf{u}_2,\gamma_{l_2})},
    \end{equation*}
    for any $\hat{S} \in \S$ and consequently,  $\phi_{l_1}(\s^{\dagger})=\phi_{l_2}(\s^{\dagger})$.
    
    
    \item Suppose that there is no variable in $\S$ with $\mathbb{I}(\cdot)=1$. 
    Denote by $S$ a node in $\S'$ with the shortest path to the node $U_0$ by bidirected edges. Suppose $\hat{s}$ is a realization of $S$ and the shortest path is  $U_0, \hat{S}_1, \hat{U}_1, \hat{S}_2, \hat{U}_2, \dots, \hat{U}_l, S$, so that $U_0$ is a parent of $\hat{S}_1$, $S$ is a child of $\hat{U}_l \in \U^{\S}$ and $\hat{U}_j \in \U^{\S}$ is a parent of variables $\hat{S}_j$ and  $\hat{S}_{j+1}$ for $j \in [1:l-1]$. 
    Let $\hat{\mathbf{U}}:=\{\hat{U}_1, \dots, \hat{U}_l\}$. 
    For a given realization $\mathbf{u}_{1}$ of $\U^{\S}$,  we define $\mathbf{u}_{2} \in \dom{\U^{\S}}{}$ by
    \begin{equation}
        \begin{split}
            & \mathbf{u}_{2}[\hat{U}_j] := \mathbf{u}_{1}[\hat{U}_j] + 2(-1)^{j} \pmod{\kappa+1}, \quad j\in[1:l],\\
            & \mathbf{u}_{2}[U] := \mathbf{u}_{1}[U], \quad \forall U\in \U^{\S} \setminus \hat{\mathbf{U}}.
        \end{split}
    \end{equation}
    For a given realization $\s_1$ of $\S'$, we define $\s_2 \in \dom{\S'}{}$   as follows
    \begin{equation}
        \begin{split}
            & \s_2[S''] := \s_1[S''], \quad \forall  S''\in\S'\setminus\{S\},\\
            &  \s_2[S] := \s_1[S]+2(-1)^l \pmod{\kappa+1}.
        \end{split}
    \end{equation}
    Note that with the above modifications for any $\widetilde{S} \in \S$, we get
    \begin{equation*}
        \widetilde{s}_1 - M(\widetilde{S}) \equiv \widetilde{s}_2 - M(\widetilde{S}) \pmod{\kappa+1},
    \end{equation*}
    where $\widetilde{s}_1$ is a realization of $\widetilde{S}\Big|_{(\S^{\dagger},\S')=(\s^{\dagger},\s_1)}$, $\widetilde{s}_2$ is a realization of $\widetilde{S}\Big|_{(\S^{\dagger}, \S')=(\s^{\dagger}, \s_2)}$, and $M(\cdot)$ is given by Equation (\ref{eq: M(S)}).
    Therefore:
    \begin{equation*}
    P(\widetilde{s}|\Pa{\widetilde{S}}{\G})\Big|_{(\U^{\S},U_0, S)=(\mathbf{u}_1,\gamma_{l_1}, s_1)}=P(\widetilde{s}|\Pa{\widetilde{S}}{\G})\Big|_{(\U^{\S},U_0, S)=(\mathbf{u}_2,\gamma_{l_2}, s_2)},
    \end{equation*}
    for any $\widetilde{S} \in \S$ and thus $\phi_{l_1}(\s^{\dagger})=\phi_{l_2}(\s^{\dagger})$.
    \end{enumerate}
    
    To summarize, we proved that $\phi_{l_1}(\s^{\dagger})=\phi_{l_2}(\s^{\dagger})$. By varying $x$ within $[0 : \frac{\kappa-1}{2}]$ in the definition of $\gamma_{l_1}$ and $\gamma_{l_2}$, we  conclude the lemma.
\end{proof}

%\paragraph{Proof of Lemma 1}

In order to have consistent notations in the appendix, we restate Lemma \ref{lemma: construct models subcase 1} using $\widecheck{\mathbf{S}}, \S', \S''$ instead of $\mathbf{L}, \mathbf{L}', \mathbf{L}''$ respectively.
\begin{customlem}{\ref{lemma: construct models subcase 1}}
    Suppose $\S\subseteq \V$ is a single c-component, such that $\S = \S'\cup\S''$ for some disjoint sets $\S'$ and $\S''$. 
    $Q[\S'|\S'']$ is c-gID from $(\mathbb{A}, \G)$ if and only if $Q[\S'\cup \S'']$ is gID from $(\mathbb{A}, \G)$.
\end{customlem}



\begin{proof}
\hfill\\
    \textbf{Sufficiency:} Assume that $Q[\S'\cup \S'']$ is gID from $(\mathbb{A}, \G)$. Then $Q[\S'|\S'']$ is c-gID from $(\mathbb{A}, \G)$, which is an immediate consequence of Equation \eqref{eq: conditional Q}, i.e., 
    \begin{equation*}
        Q[\S'|\S''](\mathbf{v}) = \frac{Q[\S](\mathbf{v})}{\sum_{\S'} Q[\S](\mathbf{v})}.
    \end{equation*}

    \textbf{Necessity:}
    We prove this by contraposition. Assume that $Q[\S'\cup \S'']$ is not gID from $(\mathbb{A}, \G)$. We will show  that $Q[\S'|\S'']$ is not c-gID from $(\mathbb{A}, \G)$. 
    To this end, we will construct two models $\M_1$ and $\M_2$ such that for each $i \in [0:m]$ and any $\mathbf{v}\in \dom{\mathbf{V}}{}$:
    \begin{align}
        \label{eq: equal known dist subcase 1}
        Q^{\M_1}[\A_i](\mathbf{v}) &= Q^{\M_2}[\A_i](\mathbf{v}),\\
        \label{eq: equal denom num subcase 1}
        \sum_{\S'}Q^{\M_1}[\S](\mathbf{v}) &= \sum_{\S'}Q^{\M_2}[\S](\mathbf{v}),
    \end{align}
    but there exists $\mathbf{v}_0 \in \dom{\mathbf{V}}{}$ such that:
    \begin{equation}\label{eq: not equal num subcase 1}
        Q^{\M_1}[\S](\mathbf{v}_0) \neq Q^{\M_2}[\S](\mathbf{v}_0).
    \end{equation}
    Equations (\ref{eq: equal denom num subcase 1})-(\ref{eq: not equal num subcase 1}) yield
    \begin{equation*}
         Q[\S'|\S'']^{\M_1}(\mathbf{v}_0) \neq Q[\S'|\S'']^{\M_2}(\mathbf{v}_0).
    \end{equation*}
    This means that $Q[\S'|\S'']$ is not c-gID from $(\mathbb{A}, \G)$.

    We consider two cases.

    \paragraph{First case:} 
    Suppose that there exists $i \in [0, m]$, such that $\widecheck{\mathbf{S}} \subset \mathbf{A}_i$.
    For this case, we consider the models constructed in Section~\ref{sec: baseline}. For these models, we have
    \begin{align}
        & \sum_{\S'} Q[\S]^{\M_1}(\mathbf{v}) = \sum_{j=1}^d \frac{1}{d}\phi_{j}(\mathbf{v}[\S^{\dagger}]), \\
        & \sum_{\S'} Q[\S]^{\M_2}(\mathbf{v}) = \sum_{j=1}^d p_j\phi_{j}(\mathbf{v}[\S^{\dagger}]),
    \end{align}
    and according to Equations \eqref{eq: theta and eta} and \eqref{eq: phi subcase 1}, we have
    \begin{align}
        & Q^{\M_2}[\A_i](\mathbf{v}) - Q^{\M_1}[\A_i](\mathbf{v}) = \sum_{j=1}^d (p_j - \frac{1}{d}) \theta_{i,j}(\mathbf{v})
        \\
        & \hspace{-0.5cm}\sum_{\S'} Q[\S]^{\M_2}(\mathbf{v}) - \sum_{\S'} Q[\S]^{\M_1}(\mathbf{v}) = \sum_{j=1}^d (p_j - \frac{1}{d}) \phi_{j}(\mathbf{v}[\S^{\dagger}])
        \\
        & Q^{\M_2}[\S](\mathbf{v}_0) -  Q^{\M_1}[\S](\mathbf{v}_0) = \sum_{j=1}^d (p_j - \frac{1}{d}) \eta_{j}(\mathbf{v}_0)
        \\
        & \sum_{j=1}^d p_j - 1 = \sum_{j=1}^d (p_j - \frac{1}{d})
    \end{align}
    
    
     Therefore, it suffices to solve a system of linear equations over parameters $\{p_j\}_{j=1}^d$ and show that it admits a solution. 
    \begin{align}
        \label{eq: linear system start}
        & \sum_{j=1}^d (p_j - \frac{1}{d}) \theta_{i,j}(\mathbf{v}) = 0, \hspace{0.2cm}\forall \mathbf{v} \in \dom{\mathbf{V}}{}, i\in [0,m],
        \\
        & \sum_{j=1}^d (p_j - \frac{1}{d}) \phi_{j}(\s^{\dagger}) = 0, \hspace{0.2cm}\forall \s^{\dagger} \in \dom{\S^{\dagger}}{},
        \\
        & \sum_{j=1}^d (p_j - \frac{1}{d}) \eta_{j}(\mathbf{v}_0) \neq 0, \hspace{0.2cm} \exists \mathbf{v}_0 \in \dom{\V}{},
        \\
        & \sum_{j=1}^d (p_j - \frac{1}{d}) = 0,
        \\
        \label{eq: linear system end}
        & 0<p_j<1, \hspace{0.2cm} \forall j \in [1:d].
    \end{align}

    However, the system of linear equations (\ref{eq: linear system start})-(\ref{eq: linear system end}) admits a solution with respect to $\{p_j\}_{j=1}^d$ if and only if the following system of equations has a solution with respect to parameters $\{\beta_j\}_{j=1}^{d}$:
    \begin{align}
        \label{eq: homogenous linear system start}
        &\sum_{j=1}^d \beta_j \theta_{i,j}(\mathbf{v}) =0, \hspace{0.2cm}\forall \mathbf{v} \in \dom{\mathbf{V}}{}, i \in [0:m]\\
        &\sum_{j=1}^d \beta_j \phi_{j}(\s^{\dagger}) =0, \hspace{0.2cm}\forall \s^{\dagger} \in \dom{\S^{\dagger}}{}\\
        \label{eq: homogenous linear system ineq}
        &\sum_{j=1}^d \beta_j \eta_j(\mathbf{v}_0) \neq 0, \hspace{0.2cm} \exists \mathbf{v}_0 \in \dom{\mathbf{V}}{}\\
        \label{eq: homogenous linear system end}
        & \sum_{j=1}^d \beta_j=0.
    \end{align}
    Clearly, if $\{\beta_j^*\}$ is a solution for system (\ref{eq: homogenous linear system start})-(\ref{eq: homogenous linear system end}), then 
    \begin{equation}
        p_j^*:=\frac{1}{d}+\frac{\beta_j^*}{2hd},
    \end{equation}
    is a solution for \eqref{eq: linear system start}-\eqref{eq: linear system end}, where $h := \max_{j \in [1:d]} |\beta^*_j|$.

    According to Lemma \ref{lemma: gid equal indices} and Lemma \ref{lemma: equal indices summation subcase 1}, for any $i\in [0:m]$, $\mathbf{v} \in \dom{\mathbf{V}}{}$ and  $\s^{\dagger} \in \dom{\S^{\dagger}}{}$, we have
    \begin{align*}
        & \theta_{i,j_1}(\mathbf{v}) = \theta_{i,j_2}(\mathbf{v}) = \cdots= \theta_{i,j_{\frac{\kappa+1}{2}}}(\mathbf{v}), \\
        & \phi_{j_1}(\s^{\dagger}) = \phi_{j_2}(\s^{\dagger})=\dots = \phi_{j_{\frac{\kappa+1}{2}}}(\s^{\dagger}),
    \end{align*}
    and by Lemma \ref{lemma: gid not equal indices}, we know that there exists $\mathbf{v}_0 \in \dom{\mathbf{V}}{}$ and $1\leq r <t\leq \frac{\kappa+1}{2}$ such that 
    \begin{equation*}
        \eta_{j_r}(\mathbf{v}_0) \neq \eta_{j_t}(\mathbf{v}_0).
    \end{equation*}
    The latter means that the vector $\big(\eta_{1}(\mathbf{v}_0), \eta_{2}(\mathbf{v}_0), \dots, \eta_{d}(\mathbf{v}_0)\big)$ is linearly independent from vectors:
    \begin{align}
        & \big(1, 1, \dots, 1\big),
        \\
        & \big(\theta_{i, 1}(\mathbf{v}), \theta_{i, 2}(\mathbf{v}), \dots, \theta_{i, d}(\mathbf{v})\big), \hspace{0.2cm} \forall \mathbf{v}\in \dom{\mathbf{V}}{},\quad \forall i\in[0:m],\\
        & \big(\phi_{1}(\s^{\dagger}), \phi_{2}(\s^{\dagger}), \dots, \phi_{d}(\s^{\dagger})\big), \hspace{0.2cm} \forall \s^{\dagger}\in \dom{\S^{\dagger}}{}.
    \end{align}
    Combining the last result with Lemma \ref{lemma: lin indep formal} implies the existence of a solution  $\{\beta_j^*\}$ and  subsequently the existence of two models $\M_1$ and $\M_2$ that satisfy Equations \eqref{eq: equal known dist subcase 1}, \eqref{eq: equal denom num subcase 1} and \eqref{eq: not equal num subcase 1}. %This concludes the proof of the Necessity part.
    
    \paragraph{Second case:}
    Suppose that there is no $i \in [0:m]$ such that $\S \subset \mathbf{A}_i$. Let $S^*\in \S$ and denote by $\G^*$ the graph obtained from graph $\G$ through the following procedure:
    \begin{enumerate}
        \item Add nodes $T_0^*$ and $U_0^*$ to graph $\G$.
        \item Draw a direct edge from $T_0^*$ to $S^*$.
        \item Draw direct edges from $U_0^*$ to $S^*$ and $T_0^*$.
    \end{enumerate}
    We define $\mathbf{A}_{m+1} := \S \cup \{T_0^*\}$ and $\mathbb{A}^* := \mathbb{A}\cup \{\A_{m+1}\}$. To summarize, we have
    \begin{itemize}
        \item $\mathbf{V}$ is a set of all observed variables in graph $\G$;
        \item $\mathbf{U}$ is a set of all unobserved variables in graph $\G$;
        \item $\mathbf{V}^* = \mathbf{V}\cup \{T_0^*\}$;
        \item $\mathbf{U}^* = \mathbf{U}\cup \{U_0^*\}$.
    \end{itemize}
    Note that $Q[\S]$ is not identifiable in $\G^*[\A_{m+1}]$ and therefore $Q[\S]$ remains not gID from $(\mathbb{A}^*, \G^*)$. Since $\S \subset \A_{m+1}$, according to the \textbf{First case}, we can construct models $\M_1^*$ and $\M_2^*$ for the graph $\G^*$ and set $\mathbb{A}^*$. These two models satisfy the following properties:
    \begin{itemize}
        \item $\dom{U_0^*}{} = [0:\kappa]$ and $d=\kappa+1$.
        \item $\dom{T_0^*}{} = \{0, 1\}$.
    \end{itemize}
    For the graph $\G^*$, we define 
    \begin{align*}
        & \theta_{i, j}(\mathbf{v}, T_0^*=t_0) := \sum_{\mathbf{U}} \prod_{X \in \A_i} P(x \mid \Pa{X}{\G^*}) \prod_{U\in \mathbf{U}} P(u), \quad i\in [0:m], \; j\in [1:d], \\
        & \theta_{m+1, j}(\mathbf{v}, T_0^*=t_0) := \sum_{\mathbf{U}} P(T_0^*=t_0)\prod_{X \in \A_i} P(x \mid \Pa{X}{\G^*}) \prod_{U\in \mathbf{U}} P(u), \quad j\in [1:d], \\
        & \phi_j(\s^{\dagger}) := \sum_{\S'} \sum_{\U} \prod_{X\in \S} P(x | \Pa{X}{\G^*}) \prod_{U \in \U}P(u), \quad j \in [1:d] \\
        & \eta_{j}(\mathbf{v}, T_0^*=t_0) := \sum_{\mathbf{U}} \prod_{X \in \widecheck{\mathbf{S}}} P(x \mid \Pa{X}{\G^*}) \prod_{U\in \mathbf{U}} P(u).
    \end{align*} 
Now, we are ready to construct two models $\M_1$ and $\M_2$ for $\G$.
\begin{itemize}
    \item  For all $S \in \S \setminus \{S^{*}\}$, we define
    \begin{equation*}
        P^{\M_i}(S|\Pa{S}{\G}) := P(S|\Pa{S}{\G^*}), \quad i\in\{1,2\}.
    \end{equation*}
    \item For $S=S^*$, we define
    \begin{align*}
        & P^{\M_1}(S|\Pa{S}{\G}) := P(S|\Pa{S}{\G}, T_0^*=1, U_0^*=0), \\
        & P^{\M_2}(S|\Pa{S}{\G}) := P(S|\Pa{S}{\G}, T_0^*=1, U_0^*=2).
    \end{align*}
\end{itemize}
Suppose that $\gamma_{r_1} = 0$ and $\gamma_{r_2}=2$, then
\begin{itemize}
    \item In model $\M_1$:
    \begin{align*}
        & Q^{\M_1}[\A_i](\mathbf{v}) = \theta_{i, r_1}(\mathbf{v}, T_0^*=1), \quad i \in [0:m],\\
        & \sum_{\S'}Q^{\M_1}[\S](\mathbf{v}) = \phi_{r_1}(\mathbf{v}[\S^{\dagger}]),\\
        & Q^{\M_1}[\S](\mathbf{v}) = \eta_{r_1}(\mathbf{v}).
    \end{align*}
    
    \item In model $\M_2$:
    \begin{align*}
        & Q^{\M_2}[\A_i](\mathbf{v}) = \theta_{i, r_2}(\mathbf{v}, T_0^*=1), \quad i \in [0:m],\\
        & \sum_{\S'}Q^{\M_2}[\S](\mathbf{v}) = \phi_{r_2}(\mathbf{v}[\S^{\dagger}]),\\
        & Q^{\M_2}[\S](\mathbf{v}) = \eta_{r_2}(\mathbf{v}).
    \end{align*}
\end{itemize}
According to the Lemmas \ref{lemma: gid equal indices} and \ref{lemma: equal indices summation subcase 1} for any $\mathbf{v}\in \dom{\mathbf{V}}{}$
\begin{align*}
    Q^{\M_1}[\A_i](\mathbf{v}) &= Q^{\M_2}[\A_i](\mathbf{v}),
    \\
    \sum_{\S'}Q^{\M_1}[\S](\mathbf{v}) &= \sum_{\S'}Q^{\M_2}[\S](\mathbf{v}),
\end{align*}
however, using Lemma \ref{lemma: gid not equal indices} with $\mathbf{v}_0 = (0,\dots,0)$, we get
\begin{equation*}
    Q^{\M_1}[\S](\mathbf{v}_0) \neq Q^{\M_2}[\S](\mathbf{v}_0).
\end{equation*}
\end{proof}




\subsection{Proof of the properties in Section \ref{sec: second subcase} \& Section \ref{sec: third subcase}} \label{sec: properties}

Recall that in Sections \ref{sec: second subcase} and \ref{sec: third subcase}, we presented two sets of properties, which we prove here. 
We only present the formal proof of the set of properties in Section \ref{sec: second subcase}, since the other set of properties in Section \ref{sec: third subcase} can be shown similarly.


\begin{enumerate}
    \item If path $p$ contains a chain $W'\rightarrow W \rightarrow W''$ or a fork $W' \leftarrow W \rightarrow W''$, then node $W$ does not belong to any of the sets $\X'$, $\Z'$ or $\Y'$.
    
    \item If path $p$ contains a collider $W'\rightarrow W \leftarrow W''$, then there is a directed path $p_W$ from $W$ to a node in $\Z'$. 
    Moreover, none of the intermediate nodes in the path $p_W$ belong to the set $\X'\cup\Z'\cup\Y'$.
    
    \item Path $p$ does not contain any node from the set $\X'$.
\end{enumerate}
\begin{proof}
\hfill\\
1. The first property is obvious since path $p$ is not blocked by the set $\X'\cup (\Z' \setminus \{Z'\})\cup(\Y' \setminus \{Y'\})$. 

2. Suppose $W$ is a collider as defined and let us assume that $R$ is the closest descendant of the variable $W$ that unblocks path $p$. Note that $R \notin \X'$ since it unblocks $p$ in the graph $\G_{\overline{\X'},\underline{\{Z'\}}}$, i.e., a graph with no edges incoming to $\X'$. 

All variables except $R$ in the shortest directed path from $W$ to $R$ do not belong to the set $\X' \cup \Y' \cup \Z'$. 
Assume that $R \in \Y'$ and $p'$ is a path obtained by combining two paths: one from $Z'$ to $W$ in $p$ and the other one from $W$ to $R$ (defined above). 
It is easy to see that $p'$ is also unblocked, but it contains fewer colliders than $p$. 
This is impossible according to the definition of the path $p$. 
Thus, $R$ must be in the set $\Z'$. This concludes the proof of the second property.

3. We prove this by contradiction. 
Suppose that there is a variable $R\in \X'$ on the path $p$. Since $p$ is unblocked, $R$ is a collider or a descendant of a collider. This is impossible due to property 2.
% Recall that in Section \ref{sec: third subcase} we defined an unblocked path $\widetilde{p}$ from $Z'$ to some node $Y'\in\Y'$ given $\X', \Z'\setminus\{Z'\}$. Path $\widetilde{p}$ satisfies the following properties:
\end{proof}





\subsection{Proof of Lemma \ref{lemma: construct models subcase 2}} \label{sec: supportive materials subcase 2}



Recall that $\textbf{S}=\Anc{\Y'\cup \Z'}{\G[\V \setminus \X']}$ and it is assumed that $\textbf{S}$ is not gID from $(\mathbb{A}, \G)$. The set $\textbf{S}$ consists of the single c-components $\textbf{S}_1,\dots,\textbf{S}_n$, where $\textbf{S}_1$ is not gID.
Let $\S=\mathbf{S}_1$. 
Clearly, we can add $\{\mathbf{S}_i\}_{i=2}^{n}$ to the known distributions and $\S$ remains not gID, i.e., $\S$ is not gID from $(\mathbb{A}', \G)$, where $\mathbb{A}' := \mathbb{A}\cup\{\mathbf{S}_i\}_{i=2}^{n}$. 
For simplicity, we denote $\mathbb{A}' = \{\mathbf{A}'_i\}_{i=0}^{m'}$.
Hence, using the method in Section \ref{sec: baseline}, we can construct two models $\M_1$ and $\M_2$ that are the same over the known distributions and different over $Q[\textbf{S}_1]$. These models  disagree on the distribution $Q[\mathbf{S}]$ as well, because $Q[\mathbf{S}] = \prod_{i=1}^{n}Q[\mathbf{S}_i]$. Below, we use these two models to introduce two new models to prove Lemma \ref{lemma: construct models subcase 2}.  


\renewcommand{\R}{\mathbf{R}}
\subsubsection{New models for Lemma \ref{lemma: construct models subcase 2}} \label{sec: appendix new models subcase 2}

Recall that $\mathcal{P}$ is a collection of paths $\{p\}\cup\{ p_W|W \in \mathbf{F}\}$, where $\mathbf{F}$ is a set of all colliders on the path $p$. Moreover, $\D$ is a set of all observed nodes on the paths in $\mathcal{P}$ excluding the ones in $\Z'$. Figure \ref{fig:va2} demonstrates some variables used in this proof and their relations for clarity.

\begin{figure}
    \centering
    \includegraphics[scale=0.2]{paths.jpg}
    \caption{An illustration of the path $p$, collider $W$ and its corresponding path $p_W$.}
    \label{fig:va2}
\end{figure}

Herein, we define new models $\M_1'$ and $\M_2'$ based on the models $\M_1$ and $\M_2$. Let $\D_{\mathcal{P}}$ be the set of all variables (observed and unobserved) on the paths in $\mathcal{P}$. We say that a variable $D$ is a \textbf{starting node} of path $\hat{p}\in\mathcal{P}$ if
\begin{itemize}
    \item $D=Z'$ and $\hat{p}=p$ or
    \item $D \in \mathbf{F}$, i.e., it is a collider on path $p$ and $\hat{p}=p_D$.
\end{itemize}
Note that $D$ can be a starting node of only  one path. According to the definition of a starting node, if $D$ is a starting node for some path then either $D$ is a collider on the path $p$ or $D$ is $Z'$.  

For $R \in \mathbf{V}\cup \mathbf{U}$, let $\alpha_p(R)$ be the number of paths in $\mathcal{P}$ that contain $R$. Furthermore, we use $\dom{R}{}^{'}$ and $\dom{R}{}$ to denote its domain in $\M'_1$ or $\M'_2$ (variables in different models have the same domains) and in $\M_1$ or $\M_2$, respectively.
We define $\dom{R}{}'$ as follows:
\begin{itemize}
    \item If $R$ is a starting node for a path in $\mathcal{P}$:
    \begin{align*}
        & \dom{R}{}^{'} := \dom{R}{}^{}\times[0:\kappa]^{\alpha_{p}(R)-1}.
    \end{align*}
    % \item If $R \in (\mathbf{V}\cup \mathbf{U})\setminus\S$, then:
    % \begin{align*}
    %     & \dom{R}{}^{'} := \dom{R}{}^{}\times[0:\kappa]^{\alpha_{p}(R)}.
    % \end{align*}
    % \item If $R \in \S$ and $R$ belongs to one of the paths in $\mathcal{P}$, then:
    % \begin{align*}
    %     & \dom{R}{}^{'} := \dom{R}{}^{}\times[0:\kappa]^{\alpha_{p}(R)-1}.
    % \end{align*}
    \item If $R$ is not a starting node for any of the paths in $\mathcal{P}$, then:
    \begin{align*}
        & \dom{R}{}^{'} := \dom{R}{}^{}\times[0:\kappa]^{\alpha_{p}(R)}.
    \end{align*}
\end{itemize}
Consequently, if $R$ does not belong to any of the paths in $\mathcal{P}$, then $\dom{R}{}^{'} = \dom{R}{}^{}.$
 

Consider $R \in \mathbf{V}\cup\mathbf{U}$.
According to the domains definitions above, $R$ is a vector that is a concatenation of the vector coming from $\dom{R}{}^{}$ in model $\M_1$ (or $\M_2$) and some additional coordinates.
These additional coordinates are defined based on $\alpha_p(R)$. 
More precisely, if $R$ is not a starting node of a path $\hat{p}\in\mathcal{P}$, then there is a coordinate assigned to this path, denoted by $R[\hat{p}]$; otherwise, if $R$ is a starting node of $\hat{p}\in\mathcal{P}$, then there is no coordinate assigned to this path.


%to denote a respective entry in $R$ i.e. one of the entries of the vector $[0:\kappa]^{\alpha_{p}(R)}$ for $\dom{R}{}^{'} := \dom{R}{}^{}\times[0:\kappa]^{\alpha_{p}(R)}$ and one of the entries of the vector $[0:\kappa]^{\alpha_{p}(R)-1}$ for $\dom{R}{}^{'} := \dom{R}{}^{}\times[0:\kappa]^{\alpha_{p}(R)-1}$.

Let $\mathbf{O}\subseteq\mathbf{V}\cup \mathbf{U}$. 
For any realization $\mathbf{o}\in\dom{\mathbf{O}}{}^{'}$ of $\mathbf{O}$, we denote by $\mathbf{o}^\M\in\dom{\mathbf{O}}{}$, a realization of $\mathbf{O}$  that is consistent with $\mathbf{o}$. With a slight abuse of notation, we use $\textbf{O}$ and $\textbf{O}^\M$ to denote realizations of $\textbf{O}$ in models $\M'_i$ and $\M_i$, respectively. $\textbf{O}^\M$ means realizations in $\dom{\mathbf{O}}{}$ from model $\M_i$ that are consistent with realizations in $\dom{\mathbf{O}}{}^{'}$ from model $\M'_i$.

Recall that $\D_{\mathcal{P}}$ is a set of all variables on the paths in $\mathcal{P}$. Let $D\in \D_{\mathcal{P}}$. We denote by $\mathcal{P}_D$, the set of all paths $\hat{p}$, such that $\hat{p}\in \mathcal{P}$, $D$ belongs to path $\hat{p}$, and $D$ is not a starting node of path $\hat{p}$.
We are now ready to define the probabilities of $P^{\M'_i}(D|\Pa{D}{\G})$ for any $D \in \mathbf{V}\cup \mathbf{U}$ and $i \in \{1,2\}$.
\begin{itemize}
    \item If $D$ does not belong to the set $\D_{\mathcal{P}}$, we define
    \begin{align*}
        P^{\M'_i}(D|\Pa{D}{\G}) := P^{\M_i}(D^\M|\Pa{D}{\G}).
    \end{align*}
    \item If $D$ belongs to the set $\D_{\mathcal{P}}\setminus\{Z'\}$, we define
    \begin{equation*}
        P^{\M'_i}(D|\Pa{D}{\G}) := P^{\M_i}(D^{\M}|\Pa{D}{\G})\prod_{\hat{p}\in \mathcal{P}_D}f_{\hat{p}}(D[\hat{p}]|\Pa{D}{\hat{p}}),
    \end{equation*}
    where $\Pa{D}{\hat{p}}$ denotes the parents of $D$ on path $\hat{p}$ and $f_{\hat{p}}(D|\Pa{D}{\hat{p}})$ is given below.

    \paragraph{Definition of function} $f_{\hat{p}}(D[\hat{p}]|\Pa{D}{\hat{p}})$:
    \begin{itemize}
        \item When there exists a variable $W\in \mathbf{F}$, such that $\hat{p}=p_W$ and $D$ is a child of $W$ on path $p_W$ (i.e., $W\in\Pa{D}{p_W}$), then we define
        \begin{equation*}
        f_{p_W}(D[p_W]|\Pa{D}{p_W}) :=
        \begin{cases} 
            1-\kappa\epsilon &  \text{ if }  D[p_W]\equiv W[p] \pmod{\kappa+1},\\
            \epsilon &  \text{ if }  D[p_W]\not\equiv W[p] \pmod{\kappa+1}.
        \end{cases}
        \end{equation*}
        
        \item When $\Pa{D}{\hat{p}}=\emptyset$, 
        \begin{equation*}
            f_{\hat{p}}(D[\hat{p}]) := \frac{1}{\kappa+1}.
        \end{equation*}
        
        \item Otherwise,
        \begin{equation} \label{eq: f for not starting node}
        f_{\hat{p}}(D[\hat{p}]|\Pa{D}{\hat{p}}) :=
        \begin{cases} 
            1-\kappa\epsilon &  \text{ if }  D[\hat{p}]\equiv \sum_{D' \in \Pa{D}{\hat{p}}}D'[\hat{p}] \pmod{\kappa+1},\\
            \epsilon &  \text{ if }  D[\hat{p}]\not\equiv \sum_{D' \in \Pa{D}{\hat{p}}}D'[\hat{p}] \pmod{\kappa+1}.
        \end{cases}
        \end{equation}
        Note that $P^{\M'_i}(D|\Pa{D}{\G})$ is a probability distribution since for different paths $\hat{p}_1$ and $\hat{p}_2$, $D[\hat{p}_1]$ and $D[\hat{p}_2]$ are different and also 
        \begin{equation*}
            \sum_{D[\hat{p}]\in \dom{D[\hat{p}]}{}} f_{\hat{p}}(D[\hat{p}]|\Pa{D}{\hat{p}}) = 1.
        \end{equation*}
    \end{itemize}
    
    % \textbf{Distribution $P'(D|\Pa{D}{\G})$:}
    % \begin{itemize}
    %     \item When $D$ does not belong to the set $\S$,
    %     \begin{equation*}
    %         P'(D|\Pa{D}{\G}) := P^{\M_i}(D^\M|\Pa{D}{\G})
    %     \end{equation*}
    %     \item When $D\in \S$, analogous to the models $\M_1$ and $\M_2$, we define
    %     \begin{equation*}
    %     P'(D \mid \Pa{D}{\G})=:
    %     \begin{cases} 
    %         \frac{1}{\kappa+1} & \text{ if } \mathbb{I}(D)=1\\
    %         1-\kappa\epsilon &  \text{ if } \mathbb{I}(D)=0  \text{ and } D[D(\mathcal{P})] \equiv M'(D) \pmod{\kappa+1}, \\
    %         \epsilon &  \text{ if }  \mathbb{I}(D)=0  \text{ and } D[D(\mathcal{P})] \not\equiv M'(D) \pmod{\kappa+1},
    %     \end{cases}
    %     \end{equation*}
    %     where
    %     \begin{equation}
    %     M'(D):=
    %     \begin{cases} \label{eq: M'(D)}
    %         \sum_{\hat{D}\in\Pa{D}{D(\mathcal{P})}}\hat{D}[D(\mathcal{P})] + \sum_{\hat{d}'\in \Pa{D}{\G'[\widecheck{\mathbf{S}}]}}\hat{d}' & \text{, if } D \in \widecheck{\mathbf{S}}\setminus \{S_0\}, \\
    %         \sum_{\hat{D}\in\Pa{D}{D(\mathcal{P})}}\hat{D}[D(\mathcal{P})] + u_0[0]+\sum_{\hat{d}'\in \Pa{D}{\G'[\widecheck{\mathbf{S}}]}}\hat{d}' & \text{, if $D=S_0$ }.
    %     \end{cases}
    %     \end{equation}
        
    % \end{itemize}
    
    
    \item If $D=Z'$, let $W$ be a parent of $Z'$ on path $p$. Note that such a $W$ exists because $p$ is an unblocked backdoor path in graph $\G_{\overline{\X'},\underline{\{Z'\}}}$. Recall that $Z'$ is a variable from the set $\S$. In this case, we define
    \begin{equation}
        P^{\M'_i}(Z'|\Pa{Z'}{\G}) := P'(Z'^{\M}|\Pa{Z'}{\G})\prod_{\hat{p}\in \mathcal{P}_{Z'}}f_{\hat{p}}(Z'[\hat{p}]|\Pa{Z'}{\hat{p}}),
    \end{equation}
    where $P'(\cdot|\cdot)$ is given by
    \begin{equation*}
    P'(Z'^{\M}=z' \mid \Pa{Z'}{\G}):=
    \begin{cases} 
        \frac{1}{\kappa+1} & \text{ if } \mathbb{I}(Z')=1,\\
        1-\kappa\epsilon &  \text{ if } \mathbb{I}(Z')=0  \text{ and } z' \equiv M'(Z') \pmod{\kappa+1}, \\
        \epsilon &  \text{ if }  \mathbb{I}(Z')=0  \text{ and } z'\not\equiv M'(Z') \pmod{\kappa+1},
    \end{cases}
    \end{equation*}
    and $M'(\cdot)$ is defined similar to \eqref{eq: M(S)} and is given by
    \begin{equation}
    M'(Z'):=
    \begin{cases} \label{eq: M'(S)}
        W[p] + \sum_{x\in \Pa{Z'}{\G'[\widecheck{\mathbf{S}}]}}x^{\M} & \text{, if } Z'\in \widecheck{\mathbf{S}}\setminus \{S_0\}, \\
        W[p] + u_0^{\M}[0]+\sum_{x\in \Pa{Z'}{\G'[\widecheck{\mathbf{S}}]}}x^{\M} & \text{, if $Z'=S_0$ }.
    \end{cases}
    \end{equation}
\end{itemize}

Note that for any $W \in (\mathbf{V} \cup \mathbf{U})\setminus \{U_0\}$, we have
\[
P^{\M'_1}(W|\Pa{W}{\G}) = P^{\M'_2}(W|\Pa{W}{\G}).
\]
Therefore, we will use $P^{\M'}(W|\Pa{W}{\G})$ instead of $P^{\M'_1}(W|\Pa{W}{\G})$ or $P^{\M'_2}(W|\Pa{W}{\G})$ for  $W \in (\mathbf{V} \cup \mathbf{U})\setminus \{U_0\}$. 
%Analogously we define $P^{\M}(W|\Pa{W}{\G})$.

We also have
\begin{equation}
\label{eq: prob U_0 subcase 2}
\begin{gathered}
    P^{\M'_1}(U_0) = \frac{1}{d} \prod_{\hat{p}\in \mathcal{P}_{U_0}}f_{\hat{p}}(U_0[\hat{p}]), \\
    P^{\M'_2}(U_0) = P^{\M_2}(U_0^{\M}) \prod_{\hat{p}\in \mathcal{P}_{U_0}}f_{\hat{p}}(U_0[\hat{p}]).
\end{gathered}
\end{equation}

Recall that $\mathbf{S}=\Anc{\Y'\cup \Z'}{\G[\mathbf{V}\setminus\X']}$. Let $\D':=\mathbf{S}\setminus\D$ and $\D^{\dagger} := \mathbf{V} \setminus \mathbf{D}$.
For $i \in [0:m']$, $j\in [1:d]$, $\mathbf{v} \in \dom{\mathbf{V}}{}^{'}$ and $\mathbf{d}^{\dagger} \in \dom{\D^{\dagger}}{}'$, we define $\theta_{i, j}^{'}(\mathbf{v})$, $\phi_{j}^{'}(\mathbf{d}^{\dagger})$ and $\eta_{j}^{'}(\mathbf{v})$ as follows:
\begin{align}
    \label{eq: def theta subcase 2}
    & \theta_{i, j}^{'}(\mathbf{v}) := \sum_{U_0[\mathcal{P}]}\prod_{\hat{p}\in \mathcal{P}_{U_0}}f_{\hat{p}}(U_0[\hat{p}])\sum_{\mathbf{U} \setminus \{U_0\}} \prod_{X \in \A_i'} P^{\M'}(x \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}} P^{\M'}(u^{\M}),\\
    \label{eq: def phi subcase 2}
    & \phi_{j}^{'}(\mathbf{d}^{\dagger}) := \sum_{U_0[\mathcal{P}]}\prod_{\hat{p}\in \mathcal{P}_{U_0}}f_{\hat{p}}(U_0[\hat{p}])\sum_{\D}\sum_{\mathbf{U} \setminus \{U_0\}} \prod_{X \in \mathbf{S}} P^{\M'}(x \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}} P^{\M'}(u^{\M}),\\
    \label{eq: def eta subcase 2}
    & \eta_{j}^{'}(\mathbf{v}) := \sum_{U_0[\mathcal{P}]}\prod_{\hat{p}\in \mathcal{P}_{U_0}}f_{\hat{p}}(U_0[\hat{p}])\sum_{\mathbf{U} \setminus \{U_0\}} \prod_{X \in \mathbf{S}} P^{\M'}(x \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}} P^{\M'}(u^{\M}),
\end{align}
where $\sum_{U_0[\mathcal{P}]}$ is a summation over all realizations of the random variables $\{U_0[\hat{p}]|\ \hat{p}\in \mathcal{P}_{U_0}\}$. 

Next, we prove three lemmas similar to Lemmas \ref{lemma: gid equal indices}, \ref{lemma: gid not equal indices},  and \ref{lemma: equal indices summation subcase 1}  for the new models $\M'_1$ and $\M'_2$.

\begin{lemma}
    \label{lemma: theta equal indices subcase 2}
    For any $\mathbf{v} \in \dom{\mathbf{V}}{}^{'}$ and $i\in[0:m']$, we have
    \begin{equation*}
        \theta_{i,j_1}'(\mathbf{v}) = \theta_{i,j_2}'(\mathbf{v}) = \cdots= \theta_{i,j_{\frac{\kappa+1}{2}}}'(\mathbf{v}).
    \end{equation*}
\end{lemma}
\begin{proof}
    %According to the construction of models $\M_1'$ and $\M_2'$,
    By substituting $P^{\M'}$ from the above into Equation \eqref{eq: def theta subcase 2} and rearranging the terms, we obtain
    \begin{equation*}
    \begin{gathered}
        \theta_{i, j}^{'}(\mathbf{v}) = 
        \sum_{\mathbf{U}[\mathcal{P}]} 
        \prod_{\hat{U}[\hat{p}]\in \mathbf{U}[\mathcal{P}]} f_{\hat{p}}(\hat{U})
        \prod_{\hat{X}[\hat{p}] \in \mathbf{A}'_i[\mathcal{P}]} f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}})\\
        \times\Big( \sum_{\textbf{\underline{U}}^{\M}}
         P'(Z'|\Pa{Z'}{\G})
         \prod_{X \in \A'_i\setminus\{Z'\}} P^{\M}(x^{\M} \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}}\!P^{\M}(u^{\M})\Big),
    \end{gathered}
    \end{equation*}
    where $\mathbf{U}[\mathcal{P}]:=\bigcup_{U\in\textbf{U}}\{U[\hat{p}]|\ \hat{p}\in \mathcal{P}_{U}\}$, $\underline{\textbf{U}}:=\mathbf{U} \setminus \{U_0\}$, and by definition $\textbf{\underline{U}}^{\M}$ is all realizations of elements in set $\textbf{\underline{U}}$ in $\dom{\textbf{\underline{U}}}{}$ that are consistent with realizations in $\dom{\textbf{\underline{U}}}{}^{'}$.
    Suppose variable $W$ belongs to the path $p$ and $Z'$ is a child of $W$ in that path. By the construction of $P'(Z'|\Pa{Z'}{\G})$, we have
    \begin{equation}\label{eq:pp_to_pp}
        P'(Z'+W[p]|\Pa{Z'}{\G}) = P^{\M}(Z'|\Pa{Z'}{\G}).
    \end{equation}
    This is because $M'(Z'+W[p])=M(Z')$.
    Let $\mathbf{v}'\in \dom{\mathbf{V}}{}$ be a realization that is consistent with $\mathbf{v}^{\M}[\mathbf{V}\setminus\{Z'\}]$ and 
    \[
    \mathbf{v}'[Z'] = \mathbf{v}^{\M}[Z']-\mathbf{v}[W[p]].
    \]
    In this case, using \eqref{eq:pp_to_pp}, we have
        \begin{equation*}
    \begin{gathered}
        \theta_{i, j}^{'}(\mathbf{v}) = 
        \sum_{\mathbf{U}[\mathcal{P}]} 
        \prod_{\hat{U}[\hat{p}]\in \mathbf{U}[\mathcal{P}]} f_{\hat{p}}(\hat{U})
        \prod_{\hat{X}[\hat{p}] \in \mathbf{A}'_i[\mathcal{P}]} f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}})\\
        \times\Big( \sum_{\textbf{\underline{U}}^{\M}}
        P^{\M}({\mathbf{v}'}^{\M}[Z']|\Pa{Z'}{\G})
         \prod_{X \in \A'_i\setminus\{Z'\}} P^{\M}(x \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}}\!P^{\M}(u^{\M})\Big).
    \end{gathered}
    \end{equation*}
    Note that the term inside the big parentheses is equal to $\theta_{i, j}(\mathbf{v}')$ given in \eqref{eq: theta and eta}, i.e., 
    \begin{equation*}
         \theta_{i, j}^{'}(\mathbf{v}) = \sum_{\mathbf{U}[\mathcal{P}]}
        \prod_{\hat{U}[\hat{p}]\in \mathbf{U}[\mathcal{P}]} f_{\hat{p}}(\hat{U})
        \prod_{\hat{X}[\hat{p}] \in \mathbf{A}'_i[\mathcal{P}]} f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}})
        \theta_{i, j}(\mathbf{v}').
    \end{equation*}
%    Note that from definition of $\theta_{i, j}$ defined for models $\M_1$ and $\M_2$ we have
    % \begin{equation*}
    %     \theta_{i, j}(\mathbf{v}') = \sum_{[\mathbf{U} \setminus \{U_0\}]^{\M}}
    %     P'({\mathbf{v}'}^{\M}[Z']|\Pa{Z'}{\G})
    %      \prod_{X \in \A'_i\setminus\{Z'\}} P^{\M}(x \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}}\!P^{\M}(u^{\M}),
    % \end{equation*}
    %where the right side of equation written for the realization $\mathbf{v}$.The latter implies

    
    In the last equation, all terms on the right hand side except $\theta_{i, j}(\mathbf{v}')$ are independent of the realization of $\{U_0\}^{\M}$, i.e., independent of index $j$.
    For $j\in\{j_1,\dots,j_{\frac{\kappa+1}{2}}\}$, using the result of Lemma \ref{lemma: gid equal indices}, which states that $\theta_{i, j_1}(\mathbf{v}')=\dots=\theta_{i, j_{\frac{\kappa+1}{2}}}(\mathbf{v}')$, we can conclude the result. 
    %The same holds for $\theta_{i,j_1}'(\mathbf{v}')$, $\theta_{i,j_2}'(\mathbf{v}')$, \dots, $\theta_{i,j_{\frac{\kappa+1}{2}}}'(\mathbf{v}')$. By combining this result and Lemma \ref{lemma: gid equal indices}, we conclude the result.
\end{proof}

\begin{lemma} \label{lemma: phi equal indices subcase 2}
     For any $\mathbf{d}^{\dagger} \in \dom{\mathbf{D}^{\dagger}}{}'$, we have
    \begin{equation*}
        \phi'_{j_1}(\mathbf{d}^{\dagger}) = \phi'_{j_2}(\mathbf{d}^{\dagger})=\dots = \phi'_{j_{\frac{\kappa+1}{2}}}(\mathbf{d}^{\dagger}).
    \end{equation*}
\end{lemma}
\begin{proof}
Similar to the previous lemma, by substituting $P^{\M'}$ from its definition into Equation \eqref{eq: def phi subcase 2} and rearranging the terms, we obtain
    \begin{equation}\label{eq: phi simplification subcase 2}
    \begin{gathered}
        \phi_{j}^{'}(\mathbf{d}^{\dagger}) = \sum_{\mathbf{U}[\mathcal{P}]}
        \sum_{\textbf{\underline{U}}^{\M}}
        \sum_{\D}
        \prod_{\hat{p}\in \mathcal{P}_{U_0}}f_{\hat{p}}(U_0[\hat{p}])
        \prod_{\hat{X}[\hat{p}] \in \mathbf{S}[\mathcal{P}]} f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}}) \\
        \times\Big(
         P'(Z'|\Pa{Z'}{\G})
         \prod_{X \in \mathbf{S}\setminus\{Z'\}} P^{\M}(x^{\M} \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}}\!P^{\M}(u^{\M})\Big),
    \end{gathered}
    \end{equation}
    where $\mathbf{U}[\mathcal{P}]:=\bigcup_{U\in\textbf{U}}\{U[\hat{p}]|\ \hat{p}\in \mathcal{P}_{U}\}$, $\underline{\textbf{U}}:=\mathbf{U} \setminus \{U_0\}$. Suppose that $l_1$ and $l_2$ are two integers such that
    \begin{equation*}
    \begin{split}
        & \gamma_{l_1} := (2x, 0, \dots, 0),\\
        & \gamma_{l_2} := (2x+2 \pmod{\kappa+1}, 0, \dots, 0),
    \end{split}
    \end{equation*}
    and $x$ is an integer in $[0 : \frac{\kappa-1}{2}]$.
    We will prove that $\phi'_{l_1}(\mathbf{d}^{\dagger})=\phi'_{l_2}(\mathbf{d}^{\dagger})$.

    Suppose that path $p$ is the sequence of variables: $Z'$, $D'_1$, $D'_2$, \dots, $D'_{k'_1}$, $D'_{k'_1+1}:=Y'$. 
    Note that there is a direct edge between any consecutive nodes in this path and furthermore, the direct edge between $Z'$ and $D'_1$ is pointing toward $Z'$, i.e., $Z'\leftarrow D_1'$. 
    
    On the other hand, since $Z'$ and $U_0$ are both in $\S$ ($\S=\mathbf{S}_1$ by construction), there exists a shortest path  $U_0, \hat{S}_1', \hat{U}_1', \hat{S}_2', \hat{U}_2', \dots, \hat{U}_{l'}', Z'$, such that $U_0$ is a parent of $\hat{S}_1'\in \S$, $Z'$ is a child of $\hat{U}_{l'}'\in \U^{\S}$, and $\hat{U}_j'\in \U^{\S}$ is a parent of variables $\hat{S}_j'\in \S$ and  $\hat{S}_{j+1}'\in \S$ for $j \in [1:l'-1]$. 
    Let $\hat{\mathbf{U}}':=\{\hat{U}_1', \dots, \hat{U}_{l'}'\}$, i.e., the unobserved nodes in this shortest path except $U_0$. 
    For a given realization $\mathbf{o}_{1}$ of $\mathbf{U}\cup\mathbf{D}$,  we define $\mathbf{o}_{2} \in \dom{\mathbf{U}\cup\mathbf{D}}{}'$ as follows
    %\paragraph{Definition of $\textbf{o}_2$:}
    \begin{equation}
        \begin{split}
            & \mathbf{o}_{2}^{\M}[\hat{U}'_j] := \mathbf{o}_{1}^{\M}[\hat{U}'_j] + 2(-1)^{j} \pmod{\kappa+1}, \quad j\in[1:l'].
            % & \mathbf{u}_{2}^{\M}[U] := \mathbf{u}_{1}^{\M}[U], \quad \forall U\in \U^{\S} \setminus \hat{\mathbf{U}},
        \end{split}
    \end{equation}
    For $D_1'$, we have
    \begin{equation}\label{eq:56}
        \begin{split}
            & \mathbf{o}_2[D_1'[p]] = \mathbf{o}_1[D_1'[p]]-2(-1)^{l'} \pmod{\kappa+1}.
        \end{split}
    \end{equation}
    Note that with these modifications, for any $\widetilde{S} \in \S\setminus\{Z'\}$, we have
    \begin{equation*}
        \widetilde{s}_2 - M(\widetilde{S}) \equiv \widetilde{s}_1 - M(\widetilde{S}) \pmod{\kappa+1},
    \end{equation*}
     where $\widetilde{s}_1$ is a realization of $\widetilde{S}\Big|_{(\mathbf{U}\cup \D, \D^{\dagger}, U_0^\M)=(\mathbf{o}_1, \dd^{\dagger}, \gamma_{l_1})}$, $\widetilde{s}_2$ is a realization of $\widetilde{S}\Big|_{(\mathbf{U}\cup\D, \D^{\dagger}, U_0^\M)=(\mathbf{o}_2, \dd^{\dagger}, \gamma_{l_2})}$, and $M(\cdot)$ is given by Equation \eqref{eq: M(S)}. Additionally, 
    \begin{equation*}
        \mathbf{o}_2^{\M}[Z'] - M'(Z') \equiv \mathbf{o}_1^{\M}[Z'] - M'(Z') \pmod{\kappa+1},
    \end{equation*}
    where $M'(\cdot)$ is defined in Equation (\ref{eq: M'(S)}).
    This implies that for any $\widetilde{S}\in \mathbf{S}$, we have
    \begin{equation*}
    P^{\M}(\widetilde{s}|\Pa{\widetilde{S}}{\G})\Big|_{(\mathbf{U}\cup\mathbf{D}, \D^{\dagger}, U_0^{\M})=(\textbf{o}_1, \dd^{\dagger}, \gamma_{l_1})}=P^{\M}(\widetilde{s}|\Pa{\widetilde{S}}{\G})\Big|_{(\mathbf{U}\cup\mathbf{D}, \D^{\dagger}, U_0^{\M})=(\textbf{o}_2, \dd^{\dagger}, \gamma_{l_2})}.
    \end{equation*}
    Let $c := -2(-1)^{l'}$, then Equation \eqref{eq:56} becomes
    \begin{equation}\label{eq:after_56_1}
        \mathbf{o}_2^{\M}[D_1'[p]] = \mathbf{o}_1^{\M}[D_1'[p]]+c \pmod{\kappa+1}.
    \end{equation}
    Suppose that $D_j'$ is not a collider on the path $p$ and  $j\in [2:k_1'+1]$. We define $\mu(D_j')$ to be the number of colliders on a part of the path $p$ from $D_1'$ to $D_{j-1}'$.
    Thus, for those $j\in[2:k_1'+1]$ for which $D_j'$ is not a collider, we define
    \begin{equation}\label{eq:after_56_2}
        \mathbf{o}_2^{\M}[D_j'[p]] := \mathbf{o}_1^{\M}[D_j'[p]] + c(-1)^{\mu(D_j')}.
    \end{equation}
    % and
    % \begin{equation*}
    %     \mathbf{o}_2^{\M}[Y'[p]] := \mathbf{o}_1^{\M}[Y'[p]] + c(-1)^{\mu(Y')}.
    % \end{equation*}
    Note that the modifications in \eqref{eq:after_56_2} might only affect the function $f_{p}(\cdot|\cdot)$.  
    Next, we show that after these modifications, function $f_{p}(\cdot|\cdot)$ remains unchanged. 
    To do so, for $j \in [1:k'_1+1]$, we consider four different cases:
    \begin{enumerate}
        \item If $D_j'$ has no parents, then it is obvious that
         \begin{equation*}
            f_{p}(D_j'[p])\Big|_{(\mathbf{U}\cup\mathbf{D}, U_0^{\M})=(\textbf{o}_1, \gamma_{l_1})} = f_{p}(D_j'[p])\Big|_{(\mathbf{U}\cup\mathbf{D}, U_0^{\M})=(\textbf{o}_2, \gamma_{l_2})}.
        \end{equation*}
        \item If $D_j'$ is a collider, then $\mu(D_{j+1}') = \mu(D_{j-1}')+1$ and
        \begin{align*}
            & \mathbf{o}_1[D_{j+1}'[p]] + \mathbf{o}_1[D_{j-1}'[p]] = \mathbf{o}_2[D_{j+1}'[p]] + \mathbf{o}_2[D_{j-1}'[p]],
        \end{align*}
        and hence, according to  Equation \eqref{eq: f for not starting node}, we have
        \begin{equation*}
          f_{p}(D_j'[p]|\Pa{D_j'}{p})\Big|_{(\mathbf{U}\cup\mathbf{D}, U_0^{\M})=(\textbf{o}_1, \gamma_{l_1})} = f_{p}(D_j'[p]|\Pa{D_j'}{p})\Big|_{(\mathbf{U}\cup\mathbf{D}, U_0^{\M})=(\textbf{o}_2, \gamma_{l_2})}.
        \end{equation*}
        
        \item If $D'_j$ is a child of $D'_{j+1}$, then $\mu(D'_{j}) = \mu(D'_{j+1})$ and
        \begin{align*}
            & \mathbf{o}_1[D_{j}'[p]] - \mathbf{o}_1[D_{j+1}'[p]] = \mathbf{o}_2[D_{j}'[p]] - \mathbf{o}_2[D_{j+1}'[p]].
        \end{align*}
        According to Equation \eqref{eq: f for not starting node}, we conclude that
        \begin{equation*}
           f_{p}(D_j'[p]|\Pa{D_j'}{p})\Big|_{(\mathbf{U}\cup\mathbf{D}, U_0^{\M})=(\textbf{o}_1, \gamma_{l_1})} = f_{p}(D_j'[p]|\Pa{D_j'}{p})\Big|_{(\mathbf{U}\cup\mathbf{D}, U_0^{\M})=(\textbf{o}_2, \gamma_{l_2})}.
        \end{equation*}
        
        \item If $D'_j$ is a child of $D'_{j-1}$, then $\mu(D_{j}') = \mu(D_{j-1}')$ and
        \begin{align*}
            & \mathbf{o}_1[D_{j}'[p]] - \mathbf{o}_1[D_{j-1}'[p]] = \mathbf{o}_2[D_{j}'[p]] - \mathbf{o}_2[D_{j-1}'[p]].
        \end{align*}
        Similarly, according to Equation \eqref{eq: f for not starting node}, we get
        \begin{equation*}
           f_{p}(D_j'[p]|\Pa{D_j'}{p})\Big|_{(\mathbf{U}\cup\mathbf{D}, U_0^{\M})=(\textbf{o}_1, \gamma_{l_1})} = f_{p}(D_j'[p]|\Pa{D_j'}{p})\Big|_{(\mathbf{U}\cup\mathbf{D}, U_0^{\M})=(\textbf{o}_2, \gamma_{l_2})}.
        \end{equation*}
    \end{enumerate}

    This shows that for any $j\in[1:k_1'+1]$,
    \begin{equation*}
        f_{p}(D_j'[p]|\Pa{D'_j}{p})\Big|_{(\mathbf{U}\cup\mathbf{D}, U_0^{\M})=(\textbf{o}_1, \gamma_{l_1})} = f_{p}(D_j'[p]|\Pa{D_j'}{p})\Big|_{(\mathbf{U}\cup\mathbf{D}, U_0^{\M})=(\textbf{o}_2, \gamma_{l_2})}.
    \end{equation*}
    % and 
    % \begin{equation*}
    %     f_{p}(Y'[p]|\Pa{Y'}{p})\Big|_{(\mathbf{U}\cup\mathbf{D}, U_0^{\M})=(\textbf{o}_1, \gamma_{l_1})} = f_{p}(Y'[p]|\Pa{Y'}{p})\Big|_{(\mathbf{U}\cup\mathbf{D}, U_0^{\M})=(\textbf{o}_2, \gamma_{l_2})}.
    % \end{equation*}

    Note that the aforementioned transformation of $\mathbf{o}_1$ affects only those realizations of variables that are used for the marginalization in Equation \eqref{eq: phi simplification subcase 2}. Putting the above results together implies that the terms in \eqref{eq: phi simplification subcase 2} remain unchanged, i.e., 
    \begin{align*}
        &\prod_{\hat{p}\in \mathcal{P}_{U_0}}f_{\hat{p}}(U_0[\hat{p}])
        \prod_{\hat{X}[\hat{p}] \in \mathbf{S}[\mathcal{P}]} f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}}) \\
        &\times\Big(
         P'(Z'|\Pa{Z'}{\G})
         \prod_{X \in \mathbf{S}\setminus\{Z'\}} P^{\M}(x^{\M} \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}}\!P^{\M}(u^{\M})\Big)\Big|_{(\mathbf{U}\cup\mathbf{D}, \D^{\dagger}, U_0^{\M})=(\textbf{o}_1, \dd^{\dagger}, \gamma_{l_1})}  \\
        & = \prod_{\hat{p}\in \mathcal{P}_{U_0}}f_{\hat{p}}(U_0[\hat{p}])
        \prod_{\hat{X}[\hat{p}] \in \mathbf{S}[\mathcal{P}]} f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}}) \\
        &\times\Big(
         P'(Z'|\Pa{Z'}{\G})
         \prod_{X \in \mathbf{S}\setminus\{Z'\}} P^{\M}(x^{\M} \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}}\!P^{\M}(u^{\M})\Big)\Big|_{(\mathbf{U}\cup\mathbf{D}, \D^{\dagger}, U_0^{\M})=(\textbf{o}_2, \dd^{\dagger}, \gamma_{l_2})}
    \end{align*}
    
    This implies that $\phi_{l_1}(\mathbf{d}^{\dagger})=\phi_{l_2}(\mathbf{d}^{\dagger})$. By varying $x$ within $[0 : \frac{\kappa-1}{2}]$ in the definition of $\gamma_{l_1}$ and $\gamma_{l_2}$, we  obtain the result.
\end{proof}

\begin{lemma}
    \label{lemma: eta not equal indices subcase 2}
    There exists $0<\epsilon<\frac{1}{\kappa}$, such that there exists $\mathbf{v}_0 \in \dom{\mathbf{V}}{}'$ and $1\leq r <t\leq \frac{\kappa+1}{2}$ such that
    \begin{equation*}
        \eta'_{j_r}(\mathbf{v}_0) \neq \eta'_{j_t}(\mathbf{v}_0).
    \end{equation*}
\end{lemma}
\begin{proof}
By substituting $P^{\M'}$ from their definitions into Equation \eqref{eq: def eta subcase 2} and rearranging the terms, we obtain
    \begin{equation}\label{eq: eta simplification subcase 2}
    \begin{gathered}
        \eta_{j}^{'}(\mathbf{v}_0) = 
        \sum_{\mathbf{U}^{\M} \setminus \{U_0\}^{\M}}
        \sum_{\mathbf{U}[\mathcal{P}]}
        \prod_{\hat{U}[\hat{p}]\in \mathbf{U}[\mathcal{P}]} f_{\hat{p}}(\hat{U})
        \prod_{\hat{X}[\hat{p}] \in \mathbf{S}[\mathcal{P}]} f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}}) \\
        \times\Big(
         P'(Z'|\Pa{Z'}{\G})
         \prod_{X \in \mathbf{S}\setminus\{Z'\}} P^{\M}(x^{\M} \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}}\!P^{\M}(u^{\M})\Big),
    \end{gathered}
    \end{equation}
    Next, we define $\mathbf{v}_0\in \dom{\mathbf{V}}{}'$ such that the conditions in the lemma hold.
    \begin{itemize}
        \item For any path $\hat{p}\in \mathcal{P}$ and any node $W$ on the path $\hat{p}$ that is not a starting node for path $\hat{p}$, we define
        \begin{equation*}
            \mathbf{v}_0[W[\hat{p}]]:=0.
        \end{equation*}
        \item For any variable $S \in \S$, we define
        \begin{equation*}
            \mathbf{v}_0^{\M}[S] := 0.
        \end{equation*}
        \item For the remaining part of $\textbf{v}_0$, we choose a realization such that for the selected $\textbf{v}_0$, there exists a realization for the unobserved variables $\mathbf{U}$ that ensures $\mathbb{I}(S) = 0$ for all $S \in \S$. This is clearly possible due to the definition of $\mathbb{I}(S)$.
        
        % \begin{equation*}
        %     \mathbb{I}(S) = 0.
        % \end{equation*}
    \end{itemize}
    
    Assume $r$ and $t$ are such that $\gamma_{j_r} := (0, 0, \dots, 0)$ and $\gamma_{j_t} := (2, 0, \dots, 0)$.  
    To finish the proof of the lemma, it is enough to show that $\eta'_{j_r}(\mathbf{v}_0)$ and $\eta'_{j_t}(\mathbf{v}_0)$ are two different polynomial functions of parameter $\epsilon$.
    We prove that these two polynomials are different by showing that $\eta'_{j_r}(\mathbf{v}_0)\neq\eta'_{j_t}(\mathbf{v}_0)$ for $\epsilon=0$.
    
    We only need to consider the non-zero terms in Equation \eqref{eq: eta simplification subcase 2}. From \eqref{eq: eta simplification subcase 2}, we have
    %written for $\eta'_r(\mathbf{v}_0)$ and $\eta'_t(\mathbf{v}_0)$, that is
    \begin{equation}
    \label{eq: main term lemma subcase 2}
    \begin{gathered}
         \prod_{\hat{U}[\hat{p}]\in \mathbf{U}[\mathcal{P}]} f_{\hat{p}}(\hat{U})
        \prod_{\hat{X}[\hat{p}] \in \mathbf{S}[\mathcal{P}]} f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}}) \\
        \times\Big(
         P'(Z'|\Pa{Z'}{\G})
         \prod_{X \in \mathbf{S}\setminus\{Z'\}} P^{\M}(x^{\M} \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}}\!P^{\M}(u^{\M})\Big).
    \end{gathered}
    \end{equation}
    Note that $f_{\hat{p}}(\hat{U})=\frac{1}{\kappa+1}$ and $f_{\hat{p}}(\hat{X}|\Pa{\hat{X}}{\hat{p}'})$ is non-zero only 
    \begin{itemize}
       % \item $\hat{X}$ is a collider and $\hat{p}'=p$, 
        
        \item when there exists a variable $W\in \mathbf{F}$ such that $\hat{p}'=p_W$, $\hat{X}$ is a child of $W$ in path $p_W$, and
        $$
        \hat{X}[\hat{p}'] \equiv W[p] \pmod{\kappa+1}.
        $$
    
        \item when the following holds
        $$
        \hat{X}[\hat{p}'] \equiv \sum_{\hat{X}'\in \Pa{\hat{X}}{\hat{p}'}\setminus\{W\}}\hat{X}'[\hat{p}'] \pmod{\kappa+1}.
        $$
    \end{itemize}
    Similarly, $P^\M(X|\Pa{X}{\G})$ is non-zero
    \begin{itemize}
        \item if $\mathbb{I}(X)=1$ (i.e. $P^\M(X|\Pa{X}{\G})=\frac{1}{\kappa+1}$), or
        
        \item if $X \equiv M(X) \pmod{\kappa+1}$ for $P^\M(X|\Pa{X}{\G})$,

    \end{itemize}
    $P'(Z'|\Pa{Z'}{\G})$ is non-zero 
    \begin{itemize}
         \item if $\mathbb{I}(Z')=1$ (i.e. $P'(Z'|\Pa{Z'}{\G})=\frac{1}{\kappa+1}$), or
        
        \item $Z' \equiv M'(Z') \pmod{\kappa+1}$ for $P'(Z'|\Pa{Z'}{\G})$.
    \end{itemize}
    Let us fix a realization $\mathbf{u} \in \dom{\mathbf{U}\setminus\{U_0^{\M}\}}{}'$. 
    We consider two scenarios:
    
    \textbf{I)}
    Assume that for this realization, there is a variable $S\in \S$, such that $\mathbb{I}(S)=1$ and $S$ is the closest variable to $U_0$ considering only paths with bidirected edges in $\G'[\S]$. 
    The value of $S^{\M}$ does not depend on its parents because of $\mathbb{I}(S)=1$ and Equation \eqref{eq: def P(S|Pa(S)) gid}.
    Additionally, in the graph $\G'[\S]$, there exists a path $U_0, \hat{S}_1', \hat{U}_1', \hat{S}_2', \hat{U}_2', \dots, \hat{U}_{l'}', S$, such that $U_0$ is a parent of $\hat{S}_1'\in \S$, $S$ is a child of $\hat{U}_{l'}'\in \U^{\S}$, and $\hat{U}_j'\in \U^{\S}$ is a parent of variables $\hat{S}_j'\in \S$ and  $\hat{S}_{j+1}'\in \S$ for $j \in [1:l'-1]$. 
    Let $\hat{\mathbf{U}}':=\{\hat{U}_1', \dots, \hat{U}_{l'}'\}$. 
    We define $\mathbf{u}' \in \dom{\mathbf{U}\setminus\{U_0^{\M}\}}{}'$ 
    that is consistent with $\mathbf{u}$ except the variables in $\hat{\mathbf{U}}'$. For these variables, we define
    \begin{equation}
        \begin{split}
            & \mathbf{u}'^{\M}[\hat{U}_j'] := \mathbf{u}^{\M}[\hat{U}_j'] + 2(-1)^{j} \pmod{\kappa+1}, \quad j\in[1:l'].
            % & \mathbf{u}_{2}^{\M}[U] := \mathbf{u}_{1}^{\M}[U], \quad \forall U\in \U^{\S} \setminus \hat{\mathbf{U}},
        \end{split}
    \end{equation}
    
    With this modification for any $\widetilde{S}\in \mathbf{S}$, we have
    \begin{equation*}
    P^{\M}(\widetilde{s}|\Pa{\widetilde{S}}{\G})\Big|_{(\mathbf{U})=(\mathbf{u}, \gamma_{j_r})}=P^{\M}(\widetilde{s}|\Pa{\widetilde{S}}{\G})\Big|_{(\mathbf{U})=(\textbf{u}', \gamma_{j_t})}.
    \end{equation*}
    Therefore for all such realizations of $\mathbf{u}$, the summation of the following terms for both $\eta'_{j_r}(\mathbf{v}_0)$ and $\eta'_{j_t}(\mathbf{v}_0)$ will be the same,
    \begin{equation}
    \label{eq: main term eta subcase 2}
    \begin{gathered}
         \prod_{\hat{U}[\hat{p}]\in \mathbf{U}[\mathcal{P}]} f_{\hat{p}}(\hat{U})
        \prod_{\hat{X}[\hat{p}] \in \mathbf{S}[\mathcal{P}]} f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}}) \\
        \times\Big(
         P'(Z'|\Pa{Z'}{\G})
         \prod_{X \in \mathbf{S}\setminus\{Z'\}} P^{\M}(x^{\M} \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}}\!P^{\M}(u^{\M})\Big).
    \end{gathered}
    \end{equation}
    %accumulate in the the same impact for both .

    \textbf{II)} Assume that for all $S\in \S$, we have $\mathbb{I}(S)=0$.
    We consider a realization $U_0^{\M}=\gamma_{j_r}$ and $\mathbf{u}$ such that:
    \begin{itemize}
        %\item for all $S\in \S$ we have $\mathbb{I}(S)=0$.
        \item $\mathbf{u}[\U^{\S}] = \mathbf{0}$, and
        \item for all $U\in \mathbf{U}$ and any path $\hat{p}\in \mathcal{P}$ which contains $U$, $\mathbf{u}[U[\hat{p}]] = 0.$
    \end{itemize}
    We claim that for such $\mathbf{u}$, 
    \begin{equation*}
    \begin{gathered}
        \prod_{\hat{U}[\hat{p}]\in \mathbf{U}[\mathcal{P}]} f_{\hat{p}}(\hat{U})
        \prod_{\hat{X}[\hat{p}] \in \mathbf{S}[\mathcal{P}]} f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}}) \\
        \times\Big(
         P'(Z'|\Pa{Z'}{\G})
         \prod_{X \in \mathbf{S}\setminus\{Z'\}} P^{\M}(x^{\M} \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}}\!P^{\M}(u^{\M})\Big)
    \end{gathered}
    \end{equation*}
    is non-zero. To prove this claim, we consider four cases:
    \begin{itemize}
        \item  assume that $\hat{p}\in \mathcal{P}$ and there exists a variable $W$ such that $\hat{p}=p_W$. Let $\hat{X}$ be a child of $W$ in path $p_W$. From the definitions of $\mathbf{u}$ and $\mathbf{v}_0$, we get 
        $$
        \hat{X}[\hat{p}] \equiv W[\hat{p}] \pmod{\kappa+1},
        $$ 
        and therefore $f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}})=1$.
        The above holds because $\hat{X}[\hat{p}]=0=W[\hat{p}] \pmod{\kappa+1}$.
        
        \item assume that $\hat{p}\in \mathcal{P}$ and $\hat{X}$ is a variable on this path such that it is neither a starting node on $\hat{p}$ nor a child of a starting node on path $\hat{p}$. 
        Then, from the definitions of $\mathbf{v}_0$ and $\mathbf{u}$ we get  
        $$
        \hat{X}[\hat{p}] \equiv \sum_{\hat{X}'\in \Pa{\hat{X}}{\hat{p}}}\hat{X}'[\hat{p}] \pmod{\kappa+1},
        $$
        and therefore $f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}})=1$. 
        The above holds because all the variables in the above equation are zero.
        
        \item assume $X\in \S\setminus\{Z'\}$. From the definitions of $\mathbf{v}_0$ and $\mathbf{u}$, we get 
        $$
        X^{\M} \equiv M(X) \pmod{\kappa+1},
        $$
        and therefore $P^{\M}(x^{\M}|\Pa{X}{\G})=1$.
        Again, the above holds because all the terms are zero.
        \item assume $X=Z'$, then
        $$
        Z' \equiv M'(Z') \pmod{\kappa+1},
        $$
        and consequently $P'(Z'|\Pa{Z'}{\G})=1$.
    \end{itemize}

    Now, we consider the case when $U_0^\M = \gamma_{j_t}$. 
    Assume that $W\in \mathbf{F}$ and $W'$ is the last descendant of $W$ on the path $p_W$.
    From the properties which we proved in Section~\ref{sec: properties}, we have  $W'\in\mathbf{Z'}$ and by the definition of $\mathbf{v}_0$, we have $W'[p_W]=0$. 
    Assume $W''$ is a parent of $W'$ on the path $p_W$. 
    Note that  $f_{p_W}(W'[p_W]|\Pa{W'}{p_W})\neq0$  if and only if $W''[p_W]=0$. 
    Repeating the above reasoning for variables from  $W'$ to $W$, we conclude that $W[p]$ must be equal to 0, otherwise, there would be a term in Equation \eqref{eq: main term eta subcase 2} that is zero and this contradicts with the fact that Equation \eqref{eq: main term eta subcase 2} is non-zero.
    
    Assume that $Z', W'_1, W'_2, \dots, W'_{k'}, W'_{k'+1}:=Y'$ are the nodes on the path $p$. Next, we prove by backward induction that $W'_{i}[p]=0$ for all $i\in [1:k'+1]$. 
    By definition of $\mathbf{v}_0$, we know that $Y'[p]=0$. 
    If $W'_{i}[p]=0$ for all $i \in [k''+1:k'+1]$, we will prove that $W'_{k''}[p]=0$ as well.
    To do so, we consider the following three cases:
    \begin{itemize}
        \item $W'_{k''}$ is a collider on the path $p$. Then the fact that $W'_{k''}[p]=0$ follows immediately from the aforementioned reasoning and the fact that Equation \eqref{eq: main term eta subcase 2} is non-zero. 
        %the observations made before.
        
        \item $W'_{k''}$ is a child of $W'_{k''+1}$ and it is not a collider. Then, $f_p(W'_{k''}|\Pa{W'_{k''}}{p})\neq0$ if and only if $W'_{k''}[p] = W'_{k''+1}[p] = 0$.
        
        \item $W'_{k''}$ is a parent of $W'_{k''+1}$. Then, $f_p(W'_{k''+1}|\Pa{W'_{k''+1}}{p})\neq0$  if and only if $0 = W'_{k''+1}[p] = W'_{k''}[p]$.
    \end{itemize}

    This implies that  $W'_1[p]=0$. Therefore, $P'(Z'|\Pa{Z'}{\G}) = P^{\M}(Z'|\Pa{Z'}{\G})$ because $M'(Z')=M(Z')$. 
    Furthermore, the above arguments show that all $f_{\hat{p}}(\cdot|\cdot)$ terms in Equation \eqref{eq: main term eta subcase 2} are equal to one. This simplifies the Equation \eqref{eq: main term eta subcase 2} to 
    \begin{equation*}
        \prod_{X \in \mathbf{S}} P^{\M}(x^{\M} \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}}\!P^{\M}(u^{\M}).
    \end{equation*}
    However by the proof of Lemma 6 \cite{kivva2022revisiting}, we know that there is no realization of $\mathbf{U}^{\M}$ consistent with $U_0=\gamma_{j_t}$ such that:
    \begin{itemize}
        \item $\mathbb{I}(S) = 0$ for all $S \in \S$, and
%        \item $U_0^{\M}=\gamma_{j_t}$, and
        \item $x^{\M} \equiv M(X) \pmod{\kappa + 1}$ for all $X\in \S$. The latter is a necessary condition for $P^{\M}(x|\Pa{X}{\G})$ being non-zero. 
    \end{itemize}
    To summarize, we showed that for $U_0^{\M}=\gamma_{j_r}$, Equation \eqref{eq: main term eta subcase 2} is non-zero while it is zero for $U_0^{\M}=\gamma_{j_t}$. This implies that $\eta'_{j_r}(\mathbf{v}_0)\neq\eta_{j_t}'(\mathbf{v}_0)$ for $\epsilon=0$. 
    %as a corollary $\eta_{\gamma_{j_r}'(\mathbf{v}_0)}$ and $\eta_{\gamma_{j_t}'(\mathbf{v}_0)}$ are not equal as polynomial. The latter one guarantees the existence of $\epsilon \in (0, \frac{1}{\kappa})$.
\end{proof}

\subsubsection{Proof of Lemma \ref{lemma: construct models subcase 2}}
\begin{customlem}{\ref{lemma: construct models subcase 2}}
    Let $\mathbf{S}: = \Anc{\Y', \Z'}{\G[\mathbf{V} \setminus \X']}$ and $\D$ is a set of all nodes on the paths in $\mathcal{P}$ excluding $\Z'$. Then,
    \begin{equation}
        P_{\x'}(\dd|\mathbf{s}\setminus \dd)=\frac{
        Q[\mathbf{S}]
        }{
        \sum_{\D} Q[\mathbf{S}]
        } = Q[\D|\mathbf{S}\setminus\D]
    \end{equation}
    is not c-gID from $(\mathbb{A}, \G)$.
\end{customlem}
\begin{proof}
    We will show  that $Q[\mathbf{D}|\mathbf{S}\setminus\mathbf{D}]$ is not c-gID from $(\mathbb{A}', \G)$, where $\mathbb{A}' := \mathbb{A}\cup\{\mathbf{S}_i\}_{i=2}^{n}$. 
    To this end, we will construct two models $\M_1$ and $\M_2$ such that for each $i \in [0:m']$ and any $\mathbf{v}\in \mathbf{V}$:
    \begin{align}
        \label{eq: equal known dist subcase 2}
        Q^{\M_1}[\A'_i](\mathbf{v}) &= Q^{\M_2}[\A'_i](\mathbf{v}),\\
        \label{eq: equal denom num subcase 2}
        \sum_{\D}Q^{\M_1}[\mathbf{S}](\mathbf{v}) &= \sum_{\D}Q^{\M_2}[\mathbf{S}](\mathbf{v}),
    \end{align}
    but there exists $\mathbf{v}_0 \in \dom{\mathbf{V}}{}'$ such that:
    \begin{equation}\label{eq: not equal num subcase 2}
        Q^{\M_1}[\mathbf{S}](\mathbf{v}_0) \neq Q^{\M_2}[\mathbf{S}](\mathbf{v}_0).
    \end{equation}
    Note that Equations \eqref{eq: equal denom num subcase 2} and \eqref{eq: not equal num subcase 2} yield
    \begin{equation*}
         Q[\D|\mathbf{S}\setminus\D]^{\M_1}(\mathbf{v}_0) \neq Q[\D|\mathbf{S}\setminus\D]^{\M_2}(\mathbf{v}_0).
    \end{equation*}
    This means that $Q[\D|\mathbf{S}\setminus\D]$ is not c-gID from $(\mathbb{A}', \G)$.

    To this end, we consider two cases.

    \textbf{First case:} \\
    Suppose that there exists $i \in [0:m]$ such that $\widecheck{\mathbf{S}} \subset \mathbf{A}_i$.
    Then, consider the models $\M_1'$ and $\M_2'$ constructed in Section~\ref{sec: appendix new models subcase 2}. According to the definitions of models $\M_1'$ and $\M_2'$, for any $\mathbf{v}\in \dom{\mathbf{V}}{}'$, any $i\in [0:m']$, and any $g\in \{1, 2\}$, we have
    \begin{align*}
        & Q[\mathbf{A}'_i]^{\M_g'}(\mathbf{v}) := \sum_{U_0^{\M}}P^{\M_g}(u_0^{\M})\sum_{U_0[\mathcal{P}]}\prod_{\hat{p}\in \mathcal{P}_{U_0}}f_{\hat{p}}(U_0[\hat{p}])\sum_{\mathbf{U} \setminus \{U_0\}} \prod_{X \in \A_i'} P^{\M'}(x \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}} P^{\M'}(u^{\M}),\\
        \sum_{\D}&Q[\mathbf{S}]^{\M_g'}(\mathbf{v}) := \sum_{U_0^\M}P^{\M_g}(u_0^{\M})\sum_{U_0[\mathcal{P}]}\prod_{\hat{p}\in \mathcal{P}_{U_0}}f_{\hat{p}}(U_0[\hat{p}])\sum_{\D}\sum_{\mathbf{U} \setminus \{U_0\}} \prod_{X \in \mathbf{S}} P^{\M'}(x \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}} P^{\M'}(u^{\M}),\\
        & Q[\mathbf{S}]^{\M_g'}(\mathbf{v}) := \sum_{U_0^\M}P^{\M_g}(u_0^{\M})\sum_{U_0[\mathcal{P}]}\prod_{\hat{p}\in \mathcal{P}_{U_0}}f_{\hat{p}}(U_0[\hat{p}])\sum_{\mathbf{U} \setminus \{U_0\}} \prod_{X \in \mathbf{S}} P^{\M'}(x \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}} P^{\M'}(u^{\M}).
    \end{align*}
    We can rewrite the above equations using the notations $\theta'_{i, j}$, $\phi'_{j}$, and $\eta'_{j}$:
    \begin{align*}
        & Q[\mathbf{A}'_i]^{\M_1}(\mathbf{v}) = \sum_{j=1}^d \frac{1}{d}\theta'_{i, j}(\mathbf{v}), \\
        & Q[\mathbf{A}'_i]^{\M_2}(\mathbf{v}) = \sum_{j=1}^d p_j\theta'_{i, j}(\mathbf{v}), \\
        \sum_{\D} &Q[\mathbf{S}]^{\M_1}(\mathbf{v}) = \sum_{j=1}^d \frac{1}{d}\phi'_{j}(\mathbf{v}[\D^{\dagger}]), \\
        \sum_{\D} 
        &Q[\mathbf{S}]^{\M_2}(\mathbf{v}) = \sum_{j=1}^d p_j\phi'_{j}(\mathbf{v}[\D^{\dagger}]), \\
        & Q[\mathbf{S}]^{\M_1}(\mathbf{v}) = \sum_{j=1}^d \frac{1}{d}\eta'_{j}(\mathbf{v}), \\
        & Q[\mathbf{S}]^{\M_2}(\mathbf{v}) = \sum_{j=1}^d p_j\eta'_{j}(\mathbf{v}).
    \end{align*}
    The above equations imply the following equations.
    \begin{align*}
        & Q^{\M_2}[\A'_i](\mathbf{v}) - Q^{\M_1}[\A'_i](\mathbf{v}) = \sum_{j=1}^d (p_j - \frac{1}{d}) \theta_{i,j}'(\mathbf{v})
        \\
        \sum_{\D} & Q[\mathbf{S}]^{\M_2}(\mathbf{v}) - \sum_{\D} Q[\mathbf{S}]^{\M_1}(\mathbf{v}) = \sum_{j=1}^d (p_j - \frac{1}{d}) \phi_{j}'(\mathbf{v}[\D^{\dagger}])
        \\
        & Q^{\M_2}[\S](\mathbf{v}_0) -  Q^{\M_1}[\S](\mathbf{v}_0) = \sum_{j=1}^d (p_j - \frac{1}{d}) \eta_{j}'(\mathbf{v}_0)
        \\
        & \sum_{j=1}^d p_j - 1 = \sum_{j=1}^d (p_j - \frac{1}{d}).
    \end{align*}
    

     To prove the statement of the lemma it suffices to solve the following system of linear equations over parameters $\{p_j\}_{j=1}^d$ and show that it admits a solution. 
    \begin{align*}
        & \sum_{j=1}^d (p_j - \frac{1}{d}) \theta_{i,j}'(\mathbf{v}) = 0, \hspace{0.2cm}\forall \mathbf{v} \in \dom{\mathbf{V}}{}', i\in [0:m'],
        \\
        & \sum_{j=1}^d (p_j - \frac{1}{d}) \phi'_{j}(\dd^{\dagger}) = 0, \hspace{0.2cm}\forall \dd^{\dagger} \in \dom{\D^{\dagger}}{},
        \\
        & \sum_{j=1}^d (p_j - \frac{1}{d}) \eta'_{j}(\mathbf{v}_0) \neq 0, \hspace{0.2cm} \exists \mathbf{v}_0 \in \dom{\mathbf{V}}{}',
        \\
        & \sum_{j=1}^d (p_j - \frac{1}{d}) = 0,
        \\
        & 0<p_j<1, \hspace{0.2cm} \forall j \in [1:d].
    \end{align*}
    Analogous to the proof of Lemma \ref{lemma: construct models subcase 1}, we use Lemmas \ref{lemma: theta equal indices subcase 2},  \ref{lemma: phi equal indices subcase 2}, and  \ref{lemma: eta not equal indices subcase 2} instead of Lemmas \ref{lemma: gid equal indices}, \ref{lemma: equal indices summation subcase 1} and \ref{lemma: gid not equal indices} respectively and conclude the result.  

    \textbf{Second case:}\\
     Suppose that there is no $i \in [0:m]$ such that $\S \subset \mathbf{A}_i$. This case is identical to the \textbf{Second case} in the proof of Lemma~\ref{lemma: construct models subcase 1}.
\end{proof}






\subsection{Proof of Lemma \ref{lemma: construct models subcase 3}}\label{sec: supportive materials subcase 3}



Recall that $\textbf{S}=\Anc{\Y'\cup \Z'}{\G[\V \setminus \X']}$ and it is assumed that $\textbf{S}$ is not gID from $(\mathbb{A}, \G)$.  $\textbf{S}$ consists of the single c-components $\textbf{S}_1,\dots,\textbf{S}_n$, where $\textbf{S}_1$ is not gID.
Let $\S=\mathbf{S}_1$.
Clearly, we can add $\{\mathbf{S}_i\}_{i=2}^{n}$ to the known distributions and $\S$ remains not gID, i.e., $\S$ is not gID from $(\mathbb{A}', \G)$, where $\mathbb{A}' := \mathbb{A}\cup\{\mathbf{S}_i\}_{i=2}^{n}$. 
For simplicity, we denote $\mathbb{A}' = \{\mathbf{A}'_i\}_{i=0}^{m'}$.
Hence, using the method in Section \ref{sec: baseline}, we can construct two models $\M_1$ and $\M_2$ that are the same over the known distributions and different over $Q[\textbf{S}_1]$. These models  disagree on the distribution $Q[\mathbf{S}]$ as well, because $Q[\mathbf{S}] = \prod_{i=1}^{n}Q[\mathbf{S}_i]$. Below, we use these two models to introduce two new models to prove Lemma \ref{lemma: construct models subcase 3}.  

\subsubsection{New models for Lemma \ref{lemma: construct models subcase 3}} \label{sec: appendix new models subcase 3}
\renewcommand{\D}{\widetilde{\mathbf{D}}}
 Recall that $T$ is a node in $\S\setminus(\Z' \cup \Y')$, $p_T$ is a shortest directed path from node $T$ to the node $Z'$, $\widetilde{\mathbf{F}}$ is the set of all colliders on the path $\widetilde{p}$, $\widetilde{\mathcal{P}} := \{\widetilde{p}\} \cup \{p_T\} \cup \{ \widetilde{p}_W|W \in \widetilde{\mathbf{F}}\}$ and $\D$ is the set of all nodes on the paths from $\widetilde{\mathcal{P}}$ excluding the nodes in $\Z'$. Let $\D_{\mathcal{P}}$ be the set of all variables that belong to at least one path in $\widetilde{\mathcal{P}}$. 
 
 Similar to Section~\ref{sec: appendix new models subcase 2}, we now define new models $\widetilde{\M}_1$ and $\widetilde{\M}_2$ based on the models $\M_1$ and $\M_2$ defined in Section~\ref{sec: baseline}.
 We say that a variable $D$ is a \textbf{starting node} of the path $\hat{p}\in\widetilde{\mathcal{P}}$ if
\begin{itemize}
    \item $D = T$ and $\hat{p} = p_T$, or
    \item $D = Z'$ and $\hat{p} = \widetilde{p}$, or
    \item $D \in \widetilde{\mathbf{F}}$, i.e., it is a collider on path $\widetilde{p}$, and $\hat{p} = \widetilde{p}_D$.
\end{itemize}
Note that $D$ can be a starting node of only one path.

\newcommand{\domm}[2]{\widetilde{\mathfrak{X}}_{#2}(#1)}

For $R \in \mathbf{V}\cup \mathbf{U}$, let $\widetilde{\alpha}_{p}(R)$ be the number of paths in $\widetilde{\mathcal{P}}$ that contains $R$. Furthermore, we use $\domm{R}{}$ and $\dom{R}{}$ to denote its domain in $\widetilde{\M}_1$ or $\widetilde{\M}_2$ (variables in different models have the same domains) and in $\M_1$ or $\M_2$ respectively. We define $\domm{R}{}$ as follows:
\begin{itemize}
    \item If $R$ is a starting node for one of the paths in $\widetilde{\mathcal{P}}$, then:
    \begin{align*}
        & \domm{R}{} := \dom{R}{}\times[0:\kappa]^{\widetilde{\alpha}_{p}(R)-1}.
    \end{align*}
    \item If $R$ is not a starting node for any of the paths in $\widetilde{\mathcal{P}}$, then:
    \begin{align*}
        & \domm{R}{} := \dom{R}{}^{}\times[0:\kappa]^{\widetilde{\alpha}_{p}(R)}.
    \end{align*}
\end{itemize}
Consequently, if $R$ does not belong to any of the paths in $\widetilde{\mathcal{P}}$, then $\domm{R}{} := \dom{R}{}^{}$.

Consider $R \in \mathbf{V}\cup \mathbf{U}$. According to the domain definitions above, $R$ is a vector that is a concatenation of the vector coming from $\dom{R}{}$ in model $\M_1$ (or $\M_2$) and some additional coordinates. These additional coordinates are defined based on $\widetilde{\alpha}_{p}(R)$. More precisely, if $R$ is not a starting node of a path $\hat{p}\in \widetilde{\mathcal{P}}$, then there is a coordinate assigned to this path, denoted by $R[\hat{p}]$; otherwise, if $R$ is a starting node of $\hat{p} \in \widetilde{\mathcal{P}}$, then there is no coordinate assigned to this path.

Let $\mathbf{O} \subseteq \mathbf{V}\cup \mathbf{U}$. 
For any realization $\mathbf{o} \in \domm{\mathbf{O}}{}$ of $\mathbf{O}$ we denote by $\mathbf{o}^\M \in \dom{\mathbf{O}}{}$ a realization of $\mathbf{O}$ that is consistent with $\mathbf{o}$. With slight abuse of notation, we use $\mathbf{O}$ and $\mathbf{O}^{\M}$ to denote realizations of $\mathbf{O}$ in models $\widetilde{\M}_i$ and $\M_i$, respectively. $\mathbf{O}^{\M}$ means realizations in $\dom{\mathbf{O}}{}$ that are consistent with realizations in $\domm{\mathbf{O}}{}$.

Recall that $\D_{\mathcal{P}}$ is the set of all variables on the paths in $\widetilde{\mathcal{P}}$. Let $D\in \D_{\mathcal{P}}$. We denote by $\widetilde{\mathcal{P}}_D$ the set of all paths $\hat{p}$, such that $\hat{p}\in \widetilde{\mathcal{P}}$, $D$ belongs to the path $\hat{p}$, and $D$ is not a starting node of path $\hat{p}$. We are now ready to define the probabilities $P^{\widetilde{\M}_i}(D|\Pa{D}{\G})$ for any $D \in \mathbf{V}\cup\mathbf{U}$ and $i \in \{1, 2\}$.

\begin{itemize}
    \item If $D$ does not belong to the set $\D_{\mathcal{P}}$, we define
    \begin{align*}
        P^{\widetilde{\M}_i}(D|\Pa{D}{\G}) := P^{\M_i}(D|\Pa{D}{\G}).
    \end{align*}
    \item If $D$ belongs to the set $\D_{\mathcal{P}}\setminus \{Z'\}$, we define
    \begin{equation}
        P^{\widetilde{\M}_i}(D|\Pa{D}{\G}) := P^{\M_i}(D^{\M}|\Pa{D}{\G})\prod_{\hat{p}\in \widetilde{\mathcal{P}}_D}f_{\hat{p}}(D[\hat{p}]|\Pa{D}{\hat{p}}),
    \end{equation}
    where 
    \begin{itemize}
        \item if $D\neq Z'$ or $\hat{p} \neq p_T$, then $\Pa{D}{\hat{p}}$ is the set of parents of $D$ on the path $\hat{p}$;
        \item if $D = Z'$  and $\hat{p} = p_T$, then $\Pa{Z'}{\hat{p}}$ is the set of parents of $Z'$ on the paths $\widetilde{p}$ and $p_T$;
        \item $f_{\hat{p}}(D|\Pa{D}{\hat{p}})$ is given below.
    \end{itemize}

    \textbf{Definition of function} $f_{\hat{p}}(D[\hat{p}]|\Pa{D}{\hat{p}})$:
    \begin{itemize}
        \item When there exists a variable $W \in \widetilde{\mathbf{F}}$ such that $\hat{p}=\widetilde{p}_W$ and $D$ is a child of $W$ on path $\widetilde{p}_W$,
        \begin{equation*}
        f_{\hat{p}}(D[\hat{p}]|\Pa{D}{\hat{p}}) :=
        \begin{cases} 
            1-\kappa\epsilon &  \text{ if }  D[\hat{p}]\equiv W[\widetilde{p}] \pmod{\kappa+1}\\
            \epsilon &  \text{ if }  D[\hat{p}]\not\equiv W[\widetilde{p}] \pmod{\kappa+1}.
        \end{cases}
        \end{equation*}
        \item When $\hat{p}=p_T$ and $D$ is a child of $T$ on path $\hat{p}$,
        \begin{equation*}
        f_{\hat{p}}(D[\hat{p}]|\Pa{D}{\hat{p}}) :=
        \begin{cases} 
            1-\kappa\epsilon &  \text{ if }  D[\hat{p}]\equiv T^{\M} \pmod{\kappa+1}\\
            \epsilon &  \text{ if }  D[\hat{p}]\not\equiv T^{\M} \pmod{\kappa+1}.
        \end{cases}
        \end{equation*}
        \item When $\hat{p}=p_T$ and $D=Z'$. Suppose $Z'$ is a child of $W'$ on a path $p_T$ and is a child of $W''$ on a path $\widetilde{p}$,
        \begin{equation*}
        f_{\hat{p}}(Z'[p_T]|\Pa{D}{\hat{p}}) :=
        \begin{cases} 
            1-\kappa\epsilon &  \text{ if }  Z'[p_T]\equiv  W'[p_T] + W''[\widetilde{p}]\pmod{\kappa+1}\\
            \epsilon &  \text{ if }  Z'[p_T]\not\equiv W'[p_T] + W''[\widetilde{p}]  \pmod{\kappa+1}.
        \end{cases}
        \end{equation*}
        \item When $\Pa{D}{\hat{p}}=\emptyset$, 
        \begin{equation*}
            f_{\hat{p}}(D[\hat{p}]) := \frac{1}{\kappa+1}.
        \end{equation*}
        
        \item Otherwise,
        \begin{equation} \label{eq: define f otherwise subcase 3}
        f_{\hat{p}}(D[\hat{p}]|\Pa{D}{\hat{p}}) :=
        \begin{cases} 
            1-\kappa\epsilon &  \text{ if }  D[\hat{p}]\equiv \sum_{D' \in \Pa{D}{\hat{p}}}D'[\hat{p}] \pmod{\kappa+1}\\
            \epsilon &  \text{ if }  D[\hat{p}]\not\equiv \sum_{D' \in \Pa{D}{\hat{p}}}D'[\hat{p}] \pmod{\kappa+1},
        \end{cases}
        \end{equation}
        Note that $P^{\widetilde{\M}_i}(D|\Pa{D}{\G})$ is a probability distribution since for different paths $\hat{p}_1$ and $\hat{p}_2$, $D[\hat{p}_1]$ and $D[\hat{p}_2]$ are  different and also 
        \begin{equation*}
            \sum_{D[\hat{p}]\in \domm{D[\hat{p}]}{}} f_{\hat{p}}(D[\hat{p}]|\Pa{D}{\hat{p}}) = 1
        \end{equation*}
    \end{itemize}
\end{itemize}

Note that for any $W \in (\mathbf{V}\cup \mathbf{U})\setminus \{U_0\}$, we have
$$
P^{\widetilde{\M}_1}(W|\Pa{W}{\G}) = P^{\widetilde{\M}_2}(W|\Pa{W}{\G}).
$$ 
Therefore, we will use $P^{\widetilde{\M}}(W|\Pa{W}{\G})$ instead of $P^{\widetilde{\M}_1}(W|\Pa{W}{\G})$ or $P^{\widetilde{\M}_2}(W|\Pa{W}{\G})$ for  $W \in (\mathbf{V} \cup \mathbf{U})\setminus \{U_0\}$. 

We also have
\begin{equation}
\label{eq: prob U_0 subcase 3}
\begin{gathered}
    P^{\widetilde{\M}_1}(U_0) = \frac{1}{d} \prod_{\hat{p}\in \widetilde{\mathcal{P}}_{U_0}}f_{\hat{p}}(U_0[\hat{p}]), \\
    P^{\widetilde{\M}_2}(U_0) = P^{\M_2}(U_0^{\M}) \prod_{\hat{p}\in \widetilde{\mathcal{P}}_{U_0}}f_{\hat{p}}(U_0[\hat{p}]).
\end{gathered}
\end{equation}

Recall that $\mathbf{S}=\Anc{\Y'\cup Z'}{\G[\mathbf{V}\setminus\X']}$. Let $\D':=\mathbf{S}\setminus\D$ and $\D^{\dagger}:=\mathbf{V}\setminus\D$.  
For $i \in [0:m']$, $j\in [1:d]$, $\mathbf{v} \in \domm{\mathbf{V}}{}$ and $\mathbf{d}^{\dagger} \in \domm{\D^{\dagger}}{}$, we define $\widetilde{\theta}_{i, j}(\mathbf{v})$, $\widetilde{\phi}_{j}(\mathbf{d}^{\dagger})$ and $\widetilde{\eta}_{j}(\mathbf{v})$ as follows:
\begin{align}
    \label{eq: def theta subcase 3}
    & \widetilde{\theta}_{i, j}(\mathbf{v}) := \sum_{U_0[\widetilde{\mathcal{P}}]}\prod_{\hat{p}\in \widetilde{\mathcal{P}}_{U_0}}f_{\hat{p}}(U_0[\hat{p}])\sum_{\mathbf{U} \setminus \{U_0\}} \prod_{X \in \A_i'} P^{\widetilde{\M}}(x \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}} P^{\widetilde{\M}}(u^{\M}),\\
    \label{eq: def phi subcase 3}
    & \widetilde{\phi}_{j}(\mathbf{d}^{\dagger}) := \sum_{U_0[\widetilde{\mathcal{P}}]}\prod_{\hat{p}\in \widetilde{\mathcal{P}}_{U_0}}f_{\hat{p}}(U_0[\hat{p}])\sum_{\D}\sum_{\mathbf{U} \setminus \{U_0\}} \prod_{X \in \mathbf{S}} P^{\widetilde{\M}}(x \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}} P^{\widetilde{\M}}(u^{\M}),\\
    \label{eq: def eta subcase 3}
    & \widetilde{\eta}_{j}(\mathbf{v}) := \sum_{U_0[\widetilde{\mathcal{P}}]}\prod_{\hat{p}\in \widetilde{\mathcal{P}}_{U_0}}f_{\hat{p}}(U_0[\hat{p}])\sum_{\mathbf{U} \setminus \{U_0\}} \prod_{X \in \mathbf{S}} P^{\widetilde{\M}}(x \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}} P^{\widetilde{\M}}(u^{\M}),
\end{align}
where $\sum_{U_0[\widetilde{\mathcal{P}}]}$ is a summation over realizations of the random variables $\{U_0[\hat{p}]|\;\hat{p}\in \widetilde{\mathcal{P}}_{U_0}\}$. 

Next, we prove three lemmas similar to Lemmas \ref{lemma: theta equal indices subcase 2}, \ref{lemma: phi equal indices subcase 2}, and \ref{lemma: eta not equal indices subcase 2} for the new models $\widetilde{\M}_1$ and $\widetilde{\M}_2$.

\begin{lemma}
    \label{lemma: theta indices subcase 3}
    For any $\mathbf{v} \in \domm{\mathbf{V}}{}$ and $i\in[0:m']$,
    \begin{equation*}
        \widetilde{\theta}_{i,j_1}(\mathbf{v}) = \widetilde{\theta}_{i,j_2}(\mathbf{v}) = \cdots= \widetilde{\theta}_{i,j_{\frac{\kappa+1}{2}}}(\mathbf{v}).
    \end{equation*}
\end{lemma}
\begin{proof}
    By substituting $P^{\widetilde{\M}}$ from the above into Equation \eqref{eq: def theta subcase 3} and rearranging the terms, we obtain
    \begin{equation*}
    \begin{gathered}
        \widetilde{\theta}_{i, j}(\mathbf{v}) = 
        \sum_{\mathbf{U}[\widetilde{\mathcal{P}}]} 
        \prod_{\hat{U}[\hat{p}]\in \mathbf{U}[\widetilde{\mathcal{P}}]} f_{\hat{p}}(\hat{U})
        \prod_{\hat{X}[\hat{p}] \in \mathbf{A}'_i[\widetilde{\mathcal{P}}]} f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}}) \\
        \times\Big( \sum_{\mathbf{U}^{\M} \setminus \{U_0\}^{\M}}
         \prod_{X \in \A'_i} P^{\M}(x^{\M} \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}}\!P^{\M}(u^{\M})\Big)
    \end{gathered}
    \end{equation*}
    
    % Let $\mathbf{v}'\in \dom{\mathbf{V}}{}$ be a realization that is consistent with $\mathbf{v}^{\M}$.

    Note that the term inside the big parentheses of the above equation is equal to $\theta_{i, j}$ given by \eqref{eq: theta and eta}, i.e.,
    % \begin{equation*}
    %     \theta_{i, j}(\mathbf{v}') = \sum_{\mathbf{U} \setminus \{U_0\}^{\M}}
    %      \prod_{X \in \A'_i} P^{\M}(x^{\M} \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}}\!P^{\M}(u^{\M}),
    % \end{equation*}
    % where the right side of equation written for the realization $\mathbf{v}$.
    % The latter implies
    \begin{equation*}
        \widetilde{\theta}_{i, j}(\mathbf{v}) = \sum_{\mathbf{U}[\widetilde{\mathcal{P}}]} 
        \prod_{\hat{U}[\hat{p}]\in \mathbf{U}[\widetilde{\mathcal{P}}]} f_{\hat{p}}(\hat{U})
        \prod_{\hat{X}[\hat{p}] \in \mathbf{A}'_i[\widetilde{\mathcal{P}}]} f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}})
        \theta_{i, j}(\mathbf{v}^{\M}).
    \end{equation*}
    In the last equation, all terms on the right-hand side except $\theta_{i, j}(\mathbf{v}^{\M})$ are independent of the realization of $\{U_0\}^{\M}$, i.e., independent of the index $j$. For $j \in \{j_1, j_2, \dots, j_{\frac{\kappa+1}{2}}\}$, Lemma \ref{lemma: gid equal indices} states that $\theta_{i, j_1}(\mathbf{v})=\theta_{i, j_2}(\mathbf{v})=\dots=\theta_{i, j_{\frac{\kappa+1}{2}}}(\mathbf{v})$, which yields the result.
\end{proof}

\begin{lemma} \label{lemma: phi indices subcase 3}
     For any $\mathbf{d}^{\dagger} \in \domm{\D^{\dagger}}{}$:
    \begin{equation*}
        \widetilde{\phi}_{j_1}(\mathbf{d}^{\dagger}) = \widetilde{\phi}_{j_2}(\mathbf{d}^{\dagger})=\dots = \widetilde{\phi}_{j_{\frac{\kappa+1}{2}}}(\mathbf{d}^{\dagger}).
    \end{equation*}
\end{lemma}
\begin{proof}
    Similar to the previous lemma, by substituting $P^{\widetilde{\M}}$ from their definitions into Equation \eqref{eq: def phi subcase 3} and rearranging the terms, we obtain:
    \begin{equation}\label{eq: phi simplification subcase 3}
    \begin{gathered}
        \widetilde{\phi}_{j}(\mathbf{d}^{\dagger}) = \sum_{U_0[\widetilde{\mathcal{P}}]}
        \sum_{\mathbf{U}^{\M} \setminus \{U_0\}^{\M}}
        \sum_{\D}
        \prod_{\hat{p}\in \widetilde{\mathcal{P}}_{U_0}}f_{\hat{p}}(U_0[\hat{p}])
        \prod_{\hat{X}[\hat{p}] \in \mathbf{S}[\widetilde{\mathcal{P}}]} f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}})\times \\
        \times\Big(
         \prod_{X \in \mathbf{S}} P^{\M}(x^{\M} \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}}\!P^{\M}(u^{\M})\Big)
    \end{gathered}
    \end{equation}

    Suppose that $l_1$ and $l_2$ are two integers such that
    \begin{equation*}
    \begin{split}
        & \gamma_{l_1} = (2x, 0, \dots, 0),\\
        & \gamma_{l_2} = (2x+2 \pmod{\kappa+1}, 0, \dots, 0),
    \end{split}
    \end{equation*}
    and $x$ is an integer in $[0 : \frac{\kappa-1}{2}]$.
    We will prove that $\widetilde{\phi}_{ l_1}(\mathbf{d}^{\dagger})=\widetilde{\phi}_{l_2}(\mathbf{d}^{\dagger})$.

    Suppose that path $p$ is the sequence of variables $Z'$, $D'_1$, $D'_2$, \dots, $D'_{k'_1}$, $D'_{k'_1+1}:=Y'$ and path $p_T$ is the sequence of variables $T_0:=T$, $T_1$, \dots, $T_{k'_2}$, $T_{k'_2+1}:=Z'$. Note that the directed edge between $Z'$ and $D'_1$ points toward $Z'$, i.e., $Z'\leftarrow D_1'$, and for all $i\in [0:k'_2]$, variable $T_{i}$ is a parent of $T_{i+1}$ on the path $p_T$.
    
    On the other hand, since $T$ and $U_0$ are both in $\S$ ($\S=\mathbf{S}_1$ by construction), there exists a shortest path $U_0, \hat{S}_1', \hat{U}_1', \hat{S}_2', \hat{U}_2', \dots, \hat{U}_{l'}', T$, such that $U_0$ is a parent of $\hat{S}_1'\in \S$, $T$ is a child of $\hat{U}_{l'}'\in \U^{\S}$, and $\hat{U}_j'\in \U^{\S}$ is a parent of variables $\hat{S}_j'\in \S$ and $\hat{S}_{j+1}'\in \S$ for any $j \in [1:l'-1]$.
    Let $\hat{\mathbf{U}}':=\{\hat{U}_1', \dots, \hat{U}_{l'}'\}$, i.e., the unobserved nodes on this shortest path except $U_0$. For any given realization $\mathbf{o}_{1} \in \domm{\mathbf{U}\cup\D}{}$, we define $\mathbf{o}_{2} \in \domm{\mathbf{U}\cup\D}{}$ as follows,
    \begin{equation}
        \begin{split}
            & \mathbf{o}_{2}^{\M}[\hat{U}'_j] := \mathbf{o}_{1}^{\M}[\hat{U}'_j] + 2(-1)^{j} \pmod{\kappa+1}, \quad \forall j\in[0:l'],\\
            & \mathbf{o}_{2}^{\M}[T] := \mathbf{o}_{1}^{\M}[T] + 2(-1)^{l'} \pmod{\kappa+1}.
        \end{split}
    \end{equation}
    Note that if $\mathbf{o}_1^{\M}[U_0] = \gamma_{l_1}$ then $\mathbf{o}_2^{\M}[U_0] = \gamma_{l_2}$.
    With these modifications for any $S \in \S$, we obtain
    \begin{equation*}
        s_1 - M(S) \equiv s_2 - M(S) \pmod{\kappa+1},
    \end{equation*}
    where $s_1$ is a realization of $S\Big|_{(\mathbf{U}\cup\D, \D^{\dagger})=(\mathbf{o}_1, \dd^{\dagger})}$, $s_2$ is a realization of $S\Big|_{(\mathbf{U}\cup\D, \D^{\dagger})=(\mathbf{o}_2, \dd^{\dagger})}$, $M(\cdot)$ is given by Equation (\ref{eq: M(S)}). 
    This implies for any $S\in \mathbf{S}$, we have
    \begin{equation*}
    P^{\M}(s|\Pa{S}{\G})\Big|_{(\mathbf{U}\cup\D, \D^{\dagger})=(\mathbf{o}_1, \dd^{\dagger})}=P^{\M}(s|\Pa{S}{\G})\Big|_{(\mathbf{U}\cup\D, \D^{\dagger})=(\mathbf{o}_2, \dd^{\dagger})}.
    \end{equation*}
    Let $c = -2(-1)^{l'}$ and we define
    \begin{align*}
        & \mathbf{o}_2^{\M}[T_j[p_T]] := \mathbf{o}_1^{\M}[T_j[p_T]] - c \pmod{\kappa+1},\quad \forall j \in [1:k'_2],
        \\
        & \mathbf{o}_2^{\M}[D'_1[\widetilde{p}]] :=  \mathbf{o}_1^{\M}[D'_1[\widetilde{p}]] + c \pmod{\kappa+1}.
    \end{align*}
    This implies that for all $j \in [1:k'_2+1]$ we have
    \begin{equation*}
        f_{p_T}(T_j|\Pa{T_j}{p_T})\Big|_{(\mathbf{U}\cup\D, \D^{\dagger})=(\mathbf{o}_1, \dd^{\dagger})} = f_{p_T}(T_j|\Pa{T_j}{p_T})\Big|_{(\mathbf{U}\cup\D, \D^{\dagger})=(\mathbf{o}_2, \dd^{\dagger})}.
    \end{equation*}
    Assume that $D_j'$ is not a collider on the path $\widetilde{p}$ and $j\in [2:k_1'+1]$. We define $\mu(D_j')$ to be the number of colliders on a part of the path $\widetilde{p}$ from $D_1'$ to $D_{j-1}'$. Thus, for those $j\in[2:k_1'+1]$ that $D_j'$ is not a collider, we define
    \begin{equation}\label{eq: phi modifications p subcase 3}
        \mathbf{o}_2^{\M}[D_j'[\widetilde{p}]] := \mathbf{o}_1^{\M}[D_j'[\widetilde{p}]] + c(-1)^{\mu(D_j')}.
    \end{equation}
    Note that the modifications in \eqref{eq: phi modifications p subcase 3} might only affect the function $f_{\widetilde{p}}(\cdot|\cdot)$. Next, we show that after these modifications, function $f_{\widetilde{p}}(\cdot|\cdot)$ remains unchanged. To do so, for $j \in [1:k_1'+1]$ we consider four different cases:
    \begin{enumerate}
        \item If $D_j'$ has no parents, then it is obvious that
         \begin{equation*}
            f_{\widetilde{p}}(D_j'[\widetilde{p}])\Big|_{(\mathbf{U}\cup\D)=(\textbf{o}_1)} = f_{\widetilde{p}}(D_j'[\widetilde{p}])\Big|_{(\mathbf{U}\cup\D)=(\textbf{o}_2)}.
        \end{equation*}
        \item If $D_j'$ is a collider, then $\mu(D_{j+1}') = \mu(D_{j-1}')+1$ and
        \begin{align*}
            & \mathbf{o}_1[D_{j+1}'[\widetilde{p}]] + \mathbf{o}_1[D_{j-1}'[\widetilde{p}]] = \mathbf{o}_2[D_{j+1}'[\widetilde{p}]] + \mathbf{o}_2[D_{j-1}'[\widetilde{p}]],
        \end{align*}
        and hence, according to the Equation \eqref{eq: define f otherwise subcase 3}, we have
        \begin{equation*}
          f_{\widetilde{p}}(D_j'[\widetilde{p}]|\Pa{D_j'}{\widetilde{p}})\Big|_{(\mathbf{U}\cup\D)=(\mathbf{o}_1)} = f_{\widetilde{p}}(D_j'[\widetilde{p}]|\Pa{D_j'}{\widetilde{p}})\Big|_{(\mathbf{U}\cup\D)=(\textbf{o}_2)}.
        \end{equation*}
        
        \item If $D'_j$ is a child of $D'_{j+1}$, then $\mu(D'_{j}) = \mu(D'_{j+1})$ and
        \begin{align*}
            & \mathbf{o}_1[D_{j}'[\widetilde{p}]] - \mathbf{o}_1[D_{j+1}'[\widetilde{p}]] = \mathbf{o}_2[D_{j}'[\widetilde{p}]] - \mathbf{o}_2[D_{j+1}'[\widetilde{p}]].
        \end{align*}
        According to Equation \eqref{eq: define f otherwise subcase 3}, we imply that
        \begin{equation*}
           f_{\widetilde{p}}(D_j'[\widetilde{p}]|\Pa{D_j'}{\widetilde{p}})\Big|_{(\mathbf{U}\cup\D)=(\textbf{o}_1)} = f_{\widetilde{p}}(D_j'[\widetilde{p}]|\Pa{D_j'}{\widetilde{p}})\Big|_{(\mathbf{U}\cup\D)=(\textbf{o}_2)}.
        \end{equation*}
        
        \item If $D'_j$ is a child of $D'_{j-1}$, then $\mu(D_{j}') = \mu(D_{j-1}')$ and
        \begin{align*}
            & \mathbf{o}_1[D_{j}'[\widetilde{p}]] - \mathbf{o}_1[D_{j-1}'[\widetilde{p}]] = \mathbf{o}_2[D_{j}'[\widetilde{p}]] - \mathbf{o}_2[D_{j-1}'[\widetilde{p}]].
        \end{align*}
        Similarly, according to Equation \eqref{eq: define f otherwise subcase 3}, we get
        \begin{equation*}
           f_{\widetilde{p}}(D_j'[\widetilde{p}]|\Pa{D_j'}{\widetilde{p}})\Big|_{(\mathbf{U}\cup\D)=(\textbf{o}_1)} = f_{\widetilde{p}}(D_j'[\widetilde{p}]|\Pa{D_j'}{\widetilde{p}})\Big|_{(\mathbf{U}\cup\D)=(\textbf{o}_2)}.
        \end{equation*}
    \end{enumerate}

    This concludes that for any $j\in[1:k_1'+1]$,
    \begin{equation*}
        f_{\widetilde{p}}(D_j'[\widetilde{p}]|\Pa{D_j'}{\widetilde{p}})\Big|_{(\mathbf{U}\cup\D)=(\textbf{o}_1)} = f_{\widetilde{p}}(D_j'[\widetilde{p}]|\Pa{D_j'}{\widetilde{p}})\Big|_{(\mathbf{U}\cup\D)=(\textbf{o}_2)}.
    \end{equation*}

    Note that the aforementioned transformation of $\mathbf{o}_1$ affects only those realizations of variables that are used for marginalization in the Equation \eqref{eq: phi simplification subcase 3}. Putting the above results together implies that the terms in Equation \eqref{eq: phi simplification subcase 3} remain unchanged, i.e.,
    \begin{align*}
        & \prod_{\hat{p}\in \widetilde{\mathcal{P}}_{U_0}}f_{\hat{p}}(U_0[\hat{p}])
        \prod_{\hat{X}[\hat{p}] \in \mathbf{S}[\widetilde{\mathcal{P}}]} f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}}) \\
        & \times\Big(
        \prod_{X \in \mathbf{S}} P^{\M}(x^{\M} \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U}}\!P^{\M}(u^{\M})\Big)\Big|_{(\mathbf{U}\cup\D)=(\textbf{o}_1)} = \\
        & = \prod_{\hat{p}\in \widetilde{\mathcal{P}}_{U_0}}f_{\hat{p}}(U_0[\hat{p}])
        \prod_{\hat{X}[\hat{p}] \in \mathbf{S}[\widetilde{\mathcal{P}}]} f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}}) \\
        & \times\Big(
        \prod_{X \in \mathbf{S}} P^{\M}(x^{\M} \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}}\!P^{\M}(u^{\M})\Big)\Big|_{(\mathbf{U}\cup\D)=(\textbf{o}_2)}
    \end{align*}
    
    This implies that $\widetilde{\phi}_{l_1}(\mathbf{d}^{\dagger})=\widetilde{\phi}_{l_2}(\mathbf{d}^{\dagger})$. By varying $x$ within $[0 : \frac{\kappa-1}{2}]$ in the definition of $\gamma_{l_1}$ and $\gamma_{l_2}$, we  obtain the result.
\end{proof}

\begin{lemma}
    \label{lemma: eta indices subcase 3}
    There exists $0<\epsilon<\frac{1}{\kappa}$, such that there exists $\mathbf{v}_0 \in \domm{\mathbf{V}}{}$ and $1\leq r <t\leq \frac{\kappa+1}{2}$ such that
    \begin{equation*}
        \widetilde{\eta}_{j_r}(\mathbf{v}_0) \neq \widetilde{\eta}_{j_t}(\mathbf{v}_0).
    \end{equation*}
\end{lemma}
\begin{proof}
    By substituting $P^{\widetilde{\M}}$ from their definitions into Equation \eqref{eq: def eta subcase 3} and rearranging the terms, we obtain
    \begin{equation}\label{eq: eta simplification subcase 3}
    \begin{gathered}
        \widetilde{\eta}_{j}(\mathbf{v}_0) = 
        \sum_{\mathbf{U}^{\M}\setminus \{U_0\}^{\M}}
        \sum_{\mathbf{U}[\widetilde{\mathcal{P}}]}
        \prod_{\hat{U}[\hat{p}]\in \mathbf{U}[\widetilde{\mathcal{P}}]} f_{\hat{p}}(\hat{U})
        \prod_{\hat{X}[\hat{p}] \in \mathbf{S}[\widetilde{\mathcal{P}}]} f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}}) \times\\
        \times\Big(
         \prod_{X \in \mathbf{S}} P^{\M}(x^{\M} \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}}\!P^{\M}(u^{\M})\Big).
    \end{gathered}
    \end{equation}

    Next, we define $\mathbf{v}_0\in \domm{\mathbf{V}}{}$ such that the conditions in the lemma hold.
    
    \begin{itemize}
        \item For any path $\hat{p}\in \widetilde{\mathcal{P}}$ and any node $W$ on the path $\hat{p}$ that is not a starting node for path $\hat{p}$ we define:
        \begin{equation*}
            \mathbf{v}_0[W[\hat{p}]]:=0;
        \end{equation*}
        \item For any variable $S \in \S$, we define
        \begin{equation*}
            \mathbf{v}_0^{\M}[S] := 0;
        \end{equation*}
        \item For the remaining part of $\mathbf{v}_0$, we choose a realization such that, for the selected $\mathbf{v}_0$, there exists a realization of the unobserved variables $\mathbf{U}$ that ensures $\mathbb{I}(S)=0$ for all $S\in \S$. This is clearly possible due to the definition of $\mathbb{I}(S)$.
    \end{itemize}
    
    Assume $r$ and $t$ are such that $\gamma_{j_r} = (0, 0, \dots, 0)$ and $\gamma_{j_t} = (2, 0, \dots, 0)$.  To finish the proof of the lemma, it is enough to show that $\widetilde{\eta}_{j_r}(\mathbf{v}_0)$ and $\widetilde{\eta}_{j_t}(\mathbf{v}_0)$ are two different polynomial functions of parameter $\epsilon$. We prove that those two polynomials are different by showing that $\widetilde{\eta}_{j_r}(\mathbf{v}_0)\neq\widetilde{\eta}_{j_t}(\mathbf{v}_0)$ for $\epsilon=0$. 
    
    We only need to consider the non-zero terms in Equation \eqref{eq: eta simplification subcase 3}. From \eqref{eq: eta simplification subcase 3}, we have
    \begin{equation}
    \label{eq: main term lemma subcase 3}
    \begin{gathered}
         \prod_{\hat{U}[\hat{p}]\in \mathbf{U}[\widetilde{\mathcal{P}}]} f_{\hat{p}}(\hat{U})
        \prod_{\hat{X}[\hat{p}] \in \mathbf{S}[\widetilde{\mathcal{P}}]} f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}})\\
        \times\Big(
         \prod_{X \in \mathbf{S}} P^{\M}(x^{\M} \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}}\!P^{\M}(u^{\M})\Big).
    \end{gathered}
    \end{equation}
    Note that $f_{\hat{p}}(\hat{U})=\frac{1}{\kappa+1}$ and $f_{\hat{p}}(\hat{X}|\Pa{\hat{X}}{\hat{p}})$ is non-zero only:
    \begin{itemize}
        \item when $\hat{p} = p_T$, $\hat{X}$ is a child of $T$ on the path $p_T$, and
        \begin{equation*}
            \hat{X}[\hat{p}] \equiv T^{\M} \pmod{\kappa + 1}.
        \end{equation*}

        \item when $\hat{p} = p_T$, $\hat{X}=Z'$, and
        \begin{equation*}
            Z'[\hat{p}] \equiv W'[\hat{p}] + W''[\widetilde{p}] \pmod{\kappa + 1},
        \end{equation*}
        where $W'$ is a parent of $Z'$ on the path $p_T$ and $W''$ is a parent of $Z'$ on the path $\widetilde{p}$.
        
        \item when there exists a variable $W\in \mathbf{F}$ such that $\hat{p}=\widetilde{p}_W$, $\hat{X}$ is a child of $W$ on the path $\widetilde{p}_W$, and
        $$
        \hat{X}[\hat{p}] \equiv W[\widetilde{p}] \pmod{\kappa+1}.
        $$
        
        \item when the following holds
        $$
        \hat{X}[\hat{p}] \equiv \sum_{\hat{X}'\in \Pa{\hat{X}}{\hat{p}}\setminus\{W\}}\hat{X}'[\hat{p}] \pmod{\kappa+1}.
        $$
    \end{itemize}
    Similarly, $P^\M(X|\Pa{X}{\G})$ is non-zero
    \begin{itemize}
        \item if $\mathbb{I}(X)=1$ (i.e. $P^\M(X^{\M}|\Pa{X}{\G})=\frac{1}{\kappa+1}$), or
        
        \item if $X^{\M} \equiv M(X) \pmod{\kappa+1}$ for $P^\M(X^{\M}|\Pa{X}{\G})$.
    \end{itemize}

    Let us fix a realization $\mathbf{u} \in \domm{\mathbf{U}\setminus\{U_0^{\M}\}}{}$. We consider two scenarios:
    
    \textbf{I)} Assume that for this realization, there is a variable $S\in \S$, such that $\mathbb{I}(S)=1$ and $S$ is the closest variable to $U_0$ considering only paths with bidirected edges in $\G'[\S]$. The value of $S^{\M}$ does not depend on its parents because of $\mathbb{I}(S)=1$ and Equation \eqref{eq: def P(S|Pa(S)) gid}.
    Additionally, in the graph $\G'[\S]$ there exists a path $U_0, \hat{S}_1', \hat{U}_1', \hat{S}_2', \hat{U}_2', \dots, \hat{U}_{l'}', S$, such that $U_0$ is a parent of $\hat{S}_1'\in \S$, $S$ is a child of $\hat{U}_{l'}'\in \U^{\S}$, and $\hat{U}_j'\in \U^{\S}$ is a parent of variables $\hat{S}_j'\in \S$ and $\hat{S}_{j+1}'\in \S$ for $j \in [1:l'-1]$.
    Let $\hat{\mathbf{U}}':=\{\hat{U}_1', \dots, \hat{U}_{l'}'\}$.
    We define $\mathbf{u}' \in \domm{\mathbf{U}\setminus\{U_0^{\M}\}}{}$
    that is consistent with $\mathbf{u}$ except for the variables in $\hat{\mathbf{U}}'$. For these variables, we define
    \begin{equation}
        \begin{split}
            & \mathbf{u}'^{\M}[\hat{U}'_j] := \mathbf{u}^{\M}[\hat{U}'_j] + 2(-1)^{j} \pmod{\kappa+1}, \quad j\in[1:l'].
            % & \mathbf{u}_{2}^{\M}[U] := \mathbf{u}_{1}^{\M}[U], \quad \forall U\in \U^{\S} \setminus \hat{\mathbf{U}},
        \end{split}
    \end{equation}
    
    With this modification for any $\widetilde{S}\in \mathbf{S}$, we have
    \begin{equation*}
    P^{\M}(\widetilde{s}|\Pa{\widetilde{S}}{\G})\Big|_{(\mathbf{U})=(\mathbf{u}, \gamma_{j_r})}=P^{\M}(\widetilde{s}|\Pa{\widetilde{S}}{\G})\Big|_{(\mathbf{U})=(\mathbf{u}', \gamma_{j_t})}.
    \end{equation*}
    Therefore for all such realizations of $\mathbf{u}$ the summation of the following terms for both $\widetilde{\eta}_{j_r}(\mathbf{v}_0)$ and $\widetilde{\eta}_{j_t}(\mathbf{v}_0)$ will be the same,
    \begin{equation}
    \label{eq: main term eta subcase 3}
    \begin{gathered}
         \prod_{\hat{U}[\hat{p}]\in \mathbf{U}[\widetilde{\mathcal{P}}]} f_{\hat{p}}(\hat{U})
        \prod_{\hat{X}[\hat{p}] \in \mathbf{S}[\widetilde{\mathcal{P}}]} f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}}) \times\\
        \times\Big(
         \prod_{X \in \mathbf{S}} P^{\M}(x^{\M} \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}}\!P^{\M}(u^{\M})\Big).
    \end{gathered}
    \end{equation}

    \textbf{II)} Assume that for all $S\in \S$, we have $\mathbb{I}(S)=0$. We consider a realization $U_0^{\M}=\gamma_{j_r}$ and $\mathbf{u}$ such that:
    \begin{itemize}
        \item $\mathbf{u}[\U^{\S}] = \mathbf{0}$.
        \item for all $U\in \mathbf{U}$ and any path $\hat{p}\in \mathcal{P}$ which contains $U$, $\mathbf{u}[U[\hat{p}]] = 0$.
    \end{itemize}
    We claim that for such $\mathbf{u}$,
    \begin{equation*}
    \begin{gathered}
        \prod_{\hat{U}[\hat{p}]\in \mathbf{U}[\widetilde{\mathcal{P}}]} f_{\hat{p}}(\hat{U})
        \prod_{\hat{X}[\hat{p}] \in \mathbf{S}[\widetilde{\mathcal{P}}]} f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}}) \times\\
        \times\Big(
         \prod_{X \in \mathbf{S}} P^{\M}(x^{\M} \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}}\!P^{\M}(u^{\M})\Big)
    \end{gathered}
    \end{equation*}
    is non-zero. To prove this claim we consider 5 cases:
    \begin{itemize}
        \item assume that $\hat{p}=p_T$ and $\hat{X}=Z'$. Denote by $W'$ the parent of $Z'$ on the path $p_T$ and by $W''$ the parent of $Z'$ on the path $\widetilde{p}$. From the definitions of $\mathbf{u}$ and $\mathbf{v}_0$, we get
        \begin{equation*}
            \hat{X}[\hat{p}] \equiv W'[\hat{p}] + W''[\widetilde{p}] \pmod{\kappa+1},
        \end{equation*}
        and therefore $f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}}) = 1$.
        The latter is true because $\hat{X}[\hat{p}]\equiv W'[\hat{p}]\equiv W''[\widetilde{p}]\equiv 0 \pmod{\kappa+1}$.
        
        \item assume that $\hat{p} = p_T$ and $\hat{X}$ is a child of $T$. From the definitions of $\mathbf{u}$ and $\mathbf{v}_0$, we get
        \begin{equation*}
            \hat{X}[\hat{p}] \equiv T^{\M} \pmod{\kappa+1},
        \end{equation*}
        and therefore $f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}}) = 1$. The above holds because all the variables in the above equation are zero.
        
        \item assume that $\hat{p}\in \widetilde{\mathcal{P}}$ and there exists a variable $W$ such that $\hat{p}=\widetilde{p}_W$. Let $\hat{X}$ be a child of $W$ on the path $\widetilde{p}_W$. From the definitions of $\mathbf{u}$ and $\mathbf{v}_0$, we get
        $$
        \hat{X}[\hat{p}] \equiv W[\hat{p}] \pmod{\kappa+1},
        $$ 
        and therefore $f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}})=1$. Again, the above holds because all the terms are zero.
        
        \item assume that $\hat{p}\in \widetilde{\mathcal{P}}$ and $\hat{X}$ is a variable on this path such that it is neither a starting node of the path $\hat{p}$ nor a child of a starting node on the path $\hat{p}$. Then, from the definitions of $\mathbf{v}_0$ and $\mathbf{u}$, we get
        $$
        \hat{X}[\hat{p}] \equiv \sum_{\hat{X}'\in \Pa{\hat{X}}{\hat{p}}\setminus\{W\}}\hat{X}'[\hat{p}] \pmod{\kappa+1},
        $$
        and therefore $f_{\hat{p}}(\hat{X}[\hat{p}]|\Pa{\hat{X}}{\hat{p}})=1$. Again, the above holds because all the terms are zero.
        
        \item assume $X\in \S$. Then, from the definitions of $\mathbf{v}_0$ and $\mathbf{u}$, we get
        $$
        X^{\M} \equiv M(X) \pmod{\kappa+1},
        $$
        and consequently $P^{\M}(x^{\M}|\Pa{X}{\G})=1$.
    \end{itemize}

    Now we consider the case when $U_0^\M = \gamma_{j_t}$. 
    % Assume that $W\in \mathbf{F}$ and $W'$ is the last descendant of the path $\widetilde{p}_W$ of variable $W$. Recall the properties which we proved in the beginning, then $W'$ is in a set $\mathbf{Z'}$ and by the definition of $\mathbf{v}_0$ we have $W'[\widetilde{p}_W]=0$. Assume $W''$ is a parent of $W'$ on the path $\widetilde{p}_W$. Note that $f_{\widetilde{p}_W}(W'[\widetilde{p}_W]|\Pa{W'}{\widetilde{p}_W})$ is not equal to zero if and only if $W''[\widetilde{p}_W]=0$. Repeating this process by going from the node $W'$ to $W$ we conclude that $W[\widetilde{p}]$ must be equal to 0, otherwise the term defined by Equation \ref{eq: main term eta subcase 3} would be equal to 0. 
    % Assume that $Z', W'_1, W'_2, \dots, W'_{k'}, W'_{k'+1}:=Y'$ is a path $\widetilde{p}$. Then we prove by induction that $W'_{i}=0$ for all $i\in [1:k'+1]$. Be definition of $\mathbf{v_0}$ we know that $Y'[\widetilde{p}]=0$. Assume that $W'_{i}[\widetilde{p}]=0$ for all $i \in [k''+1:k']$, let's prove that $W''_{k''}[\widetilde{p}]=0$ too. We consider the following three cases that concludes the proof of before claimed fact.
    % \begin{itemize}
    %     \item $W'_{k''}$ is a collider on a path $\widetilde{p}$. Then the fact that $W''_{k''}[\widetilde{p}]=0$ follows immediately from the observations made before.
    %     \item $W'_{k''}$ is a child of $W'_{k''+1}$ and is not a collider. Then $f_{\widetilde{p}}(W'_{k''}|\Pa{W''_{k''}}{p})$ is not equal to zero if and only if $W'_{k''}[p] = W'_{k''+1}[p] = 0$.
    %     \item $W'_{k''}$ is a parent of $W'_{k''+1}$. Then $f_p(W'_{k''+1}|\Pa{W''_{k''}}{\widetilde{p}})$ is not equal to zero if and only if $0 = W'_{k''+1}[\widetilde{p}] = W'_{k''}[\widetilde{p}]$.
    % \end{itemize}

    % Since $W'_1$ must be equal to 0 then $P'(Z'|\Pa{Z'}{\G}) = P^{M}(Z'|\Pa{Z'}{\G})$. In the context of all these arguments we simplify the Equation \eqref{eq: main term eta subcase 2} to the following:
    Note that the following term depends only on the realizations of $\mathbf{U}^{\M}$ and $\mathbf{v}_0^{\M}$:
    \begin{equation*}
        \prod_{X \in \mathbf{S}} P^{\M}(x^{\M} \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}}\!P^{\M}(u^{\M}).
    \end{equation*}
    However by the proof of Lemma 6 \cite{kivva2022revisiting} we know that there is no realization of $\mathbf{U}^{\M}$ such that:
    \begin{itemize}
        \item $\mathbb{I}(S)=0$ for all $S\in \S$, and
        \item $U_0^{\M}=\gamma_{j_t}$, and
        \item $x^{\M} \equiv M(X) \pmod{\kappa + 1}$ for all $X\in \S$. The latter is a necessary condition for $P^{\M}(x|\Pa{X}{\G})$ being non-zero.
    \end{itemize}

    To summarize, we showed that for $U_0^{\M}=\gamma_{j_r}$, Equation \eqref{eq: main term eta subcase 3} is non-zero while it is zero for $U_0^{\M}=\gamma_{j_t}$. This implies that $\widetilde{\eta}_{j_r}(\mathbf{v}_0)\neq\widetilde{\eta}_{j_t}(\mathbf{v}_0)$ for $\epsilon=0$.
\end{proof}

\subsubsection{Proof of Lemma \ref{lemma: construct models subcase 3}}
\begin{customlem}{\ref{lemma: construct models subcase 3}}
    Let $\mathbf{S}: = \Anc{\Y', \Z'}{\G[\mathbf{V} \setminus \X']}$ and $\D$ is a set of all nodes on the paths in $\mathcal{P}$ excluding $\Z'$. Then,
    \begin{equation}
        P_{\x'}(\widetilde{\dd}|\mathbf{s}\setminus \widetilde{\dd})=\frac{
        Q[\mathbf{S}]
        }{
        \sum_{\D} Q[\mathbf{S}]
        } = Q[\D|\mathbf{S}\setminus\D]
    \end{equation}
    is not c-gID from $(\mathbb{A}, \G)$.
\end{customlem}
\begin{proof}
    We will show  that $Q[\D|\mathbf{S}\setminus\D]$ is not c-gID from $(\mathbb{A}', \G)$, where $\mathbb{A}' := \mathbb{A}\cup\{\mathbf{S}_i\}_{i=2}^{n}$. 
    To this end, we will specify two models $\M_1$ and $\M_2$ such that for each $i \in [0:m']$ and any $\mathbf{v}\in \domm{\mathbf{V}}{}$:
    \begin{align}
        \label{eq: equal known dist subcase 3}
        Q^{\M_1}[\A'_i](\mathbf{v}) &= Q^{\M_2}[\A'_i](\mathbf{v}),\\
        \label{eq: equal denom num subcase 3}
        \sum_{\D}Q^{\M_1}[\mathbf{S}](\mathbf{v}) &= \sum_{\D}Q^{\M_2}[\mathbf{S}](\mathbf{v}),
    \end{align}
    but there exists $\mathbf{v}_0 \in \domm{\mathbf{V}}{}$ such that:
    \begin{equation}\label{eq: not equal num subcase 3}
        Q^{\M_1}[\mathbf{S}](\mathbf{v}_0) \neq Q^{\M_2}[\mathbf{S}](\mathbf{v}_0).
    \end{equation}
    Note that Equations \eqref{eq: equal denom num subcase 3} and \eqref{eq: not equal num subcase 3} yield
    \begin{equation*}
         Q[\D|\mathbf{S}\setminus\D]^{\M_1}(\mathbf{v}_0) \neq Q[\D|\mathbf{S}\setminus\D]^{\M_2}(\mathbf{v}_0).
    \end{equation*}
    This means that $Q[\D|\mathbf{S}\setminus\D]$ is not c-gID from $(\mathbb{A}', \G)$.

    To this end, we consider two cases.

    \textbf{First case:} \\
    Suppose that there exists $i \in [0:m]$ such that $\widecheck{\mathbf{S}} \subset \mathbf{A}_i$.
    Further we consider models $\widetilde{\M}_1$ and $\widetilde{\M}_2$ constructed in Section \ref{sec: appendix new models subcase 3}. According to the definitions of models $\widetilde{\M}_1$ and $\widetilde{\M}_2$ for any $\mathbf{v}\in \domm{\mathbf{V}}{}$, and any $i\in [0:m']$, and any $g\in\{1, 2\}$:
    \begin{align*}
        & Q[\mathbf{A}'_i]^{\widetilde{\M}_g}(\mathbf{v}) := \sum_{U_0^\M}P^{\M_g}(u_0^{\M})\sum_{U_0[\widetilde{\mathcal{P}}]}\prod_{\hat{p}\in \widetilde{\mathcal{P}}_{U_0}}f_{\hat{p}}(U_0[\hat{p}])\sum_{\mathbf{U} \setminus \{U_0\}} \prod_{X \in \A_i'} P^{\widetilde{\M}}(x \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}} P^{\widetilde{\M}}(u),\\
        \sum_{\D}&Q^{\widetilde{\M}_g}[\mathbf{S}](\mathbf{v}) := \sum_{U_0^\M}P^{\M_g}(u_0^{\M})\sum_{U_0[\widetilde{\mathcal{P}}]}\prod_{\hat{p}\in \widetilde{\mathcal{P}}_{U_0}}f_{\hat{p}}(U_0[\hat{p}])\sum_{\D}\sum_{\mathbf{U} \setminus \{U_0\}} \prod_{X \in \mathbf{S}} P^{\widetilde{\M}}(x \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}} P^{\widetilde{\M}}(u),\\
        & Q^{\widetilde{\M}_g}[\mathbf{S}](\mathbf{v}) := \sum_{U_0^\M}P^{\M_g}(u_0^{\M})\sum_{U_0[\widetilde{\mathcal{P}}]}\prod_{\hat{p}\in \widetilde{\mathcal{P}}_{U_0}}f_{\hat{p}}(U_0[\hat{p}])\sum_{\mathbf{U} \setminus \{U_0\}} \prod_{X \in \mathbf{S}} P^{\widetilde{\M}}(x \mid \Pa{X}{\G}) \prod_{U\in \mathbf{U} \setminus \{U_0\}} P^{\widetilde{\M}}(u).
    \end{align*}
    We can rewrite the above equations using the notations $\widetilde{\theta}_{i, j}$, $\widetilde{\phi}_{j}$, and $\widetilde{\eta}_{j}$:
    \begin{align*}
        & Q[\mathbf{A}'_i]^{\widetilde{\M}_1}(\mathbf{v}) = \sum_{j=1}^d \frac{1}{d}\widetilde{\theta}_{i, j}(\mathbf{v}), \\
        & Q[\mathbf{A}'_i]^{\widetilde{\M}_2}(\mathbf{v}) = \sum_{j=1}^d p_j\widetilde{\theta}_{i, j}(\mathbf{v}), \\
        \sum_{\D} &Q[\mathbf{S}]^{\widetilde{\M}_1}(\mathbf{v}) = \sum_{j=1}^d \frac{1}{d}\widetilde{\phi}_{j}(\mathbf{v}[\D^{\dagger}]), \\
        \sum_{\D} 
        &Q[\mathbf{S}]^{\widetilde{\M}_2}(\mathbf{v}) = \sum_{j=1}^d p_j\widetilde{\phi}_{j}(\mathbf{v}[\D^{\dagger}]), \\
        & Q[\mathbf{S}]^{\widetilde{\M}_1}(\mathbf{v}) = \sum_{j=1}^d \frac{1}{d}\widetilde{\eta}_{j}(\mathbf{v}), \\
        & Q[\mathbf{S}]^{\widetilde{\M}_2}(\mathbf{v}) = \sum_{j=1}^d p_j\widetilde{\eta}_{j}(\mathbf{v}).
    \end{align*}
    The above equations imply the following equations.
    \begin{align*}
        & Q^{\widetilde{\M}_2}[\A'_i](\mathbf{v}) - Q^{\widetilde{\M}_1}[\A'_i](\mathbf{v}) = \sum_{j=1}^d (p_j - \frac{1}{d}) \widetilde{\theta}_{i,j}(\mathbf{v})
        \\
        \sum_{\D} & Q[\mathbf{S}]^{\widetilde{\M}_2}(\mathbf{v}) - \sum_{\D} Q[\mathbf{S}]^{\widetilde{\M}_1}(\mathbf{v}) = \sum_{j=1}^d (p_j - \frac{1}{d}) \widetilde{\phi}_{j}(\mathbf{v}[\D^{\dagger}])
        \\
        & Q^{\widetilde{\M}_2}[\mathbf{S}](\mathbf{v}_0) -  Q^{\widetilde{\M}_1}[\mathbf{S}](\mathbf{v}_0) = \sum_{j=1}^d (p_j - \frac{1}{d}) \widetilde{\eta}_{j}(\mathbf{v}_0)
        \\
        & \sum_{j=1}^d p_j - 1 = \sum_{j=1}^d (p_j - \frac{1}{d}).
    \end{align*}
    

     To prove the statement of the lemma, it suffices to show that the following system of linear equations over the parameters $\{p_j\}_{j=1}^d$ admits a solution.
    \begin{align*}
        & \sum_{j=1}^d (p_j - \frac{1}{d}) \widetilde{\theta}_{i,j}(\mathbf{v}) = 0, \hspace{0.2cm}\forall \mathbf{v} \in \domm{\mathbf{V}}{}, i\in [0:m'],
        \\
        & \sum_{j=1}^d (p_j - \frac{1}{d}) \widetilde{\phi}_{j}(\dd^{\dagger}) = 0, \hspace{0.2cm}\forall \dd^{\dagger} \in \domm{\D^{\dagger}}{}, i\in [0:m'],
        \\
        & \sum_{j=1}^d (p_j - \frac{1}{d}) \widetilde{\eta}_{j}(\mathbf{v}_0) \neq 0, \hspace{0.2cm} \exists \mathbf{v}_0 \in \domm{\mathbf{V}}{},
        \\
        & \sum_{j=1}^d (p_j - \frac{1}{d}) = 0,
        \\
        & 0<p_j<1, \hspace{0.2cm} \forall j \in [1:d].
    \end{align*}
     Analogous to the proof of Lemma \ref{lemma: construct models subcase 1}, we use Lemmas \ref{lemma: theta indices subcase 3},  \ref{lemma: phi indices subcase 3}, and  \ref{lemma: eta indices subcase 3} instead of Lemmas \ref{lemma: gid equal indices}, \ref{lemma: equal indices summation subcase 1} and \ref{lemma: gid not equal indices} respectively and conclude the result.  

    \textbf{Second case:}\\
    Suppose that there is no $i \in [0:m]$ such that $\S \subset \mathbf{A}_i$. This case is handled exactly as the \textbf{Second case} in the proof of Lemma \ref{lemma: construct models subcase 1}.
\end{proof}




\subsection{Proof of Lemma \ref{lemma: eliminate var in cond}}

\renewcommand{\V}{\mathbf{V}}
\renewcommand{\U}{\mathbf{U}}
\begin{customlem}{\ref{lemma: eliminate var in cond}}
     Suppose that $\X$, $\Y$ and $\Z$ are disjoint subsets of $\mathbf{V}$ in graph $\G$ and variables $Z_1 \in \Z$, $Z_2 \in \Y \cup \Z$, such that there is a directed edge from $Z_1$ to $Z_2$ in $\G$. If the causal effect $P_{\x}(\y|\z)$ is not c-gID from $(\mathbb{A}, \G)$, then the causal effect $P_{\x}(\y|\z\setminus\{z_1\})$ is also not c-gID from $(\mathbb{A}, \G)$. 
\end{customlem}
\begin{proof}
By the basic probabilistic manipulations, we get
\begin{equation*}
\begin{split}
    & P_{\x}(\y|\z) = \frac{P_{\x}(\y, \z)}{P_{\x}(\z)},\\
    & P_{\x}(\y|\z\setminus\{z_1\}) = \frac{P_{\x}(\y, \z\setminus\{z_1\})}{P_{\x}(\z\setminus\{z_1\})}.
\end{split}
\end{equation*}
Using Markov factorization property in graph $\G$, we have
\begin{equation*}
\begin{split}
    & P_{\x}(\y, \z) = 
    \sum_{\V\setminus(\X\cup \Y \cup \Z)} \sum_{\U} \prod_{W \in \V\setminus \X}P(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u),
    \\
    & P_{\x}(\z) = 
    \sum_{\V\setminus(\X \cup \Z)} \sum_{\U} \prod_{W \in \V\setminus \X}P(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u).
\end{split}
\end{equation*}
And similarly, we have
\begin{equation}
\begin{split}
    \label{eq: P_x(y, z/z1)}
    & P_{\x}(\y, \z\setminus\{Z_1\}) = 
    \sum_{Z_1}\sum_{\V\setminus(\X\cup \Y \cup \Z)} \sum_{\U} \prod_{W \in \V\setminus \X}P(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u),
    \\
    & P_{\x}(\z\setminus\{Z_1\}) = 
    \sum_{Z_1}\sum_{\V\setminus(\X \cup \Z)} \sum_{\U} \prod_{W \in \V\setminus \X}P(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u).
\end{split}
\end{equation}
Since $P_{\x}(\y|\z)$ is not c-gID from $(\mathbb{A}, \G)$, there exist two models $\M_1$ and $\M_2$ such that
\begin{equation*}
    Q^{\M_1}[\A_i](\mathbf{v}) = Q^{\M_2}[\A_i](\mathbf{v}),\; \forall \mathbf{v}\in \dom{\V}{},\; \forall i \in [0: m],
\end{equation*}
\begin{equation*}
    P_{\x}^{\M_1}(\y|\z)\neq P_{\x}^{\M_2}(\y|\z),\; \exists \x \in \dom{\X}{}, \; \exists \y \in \dom{\Y}{}.
\end{equation*}
Using $\M_1$ and $\M_2$, we construct two models $\M_1'$ and $\M_2'$. To do so, we first take any surjective function $F\!:\: \dom{Z_1}{}\rightarrow \{0, 1\}$ and define a function $\Psi \!:\: \{0, 1\}\times \dom{Z_1}{} \rightarrow (0,1)$ that satisfies $\Psi(0, z_1)+\Psi(1, z_1)=1$ for any $z_1 \in \dom{Z_1}{}$.

For any node $S$ that either belongs to the set of unobserved variables  or belongs to $\V \setminus (\{Z_2\}\cup \Ch{Z_2}{\G})$, we define
\begin{equation*}
    P^{\M_i'}(s|\Pa{S}{\G}) := P^{\M_i}(s|\Pa{S}{\G}), \quad i \in \{1, 2\}.
\end{equation*}
The domain of $Z_2$ in $\M_i'$ is defined as $\dom{Z_2}{}^{\M}\times \{0, 1\}$, where $\dom{Z_2}{}^{\M}$ is the domain of $Z_2$ in $\M$ (either $\M_1$ or $\M_2$). 
For $z_2 \in \dom{Z_2}{}^\M$, $i\in \{1,2\}$, and $k\in \{0, 1\}$, we define
\begin{equation*}
    P^{\M_i'}((z_2, k) 
    \mid \Pa{Z_2}{\G}\setminus\{Z_1\}, z_1) :=
    P^{\M_i}(z_2 \mid \Pa{Z_2}{\G})\times \Psi(F(z_1)\oplus k, z_1).
\end{equation*}
Due to the property of the function $\Psi$, the above definitions are valid probabilities, i.e., for any realization $(\Pa{Z_2}{\G}\setminus\{Z_1\}, z_1)$, the following holds
\begin{equation*}
    \sum_{k\in \{0,1\}} \sum_{z_2\in \dom{Z_2}{}^{\M}} P^{\M_i'}((z_2, k) \mid \Pa{Z_2}{\G}\setminus\{Z_1\}, z_1) = 1.
\end{equation*}
For each $S \in \Ch{Z_2}{\G}$, we define:
\begin{equation*}
    P^{\M_i'}(s \mid \Pa{S}{\G}\setminus \{Z_2\}, (z_2, k)) :=
    P^{\M_i}(s \mid \Pa{S}{\G}\setminus \{Z_2\}, z_2), \quad i \in \{1, 2\}, k \in \{0, 1\}.
\end{equation*}

Next, we show that $Q^{\M_1'}[\A_i](\mathbf{v}) = Q^{\M_2'}[\A_i](\mathbf{v})$ for each $\mathbf{v}\in \dom{\V}{}$ and $i \in [0:m]$.
Suppose $\mathbf{v}$ is a realization of $\V$ in $\M'_1$ with realizations $z_1$ and $(z_2, k)$ for $Z_1$ and $Z_2$, respectively. 
Consider two cases: 
\begin{itemize}
    \item  $Z_2 \notin \A_i$: In this case, we have
    \begin{align*}
        Q^{\M_1'}[\A_i](\mathbf{v}) 
        &= \sum_{\U}\prod_{A\in \A_i} P^{\M_1'}(a \mid \Pa{A}{\G})\prod_{U\in \U}P^{\M_1'}(u) \\
        & = \sum_{\U} \prod_{A\in \A_i}P^{\M_1}(a \mid \Pa{A}{\G})\prod_{U\in \U} P^{\M_1}(u) 
        = Q^{\M_1}[\A_i](\mathbf{v}) 
        = Q^{\M_2}[\A_i](\mathbf{v}) \\
        & = \sum_{\U} \prod_{A\in \A_i} P^{\M_2}(a \mid \Pa{A}{\G}) \prod_{U\in \U} P^{\M_2}(u) \\
        &= \sum_{\U} \prod_{A\in \A_i} P^{\M_2'}(a \mid \Pa{A}{\G}) \prod_{U\in \U} P^{\M_2'}(u) \\ 
        &= Q^{\M_2'}[\A_i](\mathbf{v}).
    \end{align*}
    
    \item  $Z_2 \in \mathbf{A}_i$: In this case, we have
    \begin{align*}
        Q^{\M_1'}[\A_i](\mathbf{v}) 
        &= \sum_{\U} \prod_{A\in \A_i} P^{\M_1'} (a \mid \Pa{A}{\G})\prod_{U\in \U} P^{\M_1'}(u) \\
        & = \Psi\left(F(z_1)\oplus k, z_1\right) \sum_{\U} \prod_{A\in \A_i} P^{\M_1}(a \mid  \Pa{A}{\G}) \prod_{U\in \U}P^{\M_1}(u) \\
        &= \Psi(F(z_1)\oplus k, z_1) Q^{\M_1}[\A_i](\mathbf{v}) = \Psi(F(z_1)\oplus k, z_1) Q^{\M_2}[\A_i](\mathbf{v}) \\
        &= \Psi(F(z_1)\oplus k, z_1) \sum_{\U} \prod_{A\in \A_i} P^{\M_2}(a \mid \Pa{A}{\G}) \prod_{U\in \U} P^{\M_2}(u) \\
        &= \sum_{\U}\prod_{A\in \A_i} P^{\M_2'}(a \mid \Pa{A}{\G}) \prod_{U\in \U}P^{\M_2'}(u) \\
        &= Q^{\M_2'}[\A_i](\mathbf{v}).
    \end{align*}
\end{itemize}

Therefore, $Q^{\M_1'}[\A_i](\mathbf{v}) = Q^{\M_2'}[\A_i](\mathbf{v})$ for each $\mathbf{v}\in \dom{\V}{}$ and $i \in [0:m]$.

On the other hand, we know that there exists $\hat{\x} \in \dom{\X}{}^{\M}$, $\hat{\y} \in \dom{\Y}{}^{\M}$ and $\hat{\z} \in \dom{\Z}{}^{\M}$ such that $P^{\M_1}_{\hat{\x}}(\hat{\y}|\hat{\z})\neq  P^{\M_2}_{\hat{\x}}(\hat{\y}|\hat{\z})$. 


According to Equation~\eqref{eq: P_x(y, z/z1)}, we have
\begin{align*}
    & P_{\x}^{\M_i'}(\y, \z\setminus\{Z_1\}) = 
    \sum_{z_1 \in \dom{Z_1}{}}\sum_{\V\setminus(\X\cup \Y \cup \Z)} \sum_{\U} P^{\M_i'}((z_2, k)|\Pa{Z_2}{\G}) \prod_{W \in \V\setminus (\X\cup \{Z_2\})}P^{\M_i'}(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u)\\
    & = \sum_{z_1 \in \dom{Z_1}{}}\sum_{\V\setminus(\X\cup \Y \cup \Z)} \sum_{\U} \Psi(F(z_1)\oplus k, z_1)P^{\M_i}(z_2|\Pa{Z_2}{\G}) \prod_{W \in \V\setminus (\X\cup \{Z_2\})}P^{\M_i}(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u)\\
    & =  \sum_{z_1 \in \dom{Z_1}{}}\Psi(F(z_1)\oplus k, z_1)
    \sum_{\V\setminus(\X\cup \Y \cup \Z)} \sum_{\U} P^{\M_i}(z_2|\Pa{Z_2}{\G}) \prod_{W \in \V\setminus (\X\cup \{Z_2\})}P^{\M_i}(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u)\\
    & = \sum_{z_1 \in \dom{Z_1}{}}\Psi(F(z_1)\oplus k, z_1) P^{\M_i}_\x(\y, \z).
\end{align*}
Let us denote $\dom{Z_1}{} = \{\alpha_1, \alpha_2, \dots, \alpha_n\}$. For $z_1=\alpha_j$ and $j \in [1:n]$, we also denote
\begin{align*}
    & \psi_{j} := \Psi(F(\alpha_j)\oplus 0, \alpha_j),\\
    & \beta_j^{\M_i}:=P^{\M_i}_{\hat{\x}}(\hat{\y}, \hat{\z}[\Z\setminus\{Z_1\}], \alpha_j) .
\end{align*}
This leads to
\begin{align*}
    & P_{\x}^{\M_i'}(\y, \z\setminus\{Z_1\}) = \sum_{j=1}^n\psi_j\beta_j^{\M_i},
\end{align*}
for realizations $\y$ consistent with $\hat{\y}$, realization $\x$ consistent with $\hat{\x}$, $\z$ consistent with $\hat{\z}$, and $Z_2 = (z_2, k)$ consistent with $\hat{\y}\cup\hat{\z}$ and $k=0$. Recall that $\psi_j$ is a real number from the interval $(0, 1)$. 
Note that $\psi_j$ is independent from any other $\psi_l$ for $l\neq j$.


Next, we consider two cases:
\begin{itemize}
    \item Assume that $Z_2\in \Z$. In this case, we have
    \begin{align*}
        & P_{\x}^{\M_i'}(\z\setminus\{Z_1\}) = 
        \sum_{z_1 \in \dom{Z_1}{}}\sum_{\V\setminus(\X \cup \Z)} \sum_{\U} P^{\M_i'}((z_2, k)|\Pa{Z_2}{\G}) \prod_{W \in \V\setminus (\X\cup \{Z_2\})}P^{\M_i'}(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u)\\
        & = \sum_{z_1 \in \dom{Z_1}{}}\sum_{\V\setminus(\X \cup \Z)} \sum_{\U} \Psi(F(z_1)\oplus k, z_1)P^{\M_i}(z_2|\Pa{Z_2}{\G}) \prod_{W \in \V\setminus (\X\cup \{Z_2\})}P^{\M_i}(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u)\\
        & =  \sum_{z_1 \in \dom{Z_1}{}}\Psi(F(z_1)\oplus k, z_1)
        \sum_{\V\setminus(\X\cup \Z)} \sum_{\U} P^{\M_i}(z_2|\Pa{Z_2}{\G}) \prod_{W \in \V\setminus (\X\cup \{Z_2\})}P^{\M_i}(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u)\\
        & = \sum_{z_1 \in \dom{Z_1}{}}\Psi(F(z_1)\oplus k, z_1) P^{\M_i}_{\x}(\z).
    \end{align*}
    For $j\in [1:n]$ and $z_1 = \alpha_j$, we denote
    \begin{align*}
         & \gamma_j^{\M_i}:=P^{\M_i}_{\hat{\x}}(\hat{\z}[\Z\setminus\{Z_1\}], \alpha_j),
    \end{align*}
    which leads to
    \begin{align*}
        & P_{\x}^{\M_i'}(\z\setminus\{Z_1\}) = \sum_{j=1}^n\psi_j\gamma_j^{\M_i},
    \end{align*}
    for realizations $\y$ consistent with $\hat{\y}$, realization $\x$ consistent with $\hat{\x}$, $\z$ consistent with $\hat{\z}$, and $Z_2 = (z_2, k)$ consistent with $\hat{\y}\cup\hat{\z}$ and $k=0$.
    Thus, for such realizations, we have
    $$
    P_{\x}^{\M_i'}(\hat{\y}|\hat{\z}\setminus\{Z_1\}) = \frac{\sum_{j=1}^n\psi_j\beta_j^{\M_i}}{\sum_{j=1}^n\psi_j\gamma_j^{\M_i}}.
    $$
    By the assumption of the lemma, there exists $j\in [1:n]$ such that
    \begin{equation*}
        \frac{\beta_j^{\M_1}}{\gamma_{j}^{\M_1}} \neq \frac{\beta_j^{\M_2}}{\gamma_{j}^{\M_2}},
    \end{equation*}
    or equivalently,
    \begin{equation*}
        \beta_j^{\M_1} \gamma_{j}^{\M_2} \neq \beta_j^{\M_2} \gamma_{j}^{\M_1}.
    \end{equation*}
    Without loss of generality, we assume that the aforementioned inequality holds for $j=1$.
    Next, we prove that there exist parameters $\{\psi_{j}\}_{j=1}^{n}$ such that
    \begin{equation*}
        \frac{\sum_{j=1}^n\psi_j\beta_j^{\M_1}}{\sum_{j=1}^n\psi_j\gamma_j^{\M_1}} \neq \frac{\sum_{j=1}^n\psi_j\beta_j^{\M_2}}{\sum_{j=1}^n\psi_j\gamma_j^{\M_2}},
    \end{equation*}
    or equivalently,
    % \begin{equation*}
    %     \sum_{j=1}^n\psi_j\beta_j^{\M_1} \sum_{j=1}^n\psi_j\gamma_j^{\M_2} \neq \sum_{j=1}^n\psi_j\beta_j^{\M_2} \sum_{j=1}^n\psi_j\gamma_j^{\M_1}
    % \end{equation*}
    % or
    \begin{equation*}
        \sum_{j=1}^n\psi_j\beta_j^{\M_1} \sum_{j=1}^n\psi_j\gamma_j^{\M_2} - \sum_{j=1}^n\psi_j\beta_j^{\M_2} \sum_{j=1}^n\psi_j\gamma_j^{\M_1} \neq 0.
    \end{equation*}
    Note that the left-hand side is a quadratic polynomial in the parameter $\psi_1$, whose quadratic term is
    \begin{equation*}
        (\beta_1^{\M_1} \gamma_{1}^{\M_2} - \beta_1^{\M_2} \gamma_{1}^{\M_1})\psi_1^2.
    \end{equation*}
    Since $\beta_1^{\M_1} \gamma_{1}^{\M_2} - \beta_1^{\M_2} \gamma_{1}^{\M_1}\neq0$, we can find $\{\psi_{j}\}_{j=1}^{n}$ such that
    \begin{equation*}
        \sum_{j=1}^n\psi_j\beta_j^{\M_1} \sum_{j=1}^n\psi_j\gamma_j^{\M_2} - \sum_{j=1}^n\psi_j\beta_j^{\M_2} \sum_{j=1}^n\psi_j\gamma_j^{\M_1} \neq 0.
    \end{equation*}
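    This is possible because the left-hand side is a quadratic polynomial in $\psi_1$ with a nonzero leading coefficient, so it has at most two roots, while $\psi_1$ can be chosen freely in $(0,1)$. This concludes the proof of the lemma for this case.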
    
    
    \item Assume that $Z_2\in \Y$. Suppose that $P_{\x}^{\M_1}(\y, z_1|\z\setminus\{Z_1\}) = P_{\x}^{\M_2}(\y, z_1|\z\setminus\{Z_1\})$ for all $\x\in \dom{\X}{}$, $\y\in \dom{\Y}{}$ and $\z\in \dom{\Z}{}$. Then,
    \begin{equation*}
        P^{\M_1}_{\x}(\y|\z) = \frac{P^{\M_1}_{\x}(\y, z_1|\z\setminus\{Z_1\})}{P^{\M_1}_{\x}(z_1|\z\setminus\{Z_1\})} = \frac{P^{\M_2}_{\x}(\y, z_1|\z\setminus\{Z_1\})}{P^{\M_2}_{\x}(z_1|\z\setminus\{Z_1\})} = P^{\M_2}_{\x}(\y|\z).
    \end{equation*}
    This is impossible as $P^{\M_1}_{\hat{\x}}(\hat{\y}|\hat{\z})\neq P^{\M_2}_{\hat{\x}}(\hat{\y}|\hat{\z})$. 
    Thus, there exist $\hat{\x}' \in \dom{\X}{}$, $\hat{\y}' \in \dom{\Y}{}$, and $\hat{\z}' \in \dom{\Z}{}$, such that
    \begin{equation*}
        P_{\hat{\x}'}^{\M_1}(\hat{\y}', \hat{z}_1'|\hat{\z}'\setminus\{Z_1\}) \neq P_{\hat{\x}'}^{\M_2}(\hat{\y}', \hat{z}'_1|\hat{\z}'\setminus\{Z_1\}).
    \end{equation*}
    On the other hand, we have 
    \begin{align*}
        & P_{\x}^{\M_i'}(\y, \z) = 
       \sum_{\V\setminus(\X\cup \Y \cup \Z)} \sum_{\U} P^{\M_i'}((z_2, k)|\Pa{Z_2}{\G}) \prod_{W \in \V\setminus (\X\cup \{Z_2\})}P^{\M_i'}(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u)\\
        & = \sum_{\V\setminus(\X\cup \Y \cup \Z)} \sum_{\U} \Psi(F(z_1)\oplus k, z_1)P^{\M_i}(z_2|\Pa{Z_2}{\G}) \prod_{W \in \V\setminus (\X\cup \{Z_2\})}P^{\M_i}(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u)\\
        & = \Psi(F(z_1)\oplus k, z_1)
        \sum_{\V\setminus(\X\cup \Y \cup \Z)} \sum_{\U} P^{\M_i}(z_2|\Pa{Z_2}{\G}) \prod_{W \in \V\setminus (\X\cup \{Z_2\})}P^{\M_i}(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u)\\
        & =\Psi(F(z_1)\oplus k, z_1) P^{\M_i}_\x(\y, \z).
    \end{align*}
    For $j \in [1:n]$, we define
    \begin{equation*}
        {\beta_j'}^{\M_i}:=P^{\M_i}_{\hat{\x}'}(\hat{\y}', \hat{\z}'
        [\Z\setminus\{Z_1\}], \alpha_j).
    \end{equation*}
    Suppose $m \in [1:n]$, where $z_1=\alpha_m$ and it is consistent with $\hat{\z}'$. We assign $k=0$ and denote
    \begin{equation*}
        {\beta_m'}^{\M_i}:=P_{\hat{\x}'}^{\M_i}(\hat{\y}',\hat{\z}').
    \end{equation*}
    This results in
    \begin{equation*}
        P_{\mathbf{\hat{x}}'}^{\M_i'}(\hat{\y}', \hat{\z}') = {\beta_m'}^{\M_i}\psi_m.
    \end{equation*}
    We also have
    \begin{align*}
        & P_{\x}^{\M_i'}(\z\setminus\{Z_1\}) = 
        \sum_{z_1 \in \dom{Z_1}{}}\sum_{\V\setminus(\X \cup \Z)} \sum_{\U} P^{\M_i'}((z_2, k)|\Pa{Z_2}{\G}) \prod_{W \in \V\setminus (\X\cup \{Z_2\})}P^{\M_i'}(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u)\\
        & = \sum_{z_1 \in \dom{Z_1}{}}\sum_{\V\setminus(\X \cup \Z)} \sum_{\U} \Psi(F(z_1)\oplus k, z_1)P^{\M_i}(z_2|\Pa{Z_2}{\G}) \prod_{W \in \V\setminus (\X\cup \{Z_2\})}P^{\M_i}(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u)\\
        & =  \sum_{z_1 \in \dom{Z_1}{}}
        \sum_{\V\setminus(\X\cup \Z)} \sum_{\U} \sum_{k \in \{0, 1\}}\Psi(F(z_1)\oplus k, z_1) P^{\M_i}(z_2|\Pa{Z_2}{\G}) \prod_{W \in \V\setminus (\X\cup \{Z_2\})}P^{\M_i}(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u)\\
        & = \sum_{z_1 \in \dom{Z_1}{}} P^{\M_i}(\z).
    \end{align*}
    For $j\in [1:n]$ and $z_1 = \alpha_j$, we denote
    \begin{align*}
         & {\gamma'_j}^{\M_i}:=P^{\M_i}_{\hat{\x}}(\hat{\z}'[\Z\setminus\{Z_1\}]),
    \end{align*}
    and from the above equation, we get
    \begin{align*}
        & P_{\x}^{\M_i}(\z\setminus\{Z_1\}) = \sum_{j=1}^n\gamma_j^{\M_i},
    \end{align*}
    for realizations $\y$ consistent with $\hat{\y}'$, realization $\x$ consistent with $\hat{\x}'$, $\z$ consistent with $\hat{\z}'$, and $Z_2 = (z_2, k)$ consistent with $\hat{\y}'\cup\hat{\z}'$ and $k=0$. 
    We have 
    $$
    P_{\x}^{\M_i}(\hat{\y}|\hat{\z}\setminus\{Z_1\}) = \frac{\sum_{j=1}^n\psi_j{\beta_j'}^{\M_i}}{\sum_{j=1}^n\gamma_j^{\M_i}}.
    $$

    By the assumption of the lemma, we have
    \begin{equation*}
        \frac{{\beta_m'}^{\M_1}}{\sum_{j=1}^n\gamma_j^{\M_1}} \neq \frac{{\beta_m'}^{\M_2}}{\sum_{j=1}^n\gamma_j^{\M_2}}.
    \end{equation*}
    Next, we prove that there exists a set of parameters $\{\psi_{j}\}_{j=1}^{n}$, such that
    \begin{equation*}
        \frac{\sum_{j=1}^n\psi_j{\beta_j'}^{\M_1}}{\sum_{j=1}^n\gamma_j^{\M_1}} \neq \frac{\sum_{j=1}^n\psi_j{\beta_j'}^{\M_2}}{\sum_{j=1}^n\gamma_j^{\M_2}}
    \end{equation*}
    or equivalently,
    \begin{equation*}
        \frac{\sum_{j=1}^n\psi_j{\beta_j'}^{\M_1}}{\sum_{j=1}^n\gamma_j^{\M_1}} - \frac{\sum_{j=1}^n\psi_j{\beta_j'}^{\M_2}}{\sum_{j=1}^n\gamma_j^{\M_2}} \neq 0.
    \end{equation*}
    Note that the left-hand side of the above equation is linear with respect to the parameter $\psi_m$ with the following coefficient,
    \begin{equation*}
        \frac{{\beta_m'}^{\M_1}}{\sum_{j=1}^n\gamma_j^{\M_1}} - \frac{{\beta_m'}^{\M_2}}{\sum_{j=1}^n\gamma_j^{\M_2}}\neq 0.
    \end{equation*}
    This ensures that we can find a realization of $\{\psi_{j}\}_{j=1}^{n}$, such that
    \begin{equation*}
        \frac{\sum_{j=1}^n\psi_j{\beta_j'}^{\M_1}}{\sum_{j=1}^n\gamma_j^{\M_1}} - \frac{\sum_{j=1}^n\psi_j{\beta_j'}^{\M_2}}{\sum_{j=1}^n\gamma_j^{\M_2}} \neq 0.
    \end{equation*}
    This concludes the proof of the lemma for the second case.
\end{itemize}

\end{proof}

%====================================================================================%

\subsection{Proof of Lemma \ref{lemma: for_the_main}}



\begin{customlem}{\ref{lemma: for_the_main}}
Suppose that $\X$, $\Y$ and $\Z$ are disjoint subsets of $\mathbf{V}$ in graph $\G$ and variables $Z_1 \in \Y$, $Z_2 \in \Y \cup \Z$, such that there is a directed edge from $Z_1$ to $Z_2$ in $\G$. If the causal effect $P_{\x}(\y|\z)$ is not c-gID from $(\mathbb{A}, \G)$, then the causal effect $P_{\x}(\y\setminus\{z_1\}|\z)$ is also not c-gID from $(\mathbb{A}, \G)$. 
\end{customlem}
\begin{proof}
By the basic probabilistic manipulations, we get
\begin{equation*}
\begin{split}
    & P_{\x}(\y|\z) = \frac{P_{\x}(\y, \z)}{P_{\x}(\z)},\\
    & P_{\x}(\y\setminus\{z_1\}|\z) = \frac{P_{\x}(\y\setminus\{z_1\}, \z)}{P_{\x}(\z)}.
\end{split}
\end{equation*}
Using the Markov factorization property in graph $\G$, we have
\begin{equation*}
\begin{split}
    & P_{\x}(\y, \z) = 
    \sum_{\V\setminus(\X\cup \Y \cup \Z)} \sum_{\U} \prod_{W \in \V\setminus \X}P(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u),
    \\
    & P_{\x}(\z) = 
    \sum_{\V\setminus(\X \cup \Z)} \sum_{\U} \prod_{W \in \V\setminus \X}P(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u).
\end{split}
\end{equation*}
And similarly, we have
\begin{equation}
\begin{split}
    \label{eq: P_x(y/z1, z)}
    & P_{\x}(\y\setminus\{Z_1\}, \z) = 
    \sum_{Z_1}\sum_{\V\setminus(\X\cup \Y \cup \Z)} \sum_{\U} \prod_{W \in \V\setminus \X}P(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u),
    \\
    & P_{\x}(\z) = 
    \sum_{Z_1}\sum_{\V\setminus(\X \cup \Z)} \sum_{\U} \prod_{W \in \V\setminus \X}P(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u).
\end{split}
\end{equation}
Since $P_{\x}(\y|\z)$ is not c-gID from $(\mathbb{A}, \G)$, there exist $\M_1$ and $\M_2$ such that
\begin{equation*}
    Q^{\M_1}[\A_i](\mathbf{v}) = Q^{\M_2}[\A_i](\mathbf{v}),\; \forall \mathbf{v}\in \dom{\V}{},\; \forall i \in [0: m],
\end{equation*}
\begin{equation*}
    P_{\x}^{\M_1}(\y|\z)\neq P_{\x}^{\M_2}(\y|\z),\; \exists \x \in \dom{\X}{}, \; \exists \y \in \dom{\Y}{}.
\end{equation*}
Using $\M_1$ and $\M_2$, we construct two models $\M_1'$ and $\M_2'$. 
Define a surjective function $F\!:\: \dom{Z_1}{}\rightarrow \{0, 1\}$ and a function $\Psi \!:\: \{0, 1\}\times \dom{Z_1}{} \rightarrow (0,1)$ such that $\Psi(0, z_1)+\Psi(1, z_1)=1$ for each $z_1 \in \dom{Z_1}{}$.

For any node $S$ which is either unobserved or in $\V \setminus (\{Z_2\}\cup \Ch{Z_2}{\G})$, we define
\begin{equation*}
    P^{\M_i'}(s|\Pa{S}{\G}) = P^{\M_i}(s|\Pa{S}{\G}),
\end{equation*}
where $i \in \{1, 2\}$.
The domain of $Z_2$ in $\M_i'$ is defined as $\dom{Z_2}{}^{\M}\times \{0, 1\}$, where $\dom{Z_2}{}^{\M}$ is the domain of $Z_2$ in $\M$ (either $\M_1$ or $\M_2$). 
For $z_2 \in \dom{Z_2}{}^\M$, $i\in \{1,2\}$, and $k\in \{0, 1\}$, we define
\begin{equation*}
    P^{\M_i'}((z_2, k) 
    \mid \Pa{Z_2}{\G}\setminus\{Z_1\}, z_1) =
    P^{\M_i}(z_2 \mid \Pa{Z_2}{\G}) \Psi(F(z_1)\oplus k, z_1).
\end{equation*}
Moreover, for a fixed realization $(\Pa{Z_2}{\G}, z_1)$, we have
\begin{equation*}
    \sum_{k\in \{0,1\}} \sum_{z_2\in \dom{Z_2}{}^{\M}} P^{\M_i'}((z_2, k)|pa(Z_2), z_1) = 1.
\end{equation*}

For each $S \in \Ch{Z_2}{\G}$, we define:
\begin{equation*}
    P^{\M_i'}(s \mid \Pa{S}{\G}\setminus \{Z_2\}, (z_2, k)) =
    P^{\M_i}(s \mid \Pa{S}{\G}\setminus \{Z_2\}, z_2).
\end{equation*}

Next, we show that $Q^{\M_1'}[\A_i](\mathbf{v}) = Q^{\M_2'}[\A_i](\mathbf{v})$ for each $\mathbf{v}\in \dom{\V}{}$ and $i \in [0:m]$.
Suppose $\mathbf{v}$ is a realization of $\V$ in $\M'_1$ with realizations $z_1$ and $(z_2, k)$ for $Z_1$ and $Z_2$, respectively. 
Consider two cases: 
\begin{itemize}
    \item  $Z_2 \notin \A_i$: In this case, we have
    \begin{align*}
        Q^{\M_1'}[\A_i](\mathbf{v}) 
        &= \sum_{\U}\prod_{A\in \A_i} P^{\M_1'}(a \mid \Pa{A}{\G})\prod_{U\in \U}P^{\M_1'}(u) \\
        & = \sum_{\U} \prod_{A\in \A_i}P^{\M_1}(a \mid \Pa{A}{\G})\prod_{U\in \U} P^{\M_1}(u) 
        = Q^{\M_1}[\A_i](\mathbf{v}) 
        = Q^{\M_2}[\A_i](\mathbf{v}) \\
        & = \sum_{\U} \prod_{A\in \A_i} P^{\M_2}(a \mid \Pa{A}{\G}) \prod_{U\in \U} P^{\M_2}(u) \\
        &= \sum_{\U} \prod_{A\in \A_i} P^{\M_2'}(a \mid \Pa{A}{\G}) \prod_{U\in \U} P^{\M_2'}(u) \\ 
        &= Q^{\M_2'}[\A_i](\mathbf{v}).
    \end{align*}
    
    \item  $Z_2 \in \mathbf{A}_i$: In this case, we have
    \begin{align*}
        Q^{\M_1'}[\A_i](\mathbf{v}) 
        &= \sum_{\U} \prod_{A\in \A_i} P^{\M_1'} (a \mid \Pa{A}{\G})\prod_{U\in \U} P^{\M_1'}(u) \\
        & = \Psi\left(F(z_1)\oplus k, z_1\right) \sum_{\U} \prod_{A\in \A_i} P^{\M_1}(a \mid  \Pa{A}{\G}) \prod_{U\in \U}P^{\M_1}(u) \\
        &= \Psi(F(z_1)\oplus k, z_1) Q^{\M_1}[\A_i](\mathbf{v}) = \Psi(F(z_1)\oplus k, z_1) Q^{\M_2}[\A_i](\mathbf{v}) \\
        &= \Psi(F(z_1)\oplus k, z_1) \sum_{\U} \prod_{A\in \A_i} P^{\M_2}(a \mid \Pa{A}{\G}) \prod_{U\in \U} P^{\M_2}(u) \\
        &= \sum_{\U}\prod_{A\in \A_i} P^{\M_2'}(a \mid \Pa{A}{\G}) \prod_{U\in \U}P^{\M_2'}(u) \\
        &= Q^{\M_2'}[\A_i](\mathbf{v}).
    \end{align*}
\end{itemize}

Therefore, $Q^{\M_1'}[\A_i](\mathbf{v}) = Q^{\M_2'}[\A_i](\mathbf{v})$ for each $\mathbf{v}\in \dom{\V}{}$ and $i \in [0:m]$.

On the other hand, we know that there exists $\hat{\x} \in \dom{\X}{}^{\M}$, $\hat{\y} \in \dom{\Y}{}^{\M}$ and $\hat{\z} \in \dom{\Z}{}^{\M}$ such that $P^{\M_1}_{\hat{\x}}(\hat{\y}|\hat{\z})\neq  P^{\M_2}_{\hat{\x}}(\hat{\y}|\hat{\z})$. 

According to Equation~\eqref{eq: P_x(y/z1, z)}, we have
\begin{align*}
    & P_{\x}^{\M_i'}(\y\setminus\{Z_1\}, \z) = 
    \sum_{z_1 \in \dom{Z_1}{}}\sum_{\V\setminus(\X\cup \Y \cup \Z)} \sum_{\U} P^{\M_i'}((z_2, k)|\Pa{Z_2}{\G}) \prod_{W \in \V\setminus (\X\cup \{Z_2\})}P^{\M_i'}(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u)\\
    & = \sum_{z_1 \in \dom{Z_1}{}}\sum_{\V\setminus(\X\cup \Y \cup \Z)} \sum_{\U} \Psi(F(z_1)\oplus k, z_1)P^{\M_i}(z_2|\Pa{Z_2}{\G}) \prod_{W \in \V\setminus (\X\cup \{Z_2\})}P^{\M_i}(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u)\\
    & =  \sum_{z_1 \in \dom{Z_1}{}}\Psi(F(z_1)\oplus k, z_1)
    \sum_{\V\setminus(\X\cup \Y \cup \Z)} \sum_{\U} P^{\M_i}(z_2|\Pa{Z_2}{\G}) \prod_{W \in \V\setminus (\X\cup \{Z_2\})}P^{\M_i}(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u)\\
    & = \sum_{z_1 \in \dom{Z_1}{}}\Psi(F(z_1)\oplus k, z_1) P^{\M_i}_\x(\y, \z).
\end{align*}
Let us denote $\dom{Z_1}{} = \{\alpha_1, \alpha_2, \dots, \alpha_n\}$. For $z_1=\alpha_j$ and $j \in [1:n]$, we also denote
\begin{align*}
    & \psi_{j} = \Psi(F(\alpha_j)\oplus 0, \alpha_j),\\
    & P^{\M_i}_{\hat{\x}}(\hat{\y}[\Y\setminus\{Z_1\}], \hat{\z}, \alpha_j) = \beta_j^{\M_i}.
\end{align*}
For $Z_2=(\hat{z}[Z_2], 0)$ we have:
\begin{align*}
    & P_{\hat{\x}}^{\M_i'}(\hat{\y}\setminus\{Z_1\}, \hat{\z}) = \sum_{j=1}^n\psi_j\beta_j^{\M_i}.
\end{align*}
Recall that $\psi_j$ is a real number from the interval $(0, 1)$. 
Note that $\psi_j$ is independent from any other $\psi_l$ for $l\neq j$.


Next, we consider two cases:
\begin{itemize}
    \item Assume that $Z_2\in \Z$. In this case, we have
    \begin{align*}
        & P_{\x}^{\M_i'}(\z) = 
        \sum_{z_1 \in \dom{Z_1}{}}\sum_{\V\setminus(\X \cup \Z)} \sum_{\U} P^{\M_i'}((z_2, k)|\Pa{Z_2}{\G}) \prod_{W \in \V\setminus (\X\cup \{Z_2\})}P^{\M_i'}(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u)\\
        & = \sum_{z_1 \in \dom{Z_1}{}}\sum_{\V\setminus(\X \cup \Z)} \sum_{\U} \Psi(F(z_1)\oplus k, z_1)P^{\M_i}(z_2|\Pa{Z_2}{\G}) \prod_{W \in \V\setminus (\X\cup \{Z_2\})}P^{\M_i}(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u)\\
        & =  \sum_{z_1 \in \dom{Z_1}{}}\Psi(F(z_1)\oplus k, z_1)
        \sum_{\V\setminus(\X\cup \Z)} \sum_{\U} P^{\M_i}(z_2|\Pa{Z_2}{\G}) \prod_{W \in \V\setminus (\X\cup \{Z_2\})}P^{\M_i}(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u)\\
        & = \sum_{z_1 \in \dom{Z_1}{}}\Psi(F(z_1)\oplus k, z_1) P^{\M_i}_{\x}(\z).
    \end{align*}
    We denote
    \begin{align*}
         & P^{\M_i}_{\hat{\x}}(\hat{\z}) = \gamma^{\M_i},
    \end{align*}
    which leads to
    \begin{align*}
        & P_{\x}^{\M_i}(\z) = \sum_{j=1}^n\psi_j\gamma^{\M_i},
    \end{align*}
    for $Z_2=(\hat{\z}[Z_2], 0)$.
    Thus, 
    $$
    P_{\x}^{\M_i}(\hat{\y}\setminus\{Z_1\}|\hat{\z}) = \frac{\sum_{j=1}^n\psi_j\beta_j^{\M_i}}{\sum_{j=1}^n\psi_j\gamma^{\M_i}}.
    $$
    By the assumption of the lemma, there exists $j\in [1:n]$ such that
    \begin{equation*}
        \frac{\beta_j^{\M_1}}{\gamma^{\M_1}} \neq \frac{\beta_j^{\M_2}}{\gamma^{\M_2}},
    \end{equation*}
    or equivalently,
    \begin{equation*}
        \beta_j^{\M_1} \gamma^{\M_2} \neq \beta_j^{\M_2} \gamma^{\M_1}.
    \end{equation*}
    Without loss of generality, we assume that the aforementioned inequality holds for $j=1$.
    Next, we prove that there exist parameters $\{\psi_{j}\}_{j=1}^{n}$ such that
    \begin{equation*}
        \frac{\sum_{j=1}^n\psi_j\beta_j^{\M_1}}{\sum_{j=1}^n\psi_j\gamma^{\M_1}} \neq \frac{\sum_{j=1}^n\psi_j\beta_j^{\M_2}}{\sum_{j=1}^n\psi_j\gamma^{\M_2}},
    \end{equation*}
    or equivalently,
    % \begin{equation*}
    %     \sum_{j=1}^n\psi_j\beta_j^{\M_1} \sum_{j=1}^n\psi_j\gamma_j^{\M_2} \neq \sum_{j=1}^n\psi_j\beta_j^{\M_2} \sum_{j=1}^n\psi_j\gamma_j^{\M_1}
    % \end{equation*}
    % or
    \begin{equation*}
        \sum_{j=1}^n\psi_j\beta_j^{\M_1} \sum_{j=1}^n\psi_j\gamma^{\M_2} - \sum_{j=1}^n\psi_j\beta_j^{\M_2} \sum_{j=1}^n\psi_j\gamma^{\M_1} \neq 0.
    \end{equation*}
    Note that the left-hand side is a quadratic polynomial in the parameter $\psi_1$ that contains the following term:
    \begin{equation*}
        (\beta_1^{\M_1} \gamma^{\M_2} - \beta_1^{\M_2} \gamma^{\M_1})\psi_1^2.
    \end{equation*}
    Since $\beta_1^{\M_1} \gamma^{\M_2} - \beta_1^{\M_2} \gamma^{\M_1}\neq0$, we can find a realization of $\{\psi_{j}\}_{j=1}^{n}$ such that
    \begin{equation*}
        \sum_{j=1}^n\psi_j\beta_j^{\M_1} \sum_{j=1}^n\psi_j\gamma^{\M_2} - \sum_{j=1}^n\psi_j\beta_j^{\M_2} \sum_{j=1}^n\psi_j\gamma^{\M_1} \neq 0.
    \end{equation*}
    This concludes the proof of the lemma for this case.
    
    
    \item Assume that $Z_2\in \Y$. In this case we have:
    \begin{align*}
        & P_{\x}^{\M_i'}(\z) = 
       \sum_{\V\setminus(\X \cup \Z)} \sum_{\U} P^{\M_i'}((z_2, k)|\Pa{Z_2}{\G}) \prod_{W \in \V\setminus (\X\cup \{Z_2\})}P^{\M_i'}(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u)\\
        & = \sum_{\V\setminus(\X \cup \Z)} \sum_{\U} \Psi(F(z_1)\oplus k, z_1)P^{\M_i}(z_2|\Pa{Z_2}{\G}) \prod_{W \in \V\setminus (\X\cup \{Z_2\})}P^{\M_i}(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u)\\
        & =  
        \sum_{\V\setminus(\X\cup \Z)} \sum_{\U} \sum_{k \in \{0, 1\}}\Psi(F(z_1)\oplus k, z_1) P^{\M_i}(z_2|\Pa{Z_2}{\G}) \prod_{W \in \V\setminus (\X\cup \{Z_2\})}P^{\M_i}(w \mid \Pa{W}{\G}) \prod_{U \in \U} P(u)\\
        & = P^{\M_i}(\z).
    \end{align*}
    We denote
    \begin{align*}
         & P^{\M_i}_{\hat{\x}}(\hat{\z}) = {\gamma}^{\M_i}.
    \end{align*}
    Thus, 
    $$
    P_{\x}^{\M_i}(\hat{\y}\setminus\{Z_1\}|\hat{\z}) = \frac{\sum_{j=1}^n\psi_j{\beta_j}^{\M_i}}{\gamma^{\M_i}}.
    $$

    By the assumption of the lemma, there exists $m \in [1:n]$ such that
    \begin{equation*}
        \frac{{\beta_m}^{\M_1}}{\gamma^{\M_1}} \neq \frac{{\beta_m}^{\M_2}}{\gamma^{\M_2}}.
    \end{equation*}
    Next, we prove that there exists a set of parameters $\{\psi_{j}\}_{j=1}^{n}$, such that
    \begin{equation*}
        \frac{\sum_{j=1}^n\psi_j{\beta_j}^{\M_1}}{\gamma^{\M_1}} \neq \frac{\sum_{j=1}^n\psi_j{\beta_j}^{\M_2}}{\gamma^{\M_2}}
    \end{equation*}
    or equivalently,
    \begin{equation*}
        \frac{\sum_{j=1}^n\psi_j{\beta_j}^{\M_1}}{\gamma^{\M_1}} - \frac{\sum_{j=1}^n\psi_j{\beta_j}^{\M_2}}{\gamma^{\M_2}} \neq 0.
    \end{equation*}
    Note that the left-hand side of the above equation is linear with respect to the parameter $\psi_m$ with the following coefficient,
    \begin{equation*}
        \frac{{\beta_m}^{\M_1}}{\gamma^{\M_1}} - \frac{{\beta_m}^{\M_2}}{\gamma^{\M_2}}\neq 0.
    \end{equation*}
    This ensures that we can find a realization of $\{\psi_{j}\}_{j=1}^{n}$, such that
    \begin{equation*}
        \frac{\sum_{j=1}^n\psi_j{\beta_j}^{\M_1}}{\gamma^{\M_1}} - \frac{\sum_{j=1}^n\psi_j{\beta_j}^{\M_2}}{\gamma^{\M_2}} \neq 0.
    \end{equation*}
    This concludes the proof of the lemma for the second case.
\end{itemize}
    
\end{proof}

\section{On the positivity assumption in the literature} \label{sec: app B}
 As it was pointed out in \cite{kivva2022revisiting},  positivity assumption is crucial for proving the completeness part. More precisely, the completeness of an algorithm means that if the algorithm does not compute a given conditional causal effect, then it cannot be computed uniquely by any other algorithms. To prove the completeness, two models $\mathcal{M}_1$ and $\M_2$ are constructed such that they are both positive and induce the same set of distributions as the ones given in the problem statement, i.e., $Q[\A_0]$, $Q[\A_1]$, \dots, $Q[\A_m]$
, but they result in different values for the conditional causal effect of interest, i.e., $P^{\M_1}_{\mathbf{x}}(\mathbf{y}\mid\mathbf{z})\neq P^{\M_2}_{\mathbf{x}}(\mathbf{y}\mid\mathbf{z})$. Hence, $P_{\mathbf{x}}(\mathbf{y}\mid \mathbf{z})$
 cannot be uniquely computed.
 
 In \cite{lee2019general,lee2020general} and \cite{correa2021nested}, for the completeness part, the authors constructed such models $\M_1$ and $\M_2$, but the models violate the positivity assumption. That is, it is possible to have examples in which a given causal effect is identifiable under the positivity assumption while it is possible to construct two non-positive models that show the causal effect is not identifiable \citep{kivva2022revisiting}. Violation of the positivity assumption renders some distributions ill-defined (conditioning on zero-probability events). That is why computing a causal effect in the classical setting with do-calculus implicitly contains steps in which we can cancel out a distribution (e.g., $Q$) that appears on both sides of an equality, i.e., $P_1\cdot Q = P_2\cdot Q \Rightarrow P_1=P_2$. Clearly, this is only possible when $Q>0$. If positivity is violated, then such steps in computing a causal effect cannot be used.

\subsection{General Transportability} 
The work of \cite{lee2020general} proves the completeness part of the c-gID problem by constructing two models that agree on the observable distributions and disagree on the target causal effect. Those models do not satisfy the positivity assumption by construction. A similar flaw existed in the proof of \cite{lee2019general}, which was specified in detail later by \cite{kivva2022revisiting}.
Moreover, \cite{lee2020general} does not discuss whether their models can be transformed into positive ones.

For further details, we refer to the technical report of \cite{lee2020general}, which contains the proofs.

\textit{Parametrizations for an s-Thicket:} According to the appendix of \cite{lee2020general}, the models in Lemma 3, which is one of the main lemmas for proving the completeness result, are based on the ones in \cite{lee2019general}. These models violate the positivity assumption according to \cite{kivva2022revisiting} and should be substituted with fixed ones.

\textit{Parametrization for an Extended s-Thicket:} According to Eq. (5) and (6) in \cite{lee2020general}, it is easy to observe that several observed variables are deterministic functions of other observed variables. This implies that there exists a realization of observed variables such that the conditional probability of one observed variable given the rest is zero. This is against the positivity assumption.

\textit{Parametrization for an Extended s-Thicket with a Path-Witnessing Subgraph:} In Eq. (7) of \cite{lee2020general} if $v_{\mathcal{P}}$ is an observed variable with only observed parents on a backdoor path $\mathcal{P}$, again,  $v_{\mathcal{P}}$ will be a deterministic function of only observed variables. This again does not satisfy the positivity. In general, such $v_{\mathcal{P}}$ would always exist. 

Please note that the errata for \cite{lee2019general} can potentially fix the issue for s-Thicket, but not for extended s-Thicket or Extended s-Thicket with a Path-Witnessing Subgraph (the last two cases).

\begin{figure}[t]
\centering
    \begin{tikzpicture}[
        roundnode/.style={circle, draw=black!60, fill=white, thick, inner sep=1pt, minimum size=0.65cm},
        dashednode/.style = {circle, draw=black!60, dashed, fill=white, thick, inner sep=1pt, minimum size=0.65cm},
        ]
            % Nodes
            \node[roundnode]        (X0)        at (1.2, -2)                 {$X_0$};
            \node[roundnode]        (X1)        at (-2.6, -2)                    {$X_1$};
            \node[dashednode]       (U0)        at (2, -.0)              {$U_0$};
            \node[dashednode]       (U1)        at (-2.4, -.0)              {$U_1$};
            \node[roundnode]        (T)         at (-.4, -.0)                   {$T$};
            \node[roundnode]        (Z)         at (-0.7, -2)                {$Z$};
            \node[roundnode]        (Y)         at (3.2, -2)                      {$Y$};
            
            %Edges
            \draw[latex-] (X1) -- (T);
            \draw[latex-] (X1) -- (Z);
            \draw[-latex] (Z) -- (X0);
            \draw[latex-, dashed] (X0) -- (U0);
            \draw[-latex, dashed] (U0) -- (Y);
            \draw[latex-, dashed] (T) -- (U1);
            \draw[-latex, dashed] (U1) -- (X1);
        \end{tikzpicture}
    \caption{DAG $\G$ with $\X = \{X_0, X_1\}$ and $\Y = \{Y\}.$} 
    \label{fig: counter-exmpl}
\end{figure} 
\subsection{Counterfactual identification}
Here, we refer to the technical report of \cite{correa2021nested} and construct a simple example that demonstrates our main concerns about the proof of the completeness part of the c-gID problem.

Recall that a causal effect $P_{\mathbf{T}}(\mathbf{Y}|\mathbf{X})$ can be written as a counterfactual $P(\mathbf{Y}_*, \mathbf{X}_*)$, where $\mathbf{Y}_* \cup \mathbf{X}_* = \{W_{[\mathbf{T}]}|W \in \mathbf{V}(\mathbf{Y}_* \cup \mathbf{X}_*)\}$ and $[\mathbf{T}]$ denotes an intervention under which the counterfactual value is observed. 
Now, consider the graph $\G$ in Fig. \ref{fig: counter-exmpl}.
Suppose that the known distribution is $P(\V)$ and the target conditional causal effect is 
$$
P_{T}(Y|X_0, X_1) = P(\X_*, \Y_*),
$$ 
where $\X_* = \{X_{0[T]}, X_{1[T]}\}$, $\Y_* = \{Y_{[T]}\}$, $\X = \{X_0, X_1\}$ and $\Y = \{Y\}$. 
Note that for both $X_0$ and $X_1$, there exists an active backdoor path to $Y$; thus, we cannot use the second rule of do-calculus to simplify $P_{T}(Y|X_0, X_1)$.
Please note that in this graph, $X_0, X_1, Z, Y$ belong to the same ancestral component (Def.~7 in \cite{correa2021nested}) induced by $\mathbf{X}_* \cup \mathbf{Y}_*$ given $\mathbf{X}_*$.  
This is because $Z \in An(X_{0[T]})_{\G_{\underline{X_0}}} \cap  An(Z_{[T]})_{\G}\cap An(X_{1[T]})_{\G_{\underline{X_1}}}$ and there is a bidirected arrow between $X_0$ and $Y$. 
This ancestral component contains $Y$ and, based on the definition of $\mathbf{D}_*$ (after Eq.~(69) in \cite{correa2021nested}), we have $\mathbf{D}_* = \{X_{0[T]}, X_{1[T]}, Z_{[T]}, Y_{[T]}\}$.
Furthermore, Equation (70) in \cite{correa2021nested} defines
$$
\rho(\x, \y) := \sum_{\mathbf{d}_*\setminus (\y_*\cup\x_*)}P(\bigwedge_{D_t\in \mathbf{D}_*}D_{\textbf{pa}_d} = d)
$$
 and in our example, it is equivalent to 
 $$
 P_{T}(Y = \y[Y], X_0 = \x[X_0], X_1 = \x[X_1]).
 $$
In part of the proof, they encounter a setting in which $\rho(\x, \y)$ and $\rho(\x)$ are not g-ID and they need to show that 
$$\rho(\y | \x)=\rho(\x, \y)/\rho(\x)$$
is not c-gID.
To do so, they consider two models $\M^{(1)}$ and $\M^{(2)}$ that show $\rho(\x, \y)$ is not g-ID and transform them into two new models to prove the non-c-gID of $\rho(\y | \x)$.
According to \cite{correa2021nested}, the realizations $\x', \y'$ are chosen such that, for models $\M^{(1)}$ and $\M^{(2)}$,
$$
\rho^{(1)}(\y',\! \x')\!\neq\! \rho^{(2)}(\y', \x').
$$
% Since $X_0, X_1$ and $Y$ do not have any children then distributions $P_{T}(Y, X_0)$, $P_{T}(Y, X_1)$ and $P_{T}(X_0, X_1)$ do not depend on the choice of distributions $P(X_1|\Pa{X_1}{\G})$, $P(X_0|\Pa{X_0}{\G})$ and $P(Y|\Pa{Y}{\G})$, respectively. 
Models $\M^{(1)'}$ and $\M^{(2)'}$ are obtained from models $\M^{(1)}$ and $\M^{(2)}$ as follows:
\begin{enumerate}
    \item Append an extra bit $U_p$ to the node $U_0$. 
    
    \item Define binary unobserved variables $X_p$ and $Y_p$ for the variables $X_0$ and $Y$, respectively.
    \item Rename $X_0$ and $Y$ as $\widetilde{X}_0$ and $\widetilde{Y}$ and make them unobserved. Then $X_0$ and $Y$ are redefined in models $\M^{(1)'}$ and $\M^{(2)'}$ as follows: $X_0:=\x'[X_0]$ if $X_p=1$, and $X_0:=\widetilde{X}_0$ otherwise. Similarly, $Y$ is defined using $Y_p$ and $\widetilde{Y}$.
\end{enumerate}
    % \begin{align*}
    %     & X_0 = 
    %     \begin{cases}
    %         & \x'[X_0] \quad \text{if} \; X_p=1,\\
    %         & \widetilde{X}_0 \quad \text{otherwise},
    %     \end{cases}
    %     \quad
    %      Y = 
    %     \begin{cases}
    %         & \y'[Y] \quad \text{if} \; Y_p=1,\\
    %         & \widetilde{Y} \quad \text{otherwise},
    %     \end{cases}
    % \end{align*}
%4. Distributions $P(X_p|U_p)$ and $P(Y_p|U_p)$ are defined such that: $ P(X_p=Y_p)= \gamma/2$ and  $P(X_p\neq Y_p)=(1-\gamma)/2$.
According to the definitions of $\rho(\x,\y)$, $\widetilde{Y}$, and $\widetilde{X}_0$, and using the law of total probability, we have
\begin{equation*}
    \rho'(\x', \y')\! =\! \sum_{X_p, Y_p, \widetilde{X}_0, \widetilde{Y}}\rho'(\x', \y', \widetilde{X}_0, \widetilde{Y}| X_p, Y_p)P(X_p, Y_p)
\end{equation*}
and therefore 
\begin{equation}
\begin{split}
    \label{eq:1}
     \rho'(\x', \y') = &P(X_p=0, Y_p=0)\rho(\x', \y') + \\
    & P(X_p=1, Y_p = 0)\rho(\x'[X_1], \y') + \\
    & P(X_p=0, Y_p=1)\rho(\x') + \\
    & P(X_p=1, Y_p=1)\rho(\x'[X_1]).
\end{split}
\end{equation}
Clearly, $\rho(\x'[X_1])\neq 1$; otherwise, the positivity assumption would not hold. On the other hand, based on Eqs.~(78)--(81) of \cite{correa2021nested}, $\rho'(\x', \y')$ is computed as 
\begin{equation}\label{eq:2}
\begin{split}
    & P(X_p=0, Y_p=0)\rho(\x', \y') +\\
    & P(X_p=1, Y_p=0)\rho( \y') +\\
    & P(X_p=0, Y_p=1)\rho(\x') +\\
    &P(X_p=1, Y_p=1).
\end{split}
\end{equation}
In general, \eqref{eq:1} and \eqref{eq:2} are not equal unless, for example, $\X=\{X\}$ and $\Y=\{Y\}$. 

Moreover, the rest of the proof in \cite{correa2021nested}, i.e., Eqs.~(83)--(92), relies heavily on Eq.~\eqref{eq:2}; therefore, without a corresponding fix, the whole proof of the completeness part of the c-gID problem falls apart.

% \bibliography{kivva_47}

\end{document}
