% \documentclass{uai2024} % for initial submission
\documentclass[accepted]{uai2024} % after acceptance, for a revised version; 
% also before submission to see how the non-anonymous paper would look like 
                        
%% There is a class option to choose the math font
% \documentclass[mathfont=ptmx]{uai2024} % ptmx math instead of Computer
                                         % Modern (has noticeable issues)
% \documentclass[mathfont=newtx]{uai2024} % newtx fonts (improves upon
                                          % ptmx; less tested, no support)
% NOTE: Only keep *one* line above as appropriate, as it will be replaced
%       automatically for papers to be published. Do not make any other
%       change above this note for an accepted version.

%% Choose your variant of English; be consistent
\usepackage[american]{babel}
% \usepackage[british]{babel}

%% Some suggested packages, as needed:
\usepackage{natbib} % has a nice set of citation styles and commands
    \bibliographystyle{plainnat}
    \renewcommand{\bibsection}{\subsubsection*{References}}
\usepackage{mathtools} % amsmath with fixes and additions
% \usepackage{siunitx} % for proper typesetting of numbers and units
\usepackage{booktabs} % commands to create good-looking tables
\usepackage{tikz} % nice language for creating drawings and diagrams

\DeclareMathOperator*{\argmax}{argmax}
\usepackage{defs}
\usepackage{mathrsfs}
\usepackage{amsfonts}
\usepackage{amssymb}
\usepackage{pgfplots}
\usepackage{multicol}
\usepackage{caption}
\usepackage{subcaption}
% \usepackage{enumitem}
\usepackage{multirow}
\usepackage{bm}
\usepackage[noend]{algpseudocode}
\usepackage{algorithm}
% \usepackage{algorithmic}
\usepackage[switch]{lineno}

%Commenting
\newcommand{\manuj}[1]{\todo[inline,caption={},color=orange!40]{{\it Manuj:~}#1}}
\newcommand{\james}[1]{\todo[inline,caption={},color=blue!40]{{\it James:~}#1}}
\newcommand{\mike}[1]{\todo[inline,caption={},color=yellow!40]{{\it Mike:~}#1}}

\newtheorem{example}{Example}
\newtheorem{theorem}{Theorem}
\newtheorem{proposition}{Proposition}
\newtheorem{corollary}{Corollary}
\newtheorem{lemma}{Lemma}
\newtheorem{remark}{Remark}
\newtheorem{definition}{Definition}

\title{Characterising Interventions in Causal Games}

% The standard author block has changed for UAI 2024 to provide
% more space for long author lists and allow for complex affiliations
%
% All author information is authomatically removed by the class for the
% anonymous submission version of your paper, so you can already add your
% information below.
%
% Add authors
\author[1]{\href{mailto:<manujmishra2000@gmail.com>?Subject=Your UAI 2024 paper}{Manuj Mishra}}
\author[1,2]{James Fox}
\author[1]{Michael Wooldridge}
% Add affiliations after the authors
\affil[1]{%
    Department of Computer Science\\
    University of Oxford\\
    UK
}
\affil[2]{%
    London Initiative for Safe AI\\
    UK
}
% \affil[3]{%
%     Alan Turing Institute\\
%     London, UK
% }
  
\begin{document}
\maketitle

\begin{abstract}
  \emph{Causal games} are probabilistic graphical models that enable causal queries to be answered in multi-agent settings. They extend causal Bayesian networks by specifying decision and utility variables to represent the agents' degrees of freedom and objectives. In multi-agent settings, whether each agent decides on their policy before or after knowing the causal intervention is important as this affects whether they can respond to the intervention by adapting their policy. Consequently, previous work in causal games imposed chronological constraints on permissible interventions. We relax this by outlining a sound and complete set of primitive causal interventions so the effect of any arbitrarily complex interventional query can be studied in multi-agent settings. We also demonstrate applications to the design of safe AI systems by considering causal mechanism design and commitment.
\end{abstract}

\section{Introduction}\label{sec:intro}

When designing a system for rational, self-interested agents, it is important to incentivise behaviour that aligns with high-level goals, such as maximising social welfare or minimising the harm to other agents. To address this, game theory provides several representations that have different strengths and weaknesses depending on the setting. \citet{causal_games} recently introduced \textit{causal games} to extend \citet{pearl2009causality}'s `causal hierarchy' to the multi-agent setting. Causal games are graphical representations of dynamic non-cooperative games, which can be more compact and expressive than extensive-form games \citep{maids,hammond2021equilibrium}. Like causal Bayesian networks, they use a directed acyclic graph (DAG) to represent causal relationships between random variables, but they also specify decision and utility variables. Each agent selects a policy -- independent conditional probability distributions (CPDs) over actions for each of their decision variables -- to maximise their expected utility. 

Causal Bayesian networks handle interventions in settings without agents by cutting any edges incident to the intervened node in the DAG to represent that the effect of an intervention can only propagate downstream. However, to handle how an agent might or might not adapt their policy in response to an intervention, mechanised graphs extend the regular DAG by explicitly representing each variable's distribution and showing which other variables' distributions matter to an agent optimising a particular decision rule \citep{causal_games,dawid2002influence}.

\paragraph{Related Work:} 
The effect of causal interventions is important in many fields such as economics~\citep{heckman2022causality,leroy2004causality}, computer science~\citep{brand2023recent} and public health~\citep{ahern2009estimating, glass2013causal}. However, these fields use models that do not account for the strategic nature of multi-agent systems. Recently, causal games~\citep{causal_games} were introduced to unify the power of causal and strategic reasoning in one model. Causal games and their single-agent variant, causal influence diagrams~\citep{agent_incentives}, have been used to design safe and fair AI systems~\citep{ashurst2022fair,everitt2021reward,farquhar2022path,carroll2023characterizing}, explore reasoning patterns and deception~\citep{pfeffer2007reasoning,ward2022agent}, and identify agents from data~\citep{kenton2023discovering}. The key limitation is that existing work on multi-agent causal models assumes that an intervention is either fully post-policy (entirely invisible) to all agents or fully pre-policy (entirely visible) to all agents before they decide on their decision rule at each decision point. 

\paragraph{Contributions:}
Our most important novel contribution is to extend the theory of interventions in causal games to be able to accommodate arbitrary queries where agents choose their decision rules based on any subset of the interventions (those visible to them). This is necessary to discuss richer properties of causal games and calculate certain specifications. First, in Section \ref{sec:prim}, we present a sound and complete set of primitive causal interventions that enable any causal intervention (a game modification) to be decomposed into one of four operations acting on CPDs or functions acting on such distributions. Second, in Section \ref{sec:interventional_queries}, we prove that this generalises \citet{causal_games}'s notion of pre-policy and post-policy interventions, which assume that interventions are either visible to all agents (pre-policy) or no agents (post-policy), to arbitrarily complex compound interventions. In Section \ref{sec:CMD}, we explore how our theoretical contributions are useful for both qualitative and quantitative specifications in causal mechanism design. The former exploits graphical properties of the causal game's mechanised graph, and the latter formalises the effect of taxation and reward schemes. Finally, in Section \ref{sec:commit}, we show how causal games can be helpful for representing `commitment', where one agent can gain a strategic advantage over others by committing to a policy before the game begins.

\section{Background}

This section reviews \citet{causal_games}'s Causal Games. We begin with an example.

\begin{example}[\citet{spence1978job}'s Job Market Signalling Game]
    \label{ex:job_market}
    A worker who is either hard-working or lazy is hoping to be hired by a firm. They can choose to pursue university education but know that they will then suffer from three years of studying, especially if they are lazy. 
    The firm prefers hard workers but is using an automated hiring system that can only observe the worker’s education, not their temperament.
\end{example}

\begin{figure}[]
    \centering
    % \vspace{-1em}
    \begin{subfigure}[b]{0.45\linewidth}
        \centering
        \resizebox{0.75\width}{!}{
        \begin{influence-diagram}
            \node (T) [] {$T$};
            \node (U1) [utility, right = of T, player1] {$U^1$};
            \node (U2) [utility, right = of U1, player2] {$U^2$};
            \node (D1) [decision, below right = 1.4cm and 0.7cm of T, player1] {$D^1$};
            \node (D2) [decision, right = of D1, player2] {$D^2$};
            \edge {T} {D1};
            \edge {D1} {D2};
            \path (T) edge[->, bend left=45] (U2);
            \edge {T} {U1};
            \edge {D1} {U1};
            \edge {D2} {U1,U2};
        \end{influence-diagram}
        }
        \caption{}
        \label{fig:signal:a}
    \end{subfigure}
    \begin{subfigure}[b]{0.54\linewidth}
        \centering
        \resizebox{0.75\width}{!}{
        \begin{influence-diagram}
        \node (X) [] {$T$};
        \node (U1) [utility, right = of X, player1] {$U^1$};
        \node (U2) [utility, right = of U1, player2] {$U^2$};
        \node (D1) [decision, below right = 1.4cm and 0.7cm of X, player1] {$D^1$};
        \node (D2) [decision, right = of D1, player2] {$D^2$};
        \edge {X} {D1};
        \edge {D1} {D2};
        \path (X) edge[->, bend left=45] (U2);
        \edge {X} {U1};
        \edge {D1} {U1};
        \edge {D2} {U1,U2};
        \node (X_mec) [relevancew, above = of X] {$\Theta_T$};
        \node (U2_mec) [relevancew, above = of U2] {$\Theta_{U^2}$};
        \node (D1_mec) [relevanceb, below = of D1] {$\Pi_{D^1}$};
        \node (U1_mec) [relevancew, above = of U1] {$\Theta_{U^1}$};
        \node (D2_mec) [relevanceb, below = of D2] {$\Pi_{D^2}$};
        \edge[gray] {X_mec} {X};
        \edge[gray] {D1_mec} {D1};
        \edge[gray] {D2_mec} {D2};
        \edge[gray] {U1_mec} {U1};
        \edge[gray] {U2_mec} {U2};
        \node (space1) [minimum size=0mm, node distance=2mm, below = 0.7cm of D1, draw=none] {};
        \draw (X_mec) edge[gray,in=180,out=-135] (space1.center)
        (space1.center) edge[gray,->,out=0,in=135] (D2_mec);
        \node (space3) [minimum size=0mm, node distance=2mm, left = 0.7cm of D1, draw=none] {};
        \draw (U1_mec) edge[gray,in=90,out=-110] (space3.center)
        (space3.center) edge[gray,->,out=-90,in=135] (D1_mec);
        \path (D1_mec) edge[gray,->, bend right=15] (D2_mec);
        \path (D2_mec) edge[gray,->, bend right=15] (D1_mec);
        \draw (X_mec) edge[gray,->,out=-135,in=155] (D1_mec);
        \draw (U2_mec) edge[gray,->, out=-45, in=25] (D2_mec);
    \end{influence-diagram}
        }
        \caption{}
        \label{fig:signal:b}
    \end{subfigure}
 \caption{A causal game's (a) graph and (b) mechanised graph for Example \ref{ex:job_market}.}
    \label{fig:signal}
\end{figure}

We use capital letters $V$ for random variables, lowercase letters $v$ for their instantiations, and bold letters $\bm{V}$ and $\bm{v}$ respectively for sets of variables and their instantiations.
We let $\dom(V)$ denote the finite domain of $V$ and let $\dom(\bm{V}) \coloneqq {\bigtimes}_{V \in \bm{V}}\dom(V)$. $\Pa_V$ denotes the parents of variable $V$ in a graphical representation and $\pa_V$ the instantiation of $\Pa_V$. We also define $\Ch_V$, $\Anc_V$, $\Desc_V$, and $\Fa_V \coloneqq \Pa_V \cup \{V\}$ as the children, ancestors, descendants, and family of $V$, respectively. As with $\pa_V$, their instantiations are written in lowercase. We use superscripts to indicate an agent \label{def:agent} $i \in N = \{1, \dots, n\}$ and subscripts to index the elements of a set; for example, the decision variables belonging to agent $i$ are denoted $\bm{D}^i = \{D^i_1,\ldots,D^i_m\}$.

\subsection{Causal Games}
Causal games (CGs) are causal multi-agent influence diagrams \citep{maids,causal_games}.
Influence diagrams were initially devised to model single-agent decision problems graphically \citep{influence_diagrams, miller1976development}. They are defined similarly to 
a Bayesian network (BN) but with additional utility variables and parameter-less decision variables. A \textit{causal Bayesian network} (CBN) is a BN with edges that faithfully represent causal relationships \citep{pearl2009causality}. So, a CG is a game-theoretic CBN, where agents select a conditional distribution over actions at their decision variables to maximise the expected cumulative value of their utility variables. The simplest causal intervention $\Do(\bm{Y}=\bm{y})$ in a CBN or CG fixes the values of variables $\bm{Y}$ to some $\bm{y}$; we denote the resulting joint distribution by $\Pr_{\bm{y}}(\bm{V})$.

\begin{definition}
    \label{def: causal_game} 
    A \textbf{causal game (CG)} is a structure $\model = (\graph, \params)$ where $\graph = (\agents, \vars, \edges)$ specifies a set of agents $\agents = \set{1, \ldots, n}$ and a directed acyclic graph (DAG) ($\vars, \edges$) where $\bm{V}$ is partitioned into chance variables $\bm{X}$, decision variables $\bm{D} = \bigcup_{i \in N} \bm{D}^i$, and utility variables $\bm{U} = \bigcup_{i \in N} \bm{U}^i$. The parameters $\bm{\theta} = \{\theta_{V}\}_{V \in \bm{V} \setminus \bm{D}}$ define the CPDs $\Pr(V \mid \Pa_V ; \theta_V)$ for each non-decision variable such that for \emph{any} parameterisation of the decision variable CPDs, the induced model with joint distribution $\Pr^{\policyprof}(\bm{v})$ is a causal Bayesian network, i.e., $\graph$ is Markov compatible with $\Pr^{\policyprof}_{\bm{y}}$ for every $\bm{Y} \subseteq \bm{V}$ and $\bm{y} \in \dom(\bm{Y})$, and that:
        \noindent
        \begingroup
        \small   
  \thinmuskip=\muexpr\thinmuskip*5/8\relax
  \medmuskip=\muexpr\medmuskip*5/8\relax  
        $$\jointdistr^{\policyprof}_{\bm{y}}(v \mid \pa_V) =
        \begin{cases}
            1 & \text{\hspace{-.8em} $V \in \bm{Y}$, $v$ is consistent with $\bm{y}$,}\\
            \Pr^{\policyprof}(v \mid \pa_V) & \text{\hspace{-.8em} $V \notin \bm{Y}$, $\pa_V$ is consistent with $\bm{y}$.}\\
        \end{cases}$$
        \endgroup
\end{definition}

Figure \ref{fig:signal:a} depicts a causal game for Example \ref{ex:job_market}. White circles represent chance variables, e.g., the worker's temperament ($T$) with probabilities $p$ for hard-working and $1-p$ for lazy. Decision and utility variables are squares and diamonds, respectively. The worker's decision ($D^1$: attend university or not) and utility ($U^1$) are shown in red, while the firm's decision ($D^2$: offer a job or not) and utility ($U^2$) are in blue. Missing edges, like $T \rightarrow D^2$, indicate an agent's lack of information. The worker receives utility $5$ for a job offer but incurs a $1$ or $2$ cost for attending university (depending on their temperament). The firm gains $3$ for hiring a hard worker but suffers a cost of $2$ if they hire a lazy worker or an opportunity cost of $1$ if they reject a hard worker. Parameters $\bm{\theta}$ define conditional distributions for $T$, $U^1$, and $U^2$.

Given a causal game $\model = (\graph, \bm{\theta})$, a \textbf{decision rule} $\pi_D$ for $D \in \bm{D}$ is a CPD $\pi_D(D \mid \Pa_D)$ and a \textbf{partial policy profile} $\pi_{\bm{D}'}$ is a set of decision rules $\pi_D$ for each $D \in \bm{D}' \subseteq \bm{D}$, where we write $\pi_{-\bm{D}'}$ for the set of decision rules for each $D \in \bm{D} \setminus \bm{D}'$. 
A \textbf{policy} ${\bm{\pi}}^i$ refers to ${\bm{\pi}}_{\bm{D^i}}$, and a (full) \textbf{policy profile} ${\bm{\pi}} = ({\bm{\pi}}^1,\ldots,{\bm{\pi}}^n)$ is a tuple of policies, where ${\bm{\pi}}^{-i} \coloneqq ({\bm{\pi}}^1, \dots, {\bm{\pi}}^{i-1}, {\bm{\pi}}^{i+1}, \dots, {\bm{\pi}}^n)$. 
A decision rule is \textbf{pure} if $\pi_D(d \mid \pa_D) \in \{0,1\}$ and \textbf{fully stochastic} if $\pi_D(d \mid \pa_D) > 0$ for all $d \in \dom(D)$ and each  \textbf{decision context} $\pa_D \in \dom(\Pa_D)$; this holds for a policy (profile) if it holds for all decision rules in the policy (profile).

By combining ${\bm{\pi}}$ with the partial distribution $\Pr$ over the chance and utility variables, we obtain a joint distribution $\Pr^{\bm{\pi}}(\bm{x},\bm{d},\bm{u}) \coloneqq \prod_{V \in \bm{V} \setminus \bm{D}} \Pr (v \mid \pa_{V}) \cdot \prod_{D \in \bm{D}} \pi_{D} (d \mid \pa_{D})$\label{def:jointMAID} over all the variables in $\model$; inducing a BN. The \textbf{expected utility} for Agent $i$ given a policy profile ${\bm{\pi}}$ is defined as the expected sum of their utility variables in this BN, that is $\exputility_{\policyprof}[\utilvars^i] = \sum_{U \in \sU^i} \sum_{u \in \dom (U)} \jointdistr^{\policyprof} (U = u) \cdot u$\label{def:EU}. A policy ${\bm{\pi}}^i$ is a \textbf{best response} to profile ${\bm{\pi}}^{-i}$ if $\exputility_{({\bm{\pi}}^i,{\bm{\pi}}^{-i})}[\utilvars^i] \geq \exputility_{({\bm{\tilde{\pi}}}^i,{\bm{\pi}}^{-i})}[\utilvars^i]$ for all ${\bm{\tilde{\pi}}}^i \in {\bm{\Pi}}^i$. A \textbf{Nash equilibrium} (NE) is a policy profile where each agent plays a best response. A causal game is solved by finding a policy profile that satisfies a solution concept, usually an NE. 

Causal games offer several explainability and complexity advantages over extensive form games \cite{maids}. One key advantage is that probabilistic dependencies between chance and strategic variables can be exploited using the \textit{d-separation} graphical criterion \cite{pearl1988probabilistic}.

\begin{definition}
    \label{def:dsep}
    A \textbf{path}, $p$, in a DAG\footnote{We use that d-separation remains a valid test for conditional independence in cyclic graphs \citet{cyclicdsep}.} $\graph = (\bm{V}, \mathscr{E})$ is a sequence of adjacent variables in $\bm{V}$. A path $p$ is said to be \textbf{d-separated} by a set of variables $\bm{Y}$ if and only if:
    \begin{itemize}
        \item $p$ contains a \emph{chain} $X \rightarrow W \rightarrow Z$ or $X \gets W \gets Z$, or a \emph{fork} $X \leftarrow W \rightarrow Z$, and $W \in \bm{Y}$.
        \item $p$ contains a \emph{collider} $X \rightarrow W \leftarrow Z$ and $(\{W\} \cup \Desc_W) \cap \bm{Y} = \varnothing$.
    \end{itemize}
    A set $\bm{Y}$ \textbf{d-separates} $\bm{X}$ from $\bm{Z}$ ($\bm{X} \perp_\graph \bm{Z} \mid \bm{Y}$), if $\bm{Y}$ d-separates every path in $\graph$ from a variable in $\bm{X}$ to a variable in $\bm{Z}$. Sets of variables that are not d-separated are said to be \textbf{d-connected}, denoted $\bm{X} \not\perp_\graph \bm{Z} \mid \bm{Y}$.
    \end{definition}

If $\bm{X} \perp_\graph \bm{Z} \mid \bm{Y}$ in $\graph$, then $\bm{X}$ and $\bm{Z}$ are probabilistically independent conditional on $\bm{Y}$ in the sense that $\Pr(\bm{x} \mid \bm{y}, \bm{z}) = \Pr(\bm{x} \mid \bm{y})$, in every distribution $\Pr$ that is Markov compatible with $\graph$ and for which $\Pr(\bm{y}, \bm{z})>0$. Conversely, if $\bm{X} \not\perp_\graph \bm{Z} \mid \bm{Y}$, then $\bm{X}$ and $\bm{Z}$ are dependent conditional on $\bm{Y}$ in at least one distribution Markov compatible with $\graph$. For example, there are several paths from $U^2$ to $U^1$ in Figure \ref{fig:signal:a}: direct forks through $T$ or $D^2$, a fork through $T$ and then a forward chain through $D^1$, or a backward chain through $D^2$ and then a fork through $D^1$. If $\bm{Y} = \varnothing$, then $U^2$ is d-connected to $U^1$ ($U^2 \not\perp_\graph U^1\mid\varnothing$), but if $\bm{Y} = \{T, D^2\}$ then all of the paths have been blocked by conditioning on $\bm{Y}$ and so $U^2 \perp_\graph U^1\mid\bm{Y}$.

A causal game's regular graph $\graph$ captures the dependencies between \textbf{object-level} variables in the environment, but its \textbf{mechanised graph} $\mec{\graph}$ is an enhanced representation revealing the strategically relevant dependencies between agents' decision rules and the parameterisation of the game \citep{causal_games}. Collectively, decision rules and CPDs are known as the mechanisms $\mecvars$ of the decision, and chance/utility variables, respectively. Each object-level variable $V \in \bm{V}$ has a mechanism parent $\mecvar_V$ representing the distribution governing $V$. More specifically, each decision $D$ has a new decision rule parent $\Pi_D = \mecvar_D$ and each non-decision $V$ has a new parameter parent $\Theta_V = \mecvar_V$, whose values parameterise the CPDs. The \textit{independent mechanised graph} is the result (it has no inter-mechanism edges).

However, agents select a decision rule $\pi_D$ (i.e., the value of a decision rule variable $\Pi_D$) based on both the parameterisation of the game (i.e., the values of the parameter variables) and the selection of the other decision rules ${\bm{\pi}}_{-D}$ -- so these dependencies are captured by the edges from other mechanisms into decision rule nodes. These reflect some \emph{rationality assumptions}, captured by a set of \emph{rationality relations} $\mathcal{R}$ = $\{r_D\}_{D\in\bm{D}}$ that represent how the agents choose their decision rules. Each decision rule $\Pi_D$ is governed by a \emph{serial relation} $r_D \subseteq \dom(\Pa_{\Pi_D}) \times \dom(\Pi_D)$, which accounts for the fact that an agent may not deterministically choose a single decision rule $\pi_D$ in response to some $\pa_{\Pi_D}$. If all of the rationality relations $\mathcal{R}$ are satisfied by $\pi$, then $\pi$ is an $\mathcal{R}$-rational outcome of the game. We often assume that the agents are playing best responses $\mathcal{R} = \rbr$, so the $\rbr$-rational outcomes are simply the NE of the game. 

Finally, a graphical criterion $\mathcal{R}$-reachability (based on d-separation) determines which of these edges are necessary in the mechanised graph, e.g., $\mecvar_V \rightarrow \Pi_D$ exists if and only if the choice of best response decision rule $\Pi_D$ depends on the CPD at $\mecvar_V$ ($\mecvar_V$ is $\rbr$-relevant to $\Pi_D$). The mechanised graph for Example \ref{ex:job_market} (in Figure \ref{fig:signal:b}) shows that $\Theta_T$, $\Theta_{U^1}$, and $\Pi_{D^2}$ are all $\rbr$-relevant to $\Pi_{D^1}$ whereas $\Theta_{T}$, $\Theta_{U^2}$, and $\Pi_{D^1}$ are $\rbr$-relevant to $\Pi_{D^2}$. In contrast to a causal game's regular DAG, there may exist cycles between mechanisms (see \citep{causal_games} for more details). 

So, the mechanised graph $\mec{\graph}$ takes the original graph $\graph$ and, for each variable $V \in \vars$, adds mechanism parent node $\mecvar_V$ and edge $\mecvar_V \rightarrow V$ as well as edges $\mecvar_V \rightarrow \Pi_D$ for each decision rule $\Pi_D$ where $\mecvar_V$ is $\rbr$-relevant to $\Pi_D$.

\section{Characterising Interventions} \label{sec:interventions}

Causal games admit queries on level two of \citet{pearl2009causality}'s \emph{Causal Hierarchy}. Importantly, in game-theoretic settings, we only assume that an $\R$-rational outcome of the game (e.g., an NE) is chosen rather than some unique policy profile $\pi$. We therefore evaluate queries with respect to a set of policy profiles, e.g., `if $D^1=g$, is it the case that for all NE\ldots'. When an intervention takes place is important. 
\citet{causal_games} previously introduced a distinction between \textit{pre-policy} queries, where the intervention occurs before the policy profile is selected, and \textit{post-policy} queries, where the intervention occurs after. We extend this to accommodate arbitrary queries where each agent makes decisions based on the subset of interventions visible to them. 

\subsection{Primitive Interventions}\label{sec:prim}

Given a causal game $\model$ with mechanised graph $\mec \graph$ and rationality relations $\R$, an intervention $\I$ is a function that maps a set of joint probability distributions $\set{\jointdistr^{\policyprof}(\sv)}_{\policyprof \in \R}$ to a new set $\set{\jointdistr^{\policyprof}(\sv_\I)}_{\policyprof \in \R^*}$ where $\R^*$ are the rationality relations of the intervened game with graph $\mec \graph_\I$ and $\jointdistr^{\policyprof}(\sv_\I)$ is the joint probability distribution represented by the CBN induced by $\mec \graph_\I$ when parameterised over policy profile $\policyprof$. We define four primitive types of intervention.

\textbf{(1) Fixing an object-level variable:}
Intervening on variable $X$ replaces $\jointdistr^{\policyprof}(x \mid \pa_X)$ with a new CPD $\jointdistr^{\I}(x \mid \pa_X^*)$. Graphically, when $\pa_X^* \neq \pa_X$, the incoming edges to $X$ are changed such that $V \rightarrow X$ exists if and only if $V \in \pa_X^*$. The induced distribution is:
\begin{equation*}
\jointdistr^{\policyprof}(\sv_\I) = \jointdistr^{\I}(x \mid \pa_X^*) \cdot \prod_{V \in \vars \setminus \set{X}} \jointdistr^{\policyprof}(v \mid \pa_V)
\end{equation*}

A \textit{hard object-level intervention} assigns $\jointdistr^\I = \delta(X, g)$. In \citet{pearl2009causality}'s do-calculus, this is written $\Do (X=g)$. Any other form of object-level intervention is qualified as \textit{soft}. 

\textbf{(2) Fixing a mechanism variable:}
A \textit{hard mechanism-level intervention} $\Do (\mecvar_V = \mecval_V)$ sets the distribution over each mechanism $\mecvar_V$ to $\delta(\mecvar_V, \mecval_V)$. Any other form of mechanism-level intervention is qualified as \textit{soft}.
A mechanism-level intervention on decision rule $\Pi_D$ replaces $r_D: \dom (\Pa_{\Pi_D}) \rightarrow \dom (\Pi_D)$ with a new rationality relation $r_D^{\I}: \dom(\Pa_{\Pi_D}^*) \rightarrow \dom(\Pi_D)$. Graphically, when $\Pa_{\Pi_D}^* \neq \Pa_{\Pi_D}$, the incoming edges to variable $\Pi_D$ are changed such that $V \rightarrow \Pi_D$ exists if and only if $V \in \Pa_{\Pi_D}^*$. For a parameter variable $\Theta_V$ of $V \in \vars \setminus \decvars$, an intervention assigns a new distribution from the set of all CPDs over set $V$ given the values of its parents, set $Pa_V$. Note that parameter variables don't have parent mechanism variables as inputs to the choice of distribution.

\textbf{(3) Adding a new object-level variable:}
Adding a new object-level variable $Y$ introduces a new CPD $\jointdistr^{\I}(y \mid \pa_Y)$ to the joint distribution factorisation. Graphically, this adds a new node $Y$ to $\graph$ and adds edges $X \rightarrow Y$ for all $X \in \Pa_Y$ and $Y \rightarrow Z$ for all $Z \in \Ch_Y$. The induced distribution is
\begin{equation*}
\jointdistr^{\policyprof}((\sv \cup Y)_\I) = \jointdistr^{\I}(y \mid \pa_Y) \cdot \prod_{V \in \vars} \jointdistr^{\policyprof}(v \mid \pa_V^*)
\end{equation*}
\begin{equation*}
\text{where, for  } V \in \vars \text{, } \Pa_V^* = 
\begin{cases}
    \Pa_V \cup {Y} & \text{ if } V \in \Ch_Y\\
    \Pa_V & \text{ otherwise}
 \end{cases}
\end{equation*}
\textbf{(4) Removing an existing object-level variable:}
Removing an existing object-level variable $Y$ removes the CPD $\jointdistr^{\policyprof}(y \mid \pa_Y)$ from the joint distribution factorisation. Graphically, this removes the node $Y$ from $\graph$ and removes edges $X \rightarrow Y$ for all $X \in \Pa_Y$ and $Y \rightarrow Z$ for all $Z \in \Ch_Y$. The induced distribution is
\begin{equation*}
\jointdistr^{\policyprof}((\sv \setminus \set{Y})_\I) = \prod_{V \in \vars \setminus \set{Y}} \jointdistr^{\policyprof}(v \mid \pa_V^*)
\end{equation*}
\begin{equation*}
\text{where, for  } V \in \vars \text{, } \Pa_V^* = 
\begin{cases}
    \Pa_V \setminus \set{Y} & \text{ if } V \in \Ch_Y\\
    \Pa_V & \text{ otherwise}
\end{cases}
\end{equation*}

\begin{remark}
After any intervention of type 1, 3, or 4, $\mec \graph$ must be updated to reflect any changes in $\mathcal{R}$-reachability between mechanisms. Note that a type 1 intervention can be considered a type 4 intervention followed by a type 3 intervention, but we include it as a primitive for convenience.
\end{remark}

\begin{theorem}
\label{theorem:prim}
Primitive interventions are a sound and complete formulation of causal interventions. 
\end{theorem}
\begin{proof}[Proof sketch]
    Soundness comes because each primitive intervention corresponds with a function between a set of probability distributions induced by $\mathcal{R}$-rational outcomes to a new set of probability distributions induced by (a possibly different) set of $\mathcal{R}$-rational outcomes. This makes it a valid causal intervention. Completeness is shown by proving any valid intervention can be decomposed into an equivalent set of primitive interventions. We relegate the full proof to Appendix~\ref{app:proof}.
\end{proof}

There are a number of other interesting intervention types that can be constructed by composing these primitives. 

\textbf{Unfixing an object-level variable:}
For every type 1 intervention $\I$ which fixes variable $X$, there is a type 1 inverse intervention $\I'$ which unfixes it. It restores the intervened CPD to be based on the original policy profile $\policyprof$ and parents $\Pa_X$, rather than $\I$ and $\Pa_X^*$.

\textbf{Unfixing a mechanism variable:}
Similarly, for every type 2 intervention $\I$ which fixes a variable $\Pi_D$, there exists a type 2 inverse intervention $\I'$ which unfixes it. This restores the rationality relation associated with $\Pi_D$ to its default $r_D$, rather than $r_D^{\I}$. It also makes the mechanism conditionally dependent on the original parents $\Pa_{\Pi_D}$ rather than $\Pa_{\Pi_D}^*$.

\textbf{Adding an object-level dependency:}
Adding a dependency, e.g., $\Add (X \rightarrow Y)$, is equivalent to a type 1 intervention where $\jointdistr^{\I}(y \mid \pa_Y) = \jointdistr^{\policyprof}(y \mid \pa_Y \cup \set{X})$.

\textbf{Removing an object-level dependency:}
Removing a dependency, e.g., $\Del (X \rightarrow Y)$, is equivalent to a type 1 intervention where $\jointdistr^{\I}(y \mid \pa_Y) = \jointdistr^{\policyprof}(y \mid \pa_Y \setminus \set{X})$.

\subsection{Interventional Queries} \label{sec:interventional_queries}
An interventional query concerns the outcome of a game after a set of causal interventions $\sI$, where each agent is privy to the state of the game after a subset of these interventions has been performed. We say that an intervention is \textit{visible} to an agent if the agent has an opportunity to adapt their policy to that intervention. Consider Example~\ref{ex:job_market}. Unbeknownst to the firm, the worker may have an alternative job offer which changes her best-response policy. Simultaneously, the firm may have new hiring quotas, which change their payoffs and, therefore, their best response, but which are not disclosed to the worker. These two external interventions can be expressed in a unified analysis using our framework.

First, we introduce some new notation. $\prims$ denotes a set of primitive interventions. $\sI^i \subseteq \sI$ denotes the set of interventions visible to agent $i$. $\sI(\model)$ denotes the state of the causal game after applying interventions $\sI$ in any order. The $\circ$ operator denotes ordered composition where $(\sI_1 \circ \sI_0)(\model)$ is the state of the game after applying $\sI_0$ then $\sI_1$. As shorthand, $\I_0 \circ \I_1$ means $\set{\I_0} \circ \set{\I_1}$.

\begin{remark}
The order in which interventions are applied is important because interventions are not commutative. Consider, for example, two hard object-level interventions on the same variable but to different CPDs, $\delta(X, a)$ and $\delta(X, b)$. Then clearly $(\Do(X=a) \circ \Do(X=b))(\model) \not \equiv (\Do(X=b) \circ \Do(X=a))(\model)$.
\end{remark}
The $\mathcal{R}$-rational outcomes of the game after each agent $i$ has an opportunity to adapt to her visible interventions $\I^i$, is denoted $\R(\model_I)$. $\Theta_I$ denotes the parameterisation of non-decision mechanisms after interventions $\I$. Using this, we define an interventional query which Theorem \ref{thm:decomp} proves can always be decomposed into primitive intervention sets.

\begin{definition}[Interventional Query]
    Given CG $\model$, rationality relations $\R$, and set of visible interventions for each agent $\sI^1 , \ldots, \sI^N$, an interventional query $\phi(\policyprof)$ is a first-order logical formula that acts on the joint probability distribution $\jointdistr^{\policyprof}$ induced by $\R$-rational outcome $\policyprof \in \R(\model_{\sI})$ and parameterisation $\Theta_{\sI}$ where $\sI = \sI^1 \cup \ldots \cup \sI^N$.
\end{definition}

\begin{theorem}[Decomposition of Intervention Sets] \label{thm:decomp}
For any set of interventions $\sI$, where $\sI^i \subseteq \sI$ is the subset of interventions visible to agent $i$, there are primitive intervention sets $\prims_0, \ldots, \prims_{m}$, such that
\begin{equation} 
     \forall i~\exists j \in \set{0,\ldots,m} : \sI^i(\model)= (\prims_j \circ \prims_{j-1} \ldots \circ \prims_{0})(\model)
\end{equation}
\end{theorem}
That is to say, for any set of interventions $\sI$, where the visible set of each agent is an \textit{arbitrary} subset, $\sI^i \subseteq \sI$, we can construct an \textit{ordered} list of primitive interventions such that, after the first $j$ sets of primitive interventions, the state of the game is the exact state visible to Agent $i$ when choosing her policy. We prove Theorem \ref{thm:decomp} in Appendix~\ref{app:proof}. 

Taking this decomposition, we uniquely partition the agents into sets $A_0, \ldots, A_m$ according to the state of the game visible to them. The $\texttt{decompose}$ function maps $\I$ to sets $\prims_0, \ldots, \prims_m$ satisfying Theorem \ref{thm:decomp} and the corresponding partition of the agents $A_0, \ldots, A_m$. Then, Algorithm~\ref{alg:inter_query} solves the interventional query by iteratively calculating the $\R$-rational outcomes (e.g., NEs if $\R=\rbr$), fixing the policies of agents who cannot observe future interventions, and applying interventions. This subsumes \cite{causal_games}'s pre-policy and post-policy interventional queries. The computational complexity of Algorithm~\ref{alg:inter_query} is (in general) intractable, but as is almost any inference problem in Bayesian networks \cite{kwisthout2009computational}. \citet{fox2023imperfect} discuss how algorithms such as this one will only be practical in settings with bounded tree-width graphs, number of agents, and action sets. We leave improving the efficiency of this algorithm to future work.

Whenever the rationality assumptions have a solution existence guarantee (e.g., if $\R=\rbr$, there is always at least one NE of the game), then Algorithm~\ref{alg:inter_query} successfully terminates. There are two special cases:
\begin{enumerate}
    \item If $\prims_0 \cup \ldots \cup \prims_j = \emptyset$, the agent is not privy to any interventions and the interventional query is fully \textit{post-policy} with respect to Agent $i$.
    \item If $\prims_0 \cup \ldots \cup \prims_j = \I$, the agent is privy to all interventions and the interventional query is fully \textit{pre-policy} with respect to Agent $i$.
\end{enumerate}

\begin{algorithm}[h!]
\caption{Calculate the result of an interventional query}
\label{alg:inter_query}
\begin{algorithmic}[1]
\State \textbf{Input:} A causal game $\model$ with rationality relation $\R$, interventions $\sI = \sI^1 \cup \ldots \cup \sI^N$, and query $\phi(\policyprof)$.
\State $(\prims_0, \ldots, \prims_m), (A_0, \ldots, A_m) \leftarrow$ \Call{decompose}{$\sI$}
\State $A' \leftarrow \emptyset$
\For{$j = 0, \dots, m$}
    \State $A \leftarrow (A_j \cup \ldots \cup A_N) \setminus A'$
    \State $\nashpolicyprof \leftarrow$ uniformly sample an $\R$-rational outcome
    \For{{$i \in A_j$}}
        \State $\Do(\Pi_{D^i} = \hat{\pi}_{D^i})$
    \EndFor
    \For{{$\prim \in \prims_j$}}
        \State $\prim(\model)$
        \If{$\prim$ acts on $V \in \decvars^i \cup \policyprofs^i$}
            \State $A' \leftarrow A' \cup \set{i}$
        \EndIf
    \EndFor
\EndFor
\State $\jointdistr^{\policyprof} (\sv) \leftarrow \prod_{V \in \vars} \jointdistr^{\policyprof} (v\mid\pa_{V})$
\State \Return $\phi(\policyprof)$
\end{algorithmic}
\end{algorithm}

\textbf{Mechanism-level side effects:} Object-level interventions can have unintuitive mechanism-level side effects. A side effect is a modification to the inter-mechanism edges in $\mec \graph$ and $\not \rightarrow$ denotes an edge removal. Proposition~\ref{prop:side_effects} formalises the side effects of an object-level intervention.

\begin{definition}[Reachability Path]
  Let $D \in \decvars^i$. We write $\R(\mecvar_V \rightarrow \Pi_D)$ to denote the set of paths that make $\mecvar_V$ $\R$-relevant to $\Pi_D$. A \textit{reachability path} is any path $p \in \R(\mecvar_V \rightarrow \Pi_D)$. That is, a non-repeating sequence of nodes $V_0, ..., V_j \in \mec{}_{\perp}\vars$ of the independent mechanised graph $\mec{}_{\perp}\graph$ s.t $V_0 = \mecvar_V$, and $V_0$ is $\R$-relevant to $\Pi_D$.
\end{definition}

\begin{proposition}[Object-level intervention side effects] \label{prop:side_effects}
An object-level intervention $\jointdistr^{\I}(x \mid \pa_X^*)$ has side effect $\mecvar_V \not \rightarrow \Pi_D$ if, $\forall$ reachability paths $p \in \R(\mecvar_V \rightarrow \Pi_D)$ we have $\exists W \in \vars \text{s.t.} (W \not \in \Pa_X^*) \text{ and } ((W \rightarrow X) \in p)$ 
\end{proposition}

That is to say, an intervention on $X$ which severs at least one edge critical to each reachability path between $\mecvar_V$ and $\Pi_D$ through $X$, will delete the corresponding edge between those mechanisms in $\mec \graph$. Similarly, if an intervention creates at least one new reachability path, it will result in the addition of a new inter-mechanism edge.

\textbf{Minimum intervention sets:} Using these observations, we formalise the minimum set of interventions required to break a causal mechanism dependency $\mecvar_V \rightarrow \Pi_D$. Since we are only interested in interventions that do not directly modify the target policy $\Pi_D$, and we recall that reachability paths are calculated on the independent mechanised graph $\mec{}_{\perp}\graph$ which contains no edges of the form $\mecvar_V \rightarrow \Pi_D$, we can restrict our attention to object-level interventions. Then, the minimum intervention set is the minimum hitting set across all reachability paths, of the variables with incoming edges that would break the dependency if removed.

\begin{definition}[Minimum intervention set] \label{def:min_inter}
The minimum set of objects to intervene on in order to break causal mechanism dependency $\mecvar_V \rightarrow \Pi_D$ is $X$ s.t. :
\begin{align*}
  &X \cap S_i \neq \emptyset \text { for all } S_i \text{ where }\\
  &S_i = \set{V \in \vars \mid \exists W \in \vars . (W\rightarrow V) \in \R(\mecvar_V \rightarrow \Pi_D)}
\end{align*}
\end{definition}

This metric measures how \textit{robust} a causal mechanism dependency is to external interventions. The size of this set is the minimum number of object-level interventions required to ensure that, under every parameterization of the game, there is no incentive for a target policy $\Pi_D$ to depend on the mechanism variable $\mecvar_V$.

\section{Causal Mechanism Design}\label{sec:CMD}

Mechanism design~\citep{intro_mech_design} aims to modify a game to satisfy a desired social outcome or agent behaviour. Current approaches~\citep{rmcp, mech_design_survey} establish error bounds on expected outcomes for particular families of games when an intervention is conducted. This section explores how our framework enables a systematic approach to causal mechanism design.

\subsection{Qualitative Specifications}

Qualitative specifications are concerned with properties of the DAG $\graph$. Consider the mechanised graph of Example~\ref{ex:job_market} shown in Figure~\ref{fig:1}. The cyclic structure between nodes $\Pi_{D^1}$ and $\Pi_{D^2}$ means the optimal policy for each agent depends on the other agent's policy.

\begin{figure}[]
    \centering
    \begin{subfigure}[b]{0.45\linewidth}
        \centering
        \resizebox{0.75\width}{!}{
        \begin{influence-diagram}
        \node (X) [] {$T$};
        \node (U1) [utility, right = of X, player1] {$U^1$};
        \node (U2) [utility, right = of U1, player2] {$U^2$};
        \node (D1) [decision, below right = 1.4cm and 0.7cm of X, player1] {$D^1$};
        \node (D2) [decision, right = of D1, player2] {$D^2$};
        \edge [red] {X} {D1};
        \edge {D1} {D2};
        \path (X) edge[red,->, bend left=45] (U2);
        \edge {X} {U1};
        \edge {D1} {U1};
        \edge {D2} {U1,U2};
        \node (X_mec) [relevancew, above = of X] {$\Theta_T$};
        \node (U2_mec) [relevancew, above = of U2] {$\Theta_{U^2}$};
        \node (D1_mec) [relevanceb, below = of D1] {$\Pi_{D^1}$};
        \node (U1_mec) [relevancew, above = of U1] {$\Theta_{U^1}$};
        \node (D2_mec) [relevanceb, below = of D2] {$\Pi_{D^2}$};
        \edge[gray] {X_mec} {X};
        \edge[red] {D1_mec} {D1};
        \edge[gray] {D2_mec} {D2};
        \edge[gray] {U1_mec} {U1};
        \edge[gray] {U2_mec} {U2};
        \node (space1) [minimum size=0mm, node distance=2mm, below = 0.7cm of D1, draw=none] {};
        \draw (X_mec) edge[gray,in=180,out=-135] (space1.center)
        (space1.center) edge[gray,->,out=0,in=135] (D2_mec);
        \node (space3) [minimum size=0mm, node distance=2mm, left = 0.7cm of D1, draw=none] {};
        \draw (U1_mec) edge[gray,in=90,out=-110] (space3.center)
        (space3.center) edge[gray,->,out=-90,in=135] (D1_mec);
        \path (D1_mec) edge[blue,->, bend right=15] (D2_mec);
        \path (D2_mec) edge[gray,->, bend right=15] (D1_mec);
        \draw (X_mec) edge[gray,->,out=-135,in=155] (D1_mec);
        \draw (U2_mec) edge[gray,->, out=-45, in=25] (D2_mec);
    \end{influence-diagram}
        }
        \caption{}
        \label{fig:1}
    \end{subfigure}
    \begin{subfigure}[b]{0.54\linewidth}
        \centering
        \resizebox{0.75\width}{!}{
        \begin{influence-diagram}
        \node (X) [] {$T$};
        \node (U1) [utility, right = of X, player1] {$U^1$};
        \node (U2) [utility, right = of U1, player2] {$U^2$};
        \node (D1) [decision, intervened, below right = 1.4cm and 0.7cm of X, player1] {$g$};
        \node (D2) [decision, right = of D1, player2] {$D^2$};
        \edge {D1} {D2};
        \path (X) edge[->, bend left=45] (U2);
        \edge {X} {U1};
        \edge {D1} {U1};
        \edge {D2} {U1,U2};
        \node (X_mec) [relevancew, above = of X] {$\Theta_T$};
        \node (U2_mec) [relevancew, above = of U2] {$\Theta_{U^2}$};
        \node (D1_mec) [relevanceb, below = of D1] {$\Pi_{D^1}$};
        \node (U1_mec) [relevancew, above = of U1] {$\Theta_{U^1}$};
        \node (D2_mec) [relevanceb, below = of D2] {$\Pi_{D^2}$};
        \edge[gray] {X_mec} {X};
        \edge[gray] {D2_mec} {D2};
        \edge[gray] {U1_mec} {U1};
        \edge[gray] {U2_mec} {U2};
        \node (space1) [minimum size=0mm, node distance=2mm, below = 0.7cm of D1, draw=none] {};
        \draw (X_mec) edge[gray,in=180,out=-135] (space1.center)
        (space1.center) edge[gray,->,out=0,in=135] (D2_mec);
        \node (space3) [minimum size=0mm, node distance=2mm, left = 0.7cm of D1, draw=none] {};
        \draw (U1_mec) edge[gray,in=90,out=-110] (space3.center)
        (space3.center) edge[gray,->,out=-90,in=135] (D1_mec);
        % \path (D1_mec) edge[gray,->, bend right=15] (D2_mec);
        \path (D2_mec) edge[gray,->, bend right=15] (D1_mec);
        \draw (X_mec) edge[gray,->,out=-135,in=155] (D1_mec);
        \draw (U2_mec) edge[gray,->, out=-45, in=25] (D2_mec);
    \end{influence-diagram}
        }
        \caption{}
            \label{fig:2}
    \end{subfigure}
 \caption{The \textit{Job Market} game with an intervention $\Do (D^1 = g)$ satisfying qualitative specification $\Pi_{D^1} \nrightarrow \Pi_{D^2}$. Mechanism-level dependencies are coloured grey. In (a), the blue edge indicates the $\rbr$-relevance of $\Pi_{D^1}$ to $\Pi_{D^2}$ and red edges indicate an active reachability path. In (b), the intervention $\Do (D^1 = g)$ breaks all the reachability paths which made $\Pi_{D^1}$ relevant to $\Pi_{D^2}$.}
\end{figure}

A specification may require a decision rule to be \emph{independent} of a particular mechanism. For example, we may want the firm's hiring policy to be independent of the worker's policy when deciding to go to university. That is, we wish to break the causal dependency $\Pi_{D^1} \rightarrow \Pi_{D^2}$. When this edge does not exist, it means that the firm's optimal policy does not depend on the worker's policy for \emph{any} parameterisation of the game. There are two ways to satisfy this specification.
\begin{enumerate}
  \item Intervene on the target policy $\Pi_{D^2}$ with $r_{D^2}^{\I}: \dom(\Pa_{\Pi_{D^2}}^*) \rightarrow \dom(\Pi_{D^2})$ such that $\Pi_{D^1} \not \in \Pa_{\Pi_{D^2}}^*$, e.g., the hard intervention $\Do (\Pi_{D^2} = \delta(D^2, \lnot j))$ which forces the firm to reject every candidate.
  \item Perform an object-level intervention to appropriately change the reachability structure of the graph. There are two paths that make $\Pi_{D^1}$ $\rbr$-relevant to $\Pi_{D^2}$. The first is $\Pi_{D^1} \rightarrow D^1 \leftarrow T \rightarrow U^2$ when conditioned on $\set{D^2, D^1}$ since $\Pi_{D^1} {\not\perp}_{\meczero{\graph}}~\utilvars^2 \cap \Desc_{D^2} \mid D^2, \Pa_{D^2}$. The second is $\Pi_{D^1} \rightarrow D^1$ conditioned on $\emptyset$ since $\Pi_{D^1} {\not\perp}_{\meczero{\graph}}~\Pa_{D^2}$. 
\end{enumerate}

Option 1 is somewhat against the ``spirit'' of mechanism design, which seeks to induce certain behaviours or social outcomes without undermining an agent's ability to make their own rational choices. However, the intervention on $\Pi_{D^2}$ changes properties of the target agent's behaviour by directly intervening on their policy.

Option 2 requires both active paths to be blocked. This can be achieved through an intervention on $D^1$ of the form $\jointdistr^{\I}(d^1 \mid \pa_{D^1}^*)$ where $\Pa_{D^1} = \emptyset$. An example would be $\Do (D^1 = g)$, shown in Figure~\ref{fig:2}. The cyclic structure between $\Pi_{D^1}$ and $\Pi_{D^2}$ is broken, and the firm has no incentive to consider the worker's policy.

\paragraph{Hiding and Revealing Information}

Another qualitative specification is to hide or reveal certain information to agents. This can be done by modifying the incoming edges into a decision variable. Suppose we wish to hide the agent's decision of going to university from the firm in Example~\ref{ex:job_market}. Intervention $\Del (D^1 \rightarrow D^2)$ satisfies this but has mechanism level side-effect $\Pi_{D^1} \not \rightarrow \Pi_{D^2}$.

A more general question is: under what circumstances is it possible to hide or reveal information \textit{without} changing the mechanism dependency structure? The mechanism dependency structure is retained if, for any pair of mechanisms with active reachability paths, at least one path is not broken, and if, for any pair of mechanisms with no active reachability paths, no new paths are introduced. We call an intervention that preserves this structure \textit{incentive invariant}.

\begin{definition}[Incentive Invariance] \label{def:hide_reveal}
  An intervention $\I$ is incentive invariant if $\forall~\mecvar_V \in \mecvars, \forall~\Pi_D \in \policyprofs$, we have pre-intervention reachability paths $\rbr(\mecvar_V \rightarrow \Pi_D)$ and post-intervention reachability paths $\R^{\BR*}(\mecvar_V \rightarrow \Pi_D)$ s.t.
  \[
    \lvert \R^{\BR*}(\mecvar_V \rightarrow \Pi_D) \rvert 
    \begin{cases}
      = 0 \text{, if } \lvert \rbr(\mecvar_V \rightarrow \Pi_D) \rvert = 0 \\
      > 0 \text{, if } \lvert \rbr(\mecvar_V \rightarrow \Pi_D) \rvert > 0
    \end{cases}
  \]
\end{definition}

\subsection{Quantitative Specifications}

Quantitative specifications describe bounds on game outcomes. For example, they specify that the expected payoff of an agent is greater than some value, that the probability of a certain event occurring is within some range, or that some social welfare metric is maximised. There are many ways of satisfying these specifications, including the modifications to the object-level and mechanism-level dependencies discussed previously. Here, we focus on interventions that directly modify the chance or utility variables of the game or the corresponding mechanism-level parameter variables.

\textbf{Taxes and Rewards:} One way of inducing certain behaviour is to modify the payoffs for certain outcomes through taxes and rewards. The inter-mechanism edges reveal which utility variables, under some parameterisation of the game, can affect an agent's $\R$-rational choice of policy. For example, consider the Prisoner's Dilemma, where the prisoners are restricted to pure policies. The mechanised graph for this is the same as in Figure~\ref{fig:commitment_before}. Suppose we are a sadistic game designer who wants to maximise the jail time of both prisoners by any means. We can do this in several ways by modifying the usual payoffs of the game (Table \ref{tab:prisoners_dilemma}).

\begin{table}[h!] 
    \centering
    \caption{The payoffs in the Prisoner's Dilemma.}
    \begin{tabular}{cc|c|c|}
    & \multicolumn{1}{c}{} & \multicolumn{2}{c}{Agent 2 (Bob)}\\
    & \multicolumn{1}{c}{} & \multicolumn{1}{c}{Cooperate}  & \multicolumn{1}{c}{Defect} \\\cline{3-4}
    \multirow{2}*{Agent 1 (Alice)}  & Cooperate & (-1, -1) & (-5, 0) \\\cline{3-4}
    & Defect & (0, -5) & (-2, -2)\\\cline{3-4}
    \end{tabular}
    \label{tab:prisoners_dilemma}
\end{table}

One way is to decrease the payoffs of the NE $(D, D)$ (the $\rbr$-rational outcome). Typically, mutual defection leads to a total jail time of 4 years. Changing $(D, D)$ to $(-3, -3)$ yields 6 years total. In fact, we could change the payoff of $(D, D)$ to $(-5 + \varepsilon , -5 + \varepsilon)$ for arbitrary $\varepsilon > 0$ yielding $-10 + 2\varepsilon$ years total while retaining $(D, D)$ as the single pure policy NE. Since this intervention does not affect the best-response of either prisoner, it doesn't matter whether this intervention is implemented as a fully pre-policy, fully post-policy, or interleaved intervention. The prisoners will play the same policies and the same NE will be reached.

Another way is by \textit{taxing} the existing rational outcome. In fact, by introducing a partially visible intervention, we can also \textit{reward} certain behaviours to satisfy the specification. If Alice believes that mutual cooperation will lead to both agents going free, while Bob believes they will suffer 1 year each, then $(C, D)$ becomes a new NE. This can be implemented in one of two ways.

\begin{example}[Partially Visible Rewards] \label{ex:rewards}
We want to influence one prisoner in the Prisoner's Dilemma to cooperate. C and D indicate the pure policies ``cooperate'' and ``defect'' respectively. Let $\prims = \set{\Do (\Theta_{U^1} = \theta_{U^1}^*), \Do (\Theta_{U^2} = \theta_{U^2}^*)}$ be the set of primitive interventions with
\begin{equation*}
  \theta_{U^1}^*(u^1 \mid d^1, d^2) = 
  \begin{cases}
    \delta(u^1, 0) & \hspace{-1em} \text{if } d^1 = C \text{ and } d^2 = C \\
    \theta_{U^1}(u^1 \mid d^1, d^2) & \text{otherwise}
  \end{cases}
\end{equation*}
\noindent
and similar for $\theta_{U^2}^*$. Let $\prims'$ be the inverse. We make $\prims$ visible to only Alice in one of two ways:
\begin{enumerate}
  \item $\prims_0 = \emptyset,~\prims_1 = \prims,~A_0=\set{Bob},~A_1=\set{Alice}$. This changes the payoffs of $(C, C)$ so both prisoners go free, but only Alice is informed of the change (the intervention is hidden from Bob).
  \item $\prims_0=\prims,~\prims_1=\prims',~A_0=\set{Alice},~A_1=\set{Bob}$. This informs Alice that $(C, C)$ will lead to both prisoners going free but reverses this intervention between Alice's and Bob's policy choices, so it deceives Alice into believing an intervention has taken place.
\end{enumerate}
In either case, Alice believes there are two possible NE: $(C, C)$ and $(D, D)$, whereas Bob believes there is only one $(D, D)$. So, if Alice plays uniform distribution over her best responses $C$ and $D$, and Bob plays $\delta(D^2, D)$, the expected total jail time is $\expect_{\nashpolicyprof}[U^1 + U^2] = \frac{1}{2} (0 - 5) + \frac{1}{2} (-2 - 2) = -4.5$
Therefore, adding total reward of 2 to game outcome reduces the expected total payoff by 0.5.
\end{example}

\textbf{Environment Modifications:}
Another way of satisfying a quantitative specification is to modify the chance variables. In Example \ref{ex:job_market}, the worker's temperament can affect both agents' policies. Suppose we want to maximise the probability of the worker getting a job and $\R=\rbr$, i.e., we want the probability of the worker getting the job under any NE of the intervened game to be at least as high as the probability of the worker getting the job under any NE of the original game. Formally, an intervention $\I$ satisfies this specification if
\[
  \min_{\nashpolicyprof \in \rbr(\model_{\I})} \jointdistr^{\nashpolicyprof}(j) \geq \max_{\policyprof \in \rbr(\model)} \jointdistr^{\policyprof}(j)
\]

One way to do this is to change the location of the game to \textit{EffortVille} where everyone is hard-working. This corresponds with a mechanism-level $\Do (\Theta_T = \delta(T, h))$ or object-level $\Do (T = h)$ intervention. In this case, the CG has three pure policy $\rbr$-rational outcomes (NE).
\begin{enumerate}
  \item The worker always chooses $g$. The hiring system always chooses $j$. So $\exputility_{\policyprof}[\utilvars^1] = 5$ and $\exputility_{\policyprof}[\utilvars^2] = 3$
  \item The worker always chooses $g$. The hiring system chooses $j$ if the worker chooses $g$. Otherwise, it chooses $\lnot j$. So $\exputility_{\policyprof}[\utilvars^1] = 5$ and $\exputility_{\policyprof}[\utilvars^2] = 3$
  \item The worker always chooses $\lnot g$. The hiring system chooses $\lnot j$ if the worker chooses $g$. Otherwise, it chooses $j$. So $\exputility_{\policyprof}[\utilvars^1] = 4$ and $\exputility_{\policyprof}[\utilvars^2] = 3$
\end{enumerate}
In all these NEs, the probability of the worker getting a job is 1, so it satisfies the specification. Also, the first two NEs of the intervened game maximise utilitarian and egalitarian social welfare. The identity intervention, which does not change the game, would also have satisfied this specification because all three pure NEs of the original game also result in the worker getting a job with probability 1. However, this is not the case under NEs with stochastic policies. The original game has the following NE: If the worker is hardworking, she chooses $g$ with probability $\frac{1}{2}$. If she is lazy, she always chooses $\lnot g$. If she chooses $g$, the firm always chooses $j$. If she chooses $\lnot g$, the firm chooses $j$ with probability $\frac{4}{5}$ .
This yields a $\frac{9}{10}$ probability of the worker getting a job. On the other hand, the NEs of the intervened game are
\begin{enumerate}
  \item The worker always chooses $g$, The hiring system chooses $j$ if the worker chose $g$, otherwise it chooses $j$ with any probability $q_1 \in [0,1]$.
  \item The worker always chooses $\lnot g$, The hiring system chooses $j$ if the worker chose $\lnot g$, otherwise it chooses $j$ with any probability $q_2 \in [0,\frac{4}{5}]$.
\end{enumerate}
So, the worker gets a job with probability 1 either way. Therefore, the intervention of \textit{EffortVille} satisfies the specification in the stochastic policy case, whereas the identity intervention does not.
In our intervention framework, we can model \textit{EffortVille} with primitive intervention set $\prims_0 = \set{\Do (T=h)}$ and $A_0 = \set{1, 2}$ since we want the intervention to be fully pre-policy, allowing both agents to adapt their policies accordingly. Note, however, that it is typically not possible for game designers to intervene on the chance variables of the game as these are usually used to represent `moves by nature'. For example, a government may be able to intervene on utility variables by taxing or rewarding workers and firms, but it is unlikely that they can affect the underlying temperament of the workers.

\section{Commitment}\label{sec:commit}
Interventions on decision and decision rule variables enable us to reason about \textit{commitment}. In some games, it is possible for the first moving agent, the \textit{leader}, to gain a strategic advantage over others, called \textit{followers}, by \textit{committing} to a policy before the game begins; the leader can sometimes influence the follower's incentives by revealing private information about their policy. The simplest example is a \textit{Stackelberg game} consisting of one leader and follower. 

We use an example from \citep{letchford2010computing}, which shares the same game graph as in Figure \ref{fig:commitment_before} with Agent 1 (2) the leader (follower) and with $\dom(D^1)=\{T,B\}$ and $\dom(D^2)=\{L,R\}$. The utility parameterization is shown in Table~\ref{fig:stack-normal}.
Pre-commitment, Action $T$ strictly dominates $B$ so $(T,L)$ is a unique NE and $\exputility_{\policyprof}[\utilvars^1] = 2$. However, by committing to the pure policy $B$, the leader incentivises the follower to play $R$ and so $\exputility_{\policyprof}[\utilvars^1] = 3$. Note, in this case, the result of commitment is also a Pareto improvement over the original NE (i.e., Stackelberg commitment can also improve social welfare).

Causal games naturally represent commitment with a simple causal intervention on node $\Pi_{D^1}$ to be fixed to the committed policy $\pi_1$ (shown in Figure~\ref{fig:commitment_after}). The payoff received by the leader after commitment can be calculated through backward induction on the graph \citep{hammond2021equilibrium}. 

By representing commitment as a causal intervention, we can prove whether a particular commitment can be beneficial for the leader. In the stochastic policy setting, the follower will still play a pure policy since she has no incentive to randomise after the leader's commitment; she is effectively playing a single-agent decision game. The leader's expected utility after committing to policy $\pi_1 = \frac{1}{2} T + \frac{1}{2} B$ is 3.5 (in Appendix~\ref{app:commitment_after}). This is greater than the expected utility of 2 in the original game's unique NE, which benefits the leader.

A partially visible commitment is represented naturally in our new framework of causal interventions. Specifically, a commitment that occurs in the primitive intervention set $\prims_{j}$ can be revealed to all agents in $A_j, A_{j+1}, \ldots, A_{m}$. For example, if we have $\prims_0 = \emptyset$, $\prims_1 = \set{\Do(\Pi_1 = \delta(D^1, T))}$, $A_0 = \set{1}$, and $A_1 = \set{2}$ then Agent 1 commits to playing `B'' and reveals it to Agent 2. Algorithm~\ref{alg:inter_query} reveals that Agent 2 will play $\delta(D^2, R)$ (i.e. always playing ``R'') and Agent 1 will receive a payoff of $3$. However, if Agent 1's commitment to playing $\delta(D^1, B)$ is kept private from Agent 2, then we have $\prims_0 = \emptyset$, $\prims_1 = \set{\Do(\Pi_1 = \delta(D^1, B))}$, $A_0 = \set{1, 2}$, and $A_1 = \emptyset$. Then, Agent 2 will always play `L', in accordance with the NE of the original system, calculated after $\prims_0$, giving Agent 1 a payoff of $2$. In Appendix~\ref{app:optimal}, we show that we can also use the intervened graph to calculate the \textit{optimal} policy to commit to.

\begin{figure}[]
    \centering
    \begin{subfigure}[b]{0.34\linewidth}
        \centering
        \resizebox{0.6\width}{!}{
        \begin{influence-diagram}
            \node (D1) [decision, player1] {$D^1$};
            \node (D2) [decision, player2, right of=D1] {$D^2$};
            \node (U1) [utility, player1, below of=D1] {$U^1$};
            \node (U2) [utility, player2, below of=D2] {$U^2$};
            \node (P1) [relevanceb, above of=D1] {$\Pi_{D^1}$};
            \node (P2) [relevanceb, above of=D2] {$\Pi_{D^2}$};
            \node (M1) [relevancew, below left of=U1] {$\Theta_{U^1}$};
            \node (M2) [relevancew, below right of=U2] {$\Theta_{U^2}$};

            \edge {D1} {U1};
            \edge {D2} {U2};
            \edge {D1} {U2};
            \edge {D2} {U1};
            \edge[gray] {P1} {D1};
            \edge[gray] {P2} {D2};
            \edge[gray] {M1} {U1};
            \edge[gray] {M2} {U2};
            \path (M1) edge [->, gray, bend left] (P1);
            \path (M2) edge [->, gray, bend right] (P2);
            \path (P1) edge [->, gray, bend left] (P2);
            \path (P2) edge [->, gray, bend left] (P1);
            
        \end{influence-diagram}
        }
        \caption{}
                \label{fig:commitment_before}
    \end{subfigure}
    \begin{subfigure}[b]{0.34\linewidth}
        \centering
        \resizebox{0.6\width}{!}{
        \begin{influence-diagram}
            \node (D1) [decision, player1] {$D^1$};
            \node (D2) [decision, player2, right of=D1] {$D^2$};
            \node (U1) [utility, player1, below of=D1] {$U^1$};
            \node (U2) [utility, player2, below of=D2] {$U^2$};
            \node (P1) [intervened,relevanceb, above of=D1] {$\Pi_{D^1}$};
            \node (P2) [relevanceb, above of=D2] {$\Pi_{D^2}$};
            \node (M1) [relevancew, below left of=U1] {$\Theta_{U^1}$};
            \node (M2) [relevancew, below right of=U2] {$\Theta_{U^2}$};

            \edge {D1} {U1};
            \edge {D2} {U2};
            \edge {D1} {U2};
            \edge {D2} {U1};
            \edge[gray] {P1} {D1};
            \edge[gray] {P1} {P2};
            \edge[gray] {P2} {D2};
            \edge[gray] {M1} {U1};
            \edge[gray] {M2} {U2};
            \path (M2) edge [->, gray, bend right] (P2);
        \end{influence-diagram}
        }
        \caption{}
                \label{fig:commitment_after}
    \end{subfigure}
    \begin{subfigure}[b]{0.3\linewidth}
        \centering
        \centering
            \resizebox{0.8\width}{!}{
\begin{tabular}{ c | c c }
      & L & R \\
      \hline
      T & (2,1) & (4,0) \\
      B & (1,0) & (3,2) \\
    \end{tabular}}
        \caption{}
        \label{fig:stack-normal}
    \end{subfigure}
 \caption{The Stackleberg game represented as mechanised causal graphs (a) pre-commitment, and (b) post-commitment, with payoff matrix (c). }
    \label{fig:}
\end{figure}

\section{Conclusion}

This work presents a sound and complete characterisation of arbitrary causal interventions in causal games. It uses this framework to evaluate and systematically modify incentive structures to satisfy qualitative and quantitative specifications, which has important applications for causal mechanism design. Solving interventional queries is computationally expensive, but we prove results and give algorithms, showing how they can be made more tractable. Finally, we focus on pedagogical examples, but demonstrating the method empirically on larger examples is an important direction for future work.

\begin{acknowledgements}
    The authors wish to thank five anonymous reviewers for their helpful comments.  Fox was supported by the EPSRC Centre for Doctoral Training in Autonomous Intelligent Machines and Systems (Reference: EP/S024050/1) and Wooldridge was supported by a UKRI
Turing AI World Leading Researcher Fellowship (Reference: EP/W002949/1).
\end{acknowledgements}

\bibliography{refs}

\newpage

\onecolumn

\title{Characterising Interventions in Causal Games\\(Supplementary Material)}
\maketitle

\appendix

\section{Proofs}
\label{app:proof}
\setcounter{theorem}{0}
\setcounter{proposition}{0}

\begin{theorem}
\label{theorem:prim}
Primitive interventions are a sound and complete formulation of causal interventions. 
\end{theorem}

\begin{proof}
We first prove soundness. This is true using the definitions of the primitive interventions. Let $\jointdistr(\sv_{\I})$ be the induced joint distribution by type 1, 3, and 4 interventions, as per the definitions, and $\jointdistr(\sv_{\I}) = \jointdistr(\sv)$ for type 2 interventions. Also, let $\R^*$ be the induced rationality relations by type 2 interventions and $\R^* = \R$ for type 1, 3, and 4 interventions. Then, the effect of a primitive intervention $\mathrm{P}$ of any type is the function $\set{\jointdistr^{\policyprof}(\sv)}_{\policyprof \in \R} \mapsto \set{\jointdistr^{\policyprof}(\sv_{\I})}_{\policyprof \in \R^*}$ which is a valid causal intervention.

 We now turn to completeness by showing that any intervention $\I$ can be decomposed into a set of equivalent primitive interventions $\prims$. That is to say, the state of the game after applying intervention $\I$ is equivalent to the state of the game after applying interventions $\prims$. Suppose,
\begin{align*}
    \I(\set{\jointdistr^{\policyprof}(\sv)}_{\policyprof \in \R}, \R) &= (\set{\jointdistr^{\policyprof}(\sv_\I)}_{\policyprof \in \R^*}, \R^*)\\
    \text{s.t. } \jointdistr^{\policyprof}(\sv) &= \prod_{V \in \vars} \jointdistr^{\policyprof} (v\mid\pa_{V})\\
    \text{and } \jointdistr^{\policyprof}(\sv_\I) &= \prod_{V_\I \in \vars_\I} \jointdistr^{\policyprof} (v_\I\mid\pa_{V})
\end{align*}
Then the trivial decomposition of $\I$ is $| \sV_\I |$ type 3 interventions which multiply the joint distribution by each of $\jointdistr^{\policyprof} (v_\I\mid\pa_{V})$, followed by $| \sV |$ type 4 interventions that divide the joint distribution by each of $\jointdistr^{\policyprof} (v\mid\pa_{V})$, then $| \R^* |$ type 2 interventions that attach the appropriate rationality relation to each mechanism variable. 

Of course, more concise decompositions are possible if there is overlap between $\R$ and $\R^*$ as well as overlap between $\set{\Pa_V}_{V \in \sV}$ and $\set{\Pa_{V_\I}}_{V_\I \in \sV_\I}$.
\end{proof}

\begin{proposition}[Object-level intervention side effects] \label{prop:side_effects}
An object-level intervention $\jointdistr^{\I}(x \mid \pa_X^*)$ has side effect $\mecvar_V \not \rightarrow \Pi_D$ if, $\forall$ reachability paths $p \in \R(\mecvar_V \rightarrow \Pi_D)$ we have $\exists W \in \vars \text{s.t.} (W \not \in \Pa_X^*) \text{ and } ((W \rightarrow X) \in p)$ 
\end{proposition}

\begin{proof}
An intervention $\jointdistr^{\I}(x \mid \pa_X^*)$ has side effect $\mecvar_V \not \rightarrow \Pi_D$ if in the intervened graph there are no reachability paths from $\mecvar_V$ to $\Pi_D$. This means at least one causal arrow is broken in each such reachability path in the original graph. An object-level intervention on $X$ breaks only the causal arrows $W \rightarrow X$ where $W \in \Pa_X$ but $W \notin \Pa_X^*$.
\end{proof}

\begin{theorem}[Decomposition of Intervention Sets] \label{thm:decomp}
For any set of interventions $\sI$, where $\sI^i \subseteq \sI$ is the subset of interventions visible to agent $i$, there are primitive intervention sets $\prims_0, \ldots, \prims_{m}$, such that
\begin{equation} \label{eq:ordered_prims}
     \forall i~\exists j \in \set{0,\ldots,m} : \sI^i(\model)= (\prims_j \circ \prims_{j-1} \ldots \circ \prims_{0})(\model)
\end{equation}
\end{theorem}

\begin{proof}\label{proof:decomposition}
We show there is a set of primitive intervention sets that satisfy Theorem \ref{thm:decomp} for any set of interventions $\sI^i$ by constructing an example. We use the notation $\prims(\I)$ to denote the primitive decomposition of $\I$ as shown in the proof of Theorem \ref{theorem:prim}. Then, $\prims^i = \cup_{\I \in \sI^i} \prims(\I)$ are the primitive interventions equivalent to each agent's visible interventions.  Consider an arbitrary ordering of $\prims^i = \prim_0^i, \ldots, \prim_k^i$. Let $\invprim_k^i$ denote the inverse of $\prim_k^i$.  The construction is as follows.
\begin{align*}
    \prims_0 &= \prims^0\\
    \prims_j &= \prim_k^j \circ \ldots \circ \prim_0^j \circ \invprim_0^{j-1} \circ \ldots \circ \invprim_k^{j-1} \text{ for } j \in 1, \ldots, N\\
    A_0 &= \emptyset\\
    A_j &= \set{j} \text{ for } j \in 1, \ldots, N
\end{align*}
where $\prims^0$ are the fully pre-policy interventions visible to all agents. In this construction, $A_j$ are singleton sets (except $A_0$) so we have $m = N$. For all $i$, let $j = i$. Then, we make an inductive argument. The base case $\sI^0(\model) = \prims^0(\model) = \prims_0(\model)$ holds by definition of $\prims^0$. Assuming $\sI^{i-1}(\model)= (\prims_{j-1} \circ \prims_{j-2} \ldots \circ \prims_{0})(\model)$, we have
\begin{align*}
    \sI^i(\model) &= \prims^i(\model)\\
    &= (\prims^i \circ \invprims^{i-1} \circ \prims^{i-1})(\model)\\
    &= (\prims_j \circ \prims^{i-1})(\model)\\
    &= (\prims_j \circ \sI^{i-1})(\model)\\
    &= (\prims_j \circ \prims_{j-1} \ldots \circ \prims_{0})(\model)
\end{align*}
So, this assignment of primitive intervention sets satisfies Theorem~\ref{thm:decomp}. Algorithm \ref{alg:inter_query} explicitly shows how this construction is used to calculate interventional queries.
\end{proof}

\section{Commitment}

\subsection{Expected Utility after Commitment}\label{app:commitment_after}
We first show that the expected utility to agent 1 is 3.5 after she commits to policy $\pi_1$, picking between $T$ and $B$ with equal probability.

Let $\I = \set{\Do(\Pi_1 = \pi_1)}$ and fix $\policyprof \in \policyprofs$. We use $\jointdistr^{\I}(X)$ as shorthand for $\jointdistr^{\policyprof}(X_{\I})$, and $\expect_{\I}$ as shorthand for $\expect_{\policyprof}[U_{\I}]$. Then
\begin{align*}
  \expect_{\I} [U^1] &:=  \sum_{u^1 \in \mathit{dom}(U^1)} u^1 \jointdistr^{\I}(u^1) \label{eq:u1-stack} \tag{E1}\\
  &= 2 \cdot \jointdistr^{\I}(D^1 = T \mid \pi_1) \jointdistr^{\I}(D^2 = L \mid \Pi_{D^2})\\ 
  & \quad + 4 \cdot \jointdistr^{\I}(D^1 = T \mid\pi_1) \jointdistr^{\I} (D^2 = R \mid \Pi_{D^2})\\ 
  & \quad + 1 \cdot \jointdistr^{\I}(D^1 = B \mid \pi_1) \jointdistr^{\I} (D^2 = L \mid \Pi_{D^2})\\ 
  & \quad + 3 \cdot \jointdistr^{\I}(D^1 = B \mid \pi_1) \jointdistr^{\I} (D^2 = R \mid \Pi_{D^2})\\
  \jointdistr^{\I}(D^2 = L \mid \Pi_{D^2}) &= \begin{cases}
    1 & \text{if } 0.5 \cdot U^2(2,1) + 0.5 \cdot U^2(1,0) \\ & \quad > 0.5 \cdot U^2(4,0) + 0.5 \cdot U^2(3,2)\\
    0 & \text{otherwise}
  \end{cases}\\
  &= \begin{cases}
    1 & \text{if } 0.5 > 1 \\
    0 & \text{otherwise}
  \end{cases}\\
  &= 0\\
  \text{Similarly, } \jointdistr(D^2 = R \mid \Pi_{D^2}) &= 1\\
  \implies \expect_{\I} [U^1] &= 4 \cdot 0.5 + 3 \cdot 0.5 = 3.5
\end{align*}

\subsection{Optimal Stochastic Behavioural Policy}
\label{app:optimal}


Let agent 1 have policy $\pi_1$ where she plays $T$ with probability $p$ and agent 2 have policy $\pi_2$ where she plays $L$ with probability $q$. Then the optimal policy $\hat{\pi}_1 = \hat{p} T + (1 - \hat{p}) B$ is given by:
\begin{align*}
 q &= \begin{cases}
    1 & \text{if } p > 2(1-p)\\
    0 & \text{otherwise}
  \end{cases}\\
  &= \begin{cases}
    1 & \text{if } p > \frac{2}{3}\\
    0 & \text{otherwise}
  \end{cases}\\
  \implies
 \hat{p} &= \argmax_p \expect_{\I} [U^1] \label{eq:u1-opt} \tag{E2}\\
 &= \argmax_p (2pq + 4p(1-q) + (1-p)q + 3(1-p)(1-q))\\
 &= \argmax_p (p - 2q + 3)\\
 &= \argmax_p \left(p - 2\mathbb{I}\left(p > \frac{2}{3}\right) + 3\right)\\
 &= \frac{2}{3}
\end{align*}
\noindent
where $\I = \set{\Do(\Pi_1 = \hat{\pi}_1)}$.  

So the optimal policy for agent 1 to commit to is $\hat{\pi}_1 = \frac{2}{3}T + \frac{1}{3}B$ with payoff $\mathbb{E}_{\I} [U^1] = \frac{2}{3} + 3 = 3.\dot{6}$. This is greater than the payoff of 2 in the NE of the original game and the payoff of 3.5 in the NE induced after a commitment to $\frac{1}{2} T + \frac{1}{2} B$ as shown in the previous section.


\end{document}