\newpage
\section{Proofs of Theorems for the {\ppaAcron} model}
\label{appendixDAPAProofs}

The Distributed Affine Preferential Attachment ({\ppaAcron}) model (Section~\ref{sec:ourppamodel}) is defined as:
\begin{align}
    x_{ij}^{ } &\sim \text{Bernoulli}\big(p_{ij}^{ }\big) \label{eq:PPAbernoulliAppendix} \\
    p_{ij}^{ } &= \frac{\alphaP + \thetain d_i^{\text{in}} + \thetaout d_i^{\text{out}}}{j-2+\alphaP +\betaP} \label{eq:PPAprobAppendix}\\
    d_i^{\text{in}} &= \sum_{\BoxNodeSS{}=i+1}^{j-1} x_{i\BoxNodeSS{}}^{ }  \quad\quad
    d_i^{\text{out}} = \sum_{\BoxNodeSS{}=1}^{i-1} x_{\BoxNodeSS{}i}^{ } \label{eq:PPAdoutAppendix}    
\end{align}
where \mbox{$x_{ij} = 1$} (\mbox{$x_{ij} = 0$}) indicates an edge (no edge) between nodes $i$ and $j$.

% \begin{comment}
\novo{The parameters $\thetain$ and $\thetaout$ correspond to $\HubName$ and $\PathName$ causal arrows, respectively.  
If one uses the ordering of the nodes to orient the edges of the growing network, 
{\hub} arrows refer to the \mbox{in-degree} 
of the node $\BoxNodeS{}$ of the dyad \mbox{\dyadpair{\BoxNodeS{}}{j}} being decided 
(\ie, dyads of the type \mbox{\dyadpair{\BoxNodeS{}}{i}}, where \mbox{$\BoxNodeS{}<i$}). 
Whereas {\transitive} arrows refer to the \mbox{out-degree} of the node $\BoxNodeS{}$ 
(\ie, dyads of the type \mbox{\dyadpair{i}{\BoxNodeS{}}}, where \mbox{$i<\BoxNodeS{}$}).}
\potentiallyImprove{However, orienting the edges is not necessary, and the final statements of our theorems refer to the undirected degrees of the nodes.}
% \end{comment}

% This model exhibits three sparsity regimes (depending on $\thetain$ and $\thetaout$) and a flexible power law \novo{(depending on $\thetain$ for the ).} 
% \begin{comment}
\novo{This model exhibits three sparsity regimes (depending on $\thetain$ and $\thetaout$) and a flexible power law (depending on $\thetain$ for the constant average degree regime and on $\thetaout$ for the polynomial degree regime).}
% \end{comment}
% \begin{comment}
\potentiallyRemove{For the logarithmic average degree regime, 
which is at the transition between the constant and polynomial regimes, 
the dominant dependency 
% for the average degree 
is on the parameter $\alphaP$. 
And the expression for the power-law exponent in this transitional regime  agrees with the expression for both the constant and polynomial regimes.} 
% \end{comment}

\subsection{Proof of Theorem~\ref{thm:PPAPhaseTransition} \thmNamePPAAppendix}
% \label{appendixDAPAProofThm1}
% \subsubsection{Three sparsity regimes}
\label{appendixProof3Regimes}
% \begin{theorem}[\thmNamePPA]
% \label{thm:PPAPhaseTransitionAppendix}

Our {\ppaAcron} model exhibits three qualitatively different asymptotic behaviors for the average degree $\avgdegree$ \\[-12pt] %, 
    % depending on the value of ${\thetain+\thetaout}$ 
    % (see Fig.~\ref{fig:PPARegimes}, proof in Appendix~\ref{appendixProof3Regimes}):\\[-12pt]
    %Our {\ppaName} ({\ppaAcron}) model (\cref{eq:PPAprob,eq:PPAdin,eq:PPAdout}). 
% \end{theorem}
\vspace{-6pt}
\def\TempKern{\kern4pt}
\begin{center}
\begin{tabular}{llr}
    \vphantom{\Bigg(}constant:      &\TempKern$\displaystyle\frac{2\kern1pt\alphaP}{1-\big(\thetain+\thetaout\big)}$     &\TempKern$0<\thetain+\thetaout<1$ \\
    \vphantom{\Bigg(}logarithmic:   &\TempKern$2\kern1pt\alphaP \log\big(n\big) + C$                            &\TempKern$\thetain+\thetaout=1$ \\
    \vphantom{\Bigg(}polynomial:    &\TempKern$C \times n^{\thetain+\thetaout-1}$                     &\TempKern$1<\thetain+\thetaout<2$
\end{tabular}
\end{center}
%%%******
% The parameters $\thetain$ and $\thetaout$ correspond to $\HubName$ and $\PathName$ causal arrows, respectively. 
% If one uses the ordering of the nodes to orient the edges of the growing network, 
% {\hub} arrows refer to the \mbox{in-degree} 
% of the node $\BoxNodeS{}$ of the dyad \mbox{\dyadpair{\BoxNodeS{}}{j}} being decided 
% (\ie, dyads of the type \mbox{\dyadpair{\BoxNodeS{}}{i}}, where \mbox{$\BoxNodeS{}<i$}). 
% Whereas {\transitive} arrows refer to the \mbox{out-degree} of the node $\BoxNodeS{}$ 
% (\ie, dyads of the type \mbox{\dyadpair{i}{\BoxNodeS{}}}, where \mbox{$i<\BoxNodeS{}$}). 
% \footnote{Albeit not necessary, 
% due to the ordering of the nodes in the growing network,
% the presence of a dyad (\ie, an edge) can be thought as an arrow with the newer node as the tail and the older node as the head, or likewise as a direct edge from the newer node to the older node. 
% {\hub} and {\transitive} describe how dyads with different tail nodes (\ie, newer nodes) can directly influence each other, 
% and the case where the dyads that have the same tail node directly influence each other is described by {\forward} \textit{or} {\backward}.\label{footnotedirection}} 
% \novo{The parameters $\thetain$ and $\thetaout$ correspond to $\HubName$ and $\PathName$ causal arrows, respectively.  
% If one uses the ordering of the nodes to orient the edges of the growing network, 
% {\hub} arrows refer to the \mbox{in-degree} 
% of the node $\BoxNodeS{}$ of the dyad \mbox{\dyadpair{\BoxNodeS{}}{j}} being decided 
% (\ie, dyads of the type \mbox{\dyadpair{\BoxNodeS{}}{i}}, where \mbox{$\BoxNodeS{}<i$}). 
% Whereas {\transitive} arrows refer to the \mbox{out-degree} of the node $\BoxNodeS{}$ 
% (\ie, dyads of the type \mbox{\dyadpair{i}{\BoxNodeS{}}}, where \mbox{$i<\BoxNodeS{}$}).}
% \potentiallyImprove{However, orienting the edges is not necessary, and the final statements of our theorems refer to the undirected degrees of the nodes.}


\novo{We now derive the expressions for the average degree in the three regimes, 
starting with the constant regime.} 
\novo{To simplify notation in our derivations, 
we will use $n$ for both the step/iteration of the model and the number of nodes.  
% on our derivations.
% \footnote{\potentiallyRemove{Indeed, although this model is parallelizable, one can always simulate it sequentially with a single node arriving at each step.}}
\potentiallyRemove{(Indeed, although this model is parallelizable, one can always simulate it sequentially with a single node arriving at each step.)}
}
% \potentiallyRemove{Indeed, although this model is parallelizable, one can always simulate it sequentially with a single node arriving at each step.}
 
\def\logTIGHT{\log\kern-1pt}
\def\timesLOOSE{\kern1pt\times\kern1pt}
\def\ConstOne{C_1^{ }}
\def\ConstTwo{C_2^{ }}
\subsubsection{Constant degree regime: \protect{\textrm{$0\leq\thetain +\thetaout <1$}}}
% ***maybe quick comment that both thetas equal zero is ER
In this regime, the average degree converges to a constant: 
\begin{equation}
    \avgdegree = \frac{2\kern1pt\alphaP}{1-(\thetain+\thetaout)}  + \littleO{1} \label{eq:PPAavgdegreeSumThetaLess1}
\end{equation}

% \begin{comment}
\potentiallyRemove{For a node $j$, its in-degree $\din_j$ and out-degree $\dout_j$ are}
\potentiallyRemove{
\begin{align}
\din_j = \sum_{k=j+1}^{n} x_{jk} \kern1cm \text{and} \kern1cm \dout_j = \sum_{i=1}^{j-1} x_{ij}
\end{align}
}
% \end{comment}
After node $n$ has decided all its connections, 
the total number of edges in the network is
\begin{align}
    E(n) = \sum_{i=1}^{n} \din_i = \sum_{i=1}^n \dout_i
\end{align}
The expected number of edges added at each step
% \footnote{To simplify notation, here, we use $n$ for both the step/iteration of the model and the number of nodes.} 
is
%(indeed, although this model is parallelizable, one can always simulate it sequentially with a single node arriving at each step).} $n+1$ is
\begin{align}
    % \big\langle E(n+1) - E(n) | E(n) \big\rangle 
     \big\langle E(n+1) - E(n)  \big\rangle 
    &= \sum_{i=1}^{n} \frac{\alphaP + \thetain \din_i + \thetaout \dout_i}{n + \alphaP + \betaP - 1} \nonumber \\
    &= \frac{\alphaP n +\big(\thetain + \thetaout\big) E(n)}{n + \alphaP+ \betaP - 1} \label{eq:EDotOfN}
\end{align}
% \novo{To simplify notation, here, we use $n$ for both the step/iteration of the model and the number of nodes.}
% \novo{To simplify notation, here, we use $n$ for both the step/iteration of the model and the number of nodes.}

We make an ansatz of constant average degree 
\begin{align}
    \big\langle E(n) \big\rangle = \ConstOne \timesLOOSE n + g(n) \label{eq:ConstantDegreeAnsatz}
\end{align}
\potentiallyImprove{where ${g(n) = \littleO{n}}$ is subdominant.}  

We will first solve for $\ConstOne$ to obtain the asymptotic average degree ${\langle d \rangle = 2\ConstOne}$,
% \footnote{
% \potentiallyRemove{As degree equals in-degree plus out-degree, \mbox{$ d = \din_i  + \dout_i $}.}
% }
then we will verify our assumption that ${g(n) = \littleO{n}}$.  

Taking the expectation of \eqref{eq:EDotOfN}, 
\begin{align}
    \big\langle E(n+1) \big\rangle - \big\langle E(n) \big\rangle &= \frac{\alphaP n +\big(\thetain + \thetaout\big) \big\langle E(n) \big\rangle}{n + \alphaP + \betaP - 1} \label{eq:ConstantDegreeAfterExpectation}
\end{align}
using our ansatz \eqref{eq:ConstantDegreeAnsatz},
\begin{align}
     g(n+1) - g(n) + \underbrace{\ConstOne = \Bigg( \alphaP + \big(\thetain + \thetaout\big) \bigg(\ConstOne}_{\text{equate these constant terms}} + \frac{g(n)}{n} \bigg) \Bigg) \timesLOOSE \frac{n}{n + \alphaP + \betaP - 1} \label{eq:ConstantDegreeAfterAnsatz}
\end{align}
% **
and equating the \potentiallyImprove{$\bigTh{1}$ (constant) terms} to solve for $\ConstOne$, 
\begin{align}
    \ConstOne &= \alphaP + \big(\thetain + \thetaout\big) \ConstOne \\
    &= \frac{\alphaP}{1-\big(\thetain + \thetaout\big)} \label{eq:ConstantDegreeSolveForC}
\end{align}
we obtain the asymptotic average degree claimed in \eqref{eq:PPAavgdegreeSumThetaLess1}.  

To verify our ansatz ${g(n) = \littleO{n}}$, substitute \eqref{eq:ConstantDegreeSolveForC} into \eqref{eq:ConstantDegreeAfterAnsatz}
\begin{align}
    \underbrace{g(n+1) - g(n) = \frac{\big(\thetain + \thetaout\big) g(n)}{n}}_{\text{equate these dominant terms}} - \frac{\ConstOne\big(\alphaP+\betaP-1\big)}{n} + \biggerO{\tfrac{g(n)}{n^2}}
\end{align}
to conclude that ${g(n) = \bigO{n^{\thetain+\thetaout}}}$.  

So our ansatz ${g(n) = \littleO{n}}$ is valid for ${\thetain+\thetaout<1}$, 
which incidentally is precisely when equation~\eqref{eq:PPAavgdegreeSumThetaLess1} is physically meaningful.  

% and separating the $\bigO{1}$ terms from the $\littleO{1}$ terms, we have
% \begin{align}
%     \bigO{1}:& \qquad C = \alphaP + \big(\thetain + \thetaout\big) C \label{eq:ConstantDegreeCTerms}\\
%     \bigO{1/n}:& \qquad g(n+1) - g(n) = -\frac{\alpha+\beta-1}{n} + \big(\thetain + \thetaout\big) \frac{g(n)}{n} + \bigO{n^{-2}}\label{eq:ConstantDegreeGTerms}
% \end{align}

\subsubsection{Logarithmic degree regime: \textrm{\protect$\thetain + \thetaout=1$}}

As ${\thetain + \thetaout \rightarrow 1}$, the average degree predicted by \eqref{eq:PPAavgdegreeSumThetaLess1} diverges, 
and when ${\thetain + \thetaout = 1}$, the average degree is no longer bounded.  
Instead, it grows logarithmically in $n$:
\begin{equation}
    % \avgdegree = \alpha\logTIGHT\big(n\big) \timesLOOSE \Big(1+\littleO{1}\Big) \label{eq:PPAavgdegreeSumThetaEqual1}
    \avgdegree = 2\kern1pt\alphaP\logTIGHT\big(n\big) + C + \littleO{1} \label{eq:PPAavgdegreeSumThetaEqual1}
\end{equation}


Similar to equation~\eqref{eq:ConstantDegreeAnsatz},
we make an ansatz but now of logarithmic average degree 
\begin{align}
    \big\langle E(n) \big\rangle = \ConstOne \timesLOOSE n \log n + g(n) \label{eq:LogDegreeAnsatz}
\end{align}
where ${g(n) = \littleO{n \log n}}$ is subdominant.  
% The expected change in number of edges is given by

\potentiallyImprove{The change in} ${n \log n}$ is approximately
\begin{align}
\big(n+1\big)\logTIGHT\big(n+1\big) - n\logTIGHT\big(n\big)=\logTIGHT\big(n\big) + 1 + \biggerO{\tfrac{1}{n}}.  
\end{align}
Substituting \potentiallyImprove{this} into equation~\eqref{eq:ConstantDegreeAfterExpectation}, %${n\logTIGHT\big(1+\frac{1}{n}\big)=1+\littleO{1}}$
\begin{align}
     % g(n+1) - g(n) + \ConstOne \timesLOOSE \Bigg( \logTIGHT\big(n+1) + n\logTIGHT\bigg(\frac{n+1}{n}\bigg) \Bigg) = \Bigg( \alpha + \big(\thetain + \thetaout\big) \bigg(\ConstOne\kern1pt\logTIGHT\big(n\big) + \frac{g(n)}{n} \bigg) \Bigg) \times \frac{n}{n + \alpha + \beta - 1} \\
     g(n+1) - g(n) + \underbrace{\ConstOne \timesLOOSE \bigg( \logTIGHT\big(n) + 1 \bigg) = \Bigg( \alphaP + \big(\thetain + \thetaout\big) \bigg(\ConstOne\kern1pt\logTIGHT\big(n\big)}_{\text{equate these logarithmic and constant terms}} + \frac{g(n)}{n} \bigg) \Bigg) \timesLOOSE \bigg(1+\biggerO{\tfrac{1}{n}}\bigg)% \timesLOOSE \frac{n}{n + \alpha + \beta - 1} 
     \label{eq:LogDegreeAfterAnsatz}
\end{align}
% where we have used ${\big(n+1\big)\logTIGHT\big(n+1\big) - n\logTIGHT\big(n\big)=\logTIGHT\big(n\big) + 1 + \littleO{1}}$.  
Equating the logarithmic terms, we recover the condition that ${\thetain + \thetaout = 1}$.  
And equating the constant terms, 
%\potentiallyImprove{we can solve for the constant ${\ConstOne=\alphaP}$.}  
\novo{we solve for the constant, obtaining ${\ConstOne=\alphaP}$.} 
% \novo{we solve for the constant ${\ConstOne=\alphaP}$.} 

To verify our ansatz ${g(n) = \littleO{n \log n}}$, we consider the {lower-order} terms: 
\begin{align}
    g(n+1) - g(n) = \frac{g(n)}{n} + \biggerO{\tfrac{\log n}{n}}
\end{align}
\potentiallyImprove{The solution can be written} as ${g(n) = C\timesLOOSE n + f(n)}$, where ${f(n) = \littleO{n}}$.  

Note that $C$ is not determined by the asymptotic balance.  
This suggests that different instances of networks generated with the same parameters may limit to different values of $C$.  
This is similar to the situation with the classic P\'olya urn \citep{eggenberger1923statistik}, 
\potentiallyImprove{where any asymptotic ratio is equally stable, resulting in a distribution over these ratios for any fixed set of parameters \citep{mahmoud2008polya, pekoz2019polya}.}  


\subsubsection{Sub-linear degree regime: \protect{$1<\thetain +\thetaout<2$}}


When ${1<\thetain + \thetaout < 2}$, the average degree grows as a (sublinear) power of $n$:
\begin{equation}
    \avgdegree \propto C \kern1pt n^{\rho}, \qquad \rho=\thetain +\thetaout-1\label{eq:PPAavgdegreeSumThetaGreater1}
\end{equation}


Again, we make the appropriate ansatz: 
\begin{align}
    \big\langle E(n) \big\rangle = \ConstOne \timesLOOSE n^{1+\rho}_{ } + g(n) \label{eq:SublinearDegreeAnsatz}
\end{align}
where ${g(n) = \littleO{n^{1+\rho}_{ }}}$ is subdominant.  
% The expected change in number of edges is given by

\potentiallyImprove{The change in ${n^{1+\rho}_{ }}$ is approximately}
\begin{align}
\big(n+1\big)^{1+\rho}_{ } - n^{1+\rho}_{ }=\big(1+\rho\big)n^{\rho}_{ } + \biggerO{n^{\rho-1}_{ }}.  
\end{align}

Substituting this into equation~\eqref{eq:ConstantDegreeAfterExpectation}, 
\begin{align}
     g(n+1) - g(n) + \underbrace{\ConstOne \timesLOOSE \big(1+\rho\big)n^{\rho}_{ } = \Bigg( \alphaP + \big(\thetain + \thetaout\big) \bigg(\ConstOne n^{\rho}_{ }}_{\text{equate these $\bigO{n^{\rho}}$ terms}} + \frac{g(n)}{n} \bigg) \Bigg) \timesLOOSE \bigg(1+\biggerO{\tfrac{1}{n}}\bigg)
     \label{eq:SublinearDegreeAfterAnsatz}
\end{align}
and equating the dominant $\bigO{n^{\rho}}$ terms, 
% we can solve for the exponent ${\rho=\thetain + \thetaout -1}$. 
% \novo{we solve for the exponent ${\rho=\thetain + \thetaout -1}$.}  
\novo{we solve for the exponent, obtaining ${\rho=\thetain + \thetaout -1}$.}  
% 

Note that this does not fix $\ConstOne$.  
To see why, let us attempt to verify our ansatz ${g(n) = \littleO{n^{1+\rho}_{ }}}$.  
We again equate the remaining {lower-order} terms: 
\begin{align}
    g(n+1) - g(n) = \big(1+\rho\big) \frac{g(n)}{n} + \alphaP + \biggerO{n^{\rho - 1}_{ }}
\end{align}
In this case, it seems as though our ansatz is not verified, with $g(n)$ being the same order as \potentiallyImprove{the ``dominant'' part of the solution:} ${g(n) = \ConstTwo\timesLOOSE n^{1+\rho}_{ } + \littleO{n^{1+\rho}_{ }}}$.  
However, this is in fact not a contradiction --- this is the asymptotic analysis telling us that the original \potentiallyImprove{constant $\ConstOne$ itself} is not determined.  

Recapitulating the sequence of results:\\[-12pt]
\begin{itemize}
    \item When $\thetain + \thetaout < 1$, the average degree asymptotes to a fixed constant. 
    \item When $\thetain + \thetaout = 1$, the average degree grows logarithmically in $n$, \potentiallyImprove{but} with an arbitrary additive constant.
    \item When $1 < \thetain + \thetaout < 2$, the average degree grows as a sublinear power of $n$, with an arbitrary multiplicative constant.
\end{itemize}
\hfill\qed

\commentToDo{Should we add a comment about the case of thetain plus thetaout equal 2?\\
 Also should we comment more about const1 for the constant regime? }






\subsection{Proof of Theorem~\ref{thm:PPAPhaseTransitiondegdist} \thmNamePPAAppendixdegdist}
\label{appendix:dapapowerlawproof}
% \subsection{Adjustable power-law}
% In the {\ppaAcron} model, the in-degrees \mbox{$d_i^{\text{in}} = \sum_{k=i+1}^{j-1} x_{ik}^{ }$} 
% (connections that node $i$ makes with later nodes) 
% exhibit a power-law (depending on $\thetain$):
% \begin{align*}
%     p\big(d\big)  \propto  d^{-\gamma} \qquad \gamma  =  1+\displaystyle\frac{1}{\thetain}
% \end{align*}

In the {\ppaAcron} model, the asymptotic distribution of node degrees exhibits a power-law tail %(depending on either $\thetain$ or $\thetaout$):
\mbox{$p(d) \propto d^{-\gamma}$}, where the \novo{scaling exponent $\gamma$} depends on either $\thetain$ or $\thetaout$: %\\
\def\TempKern{\kern30pt}
\begin{align}
    \vphantom{\bigg(}\text{constant:}      &\TempKern\gamma = \frac{1+\thetain}{\thetain}     \kern-2.5cm &0<\thetain+\thetaout\leq1 \\
    \vphantom{\bigg(}\text{polynomial:}    &\TempKern\gamma = \frac{2-\thetaout}{1-\thetaout}        \kern-2.5cm &1\leq\thetain+\thetaout<2 
\end{align}
%    \def\TempKern{\kern4pt}
%    \begin{tabular}{llr}
%     \vphantom{\Bigg(}\text{constant:}      &\TempKern$\displaystyle\gamma = \frac{1+\thetain}{\thetain}$     &\TempKern$0<\thetain+\thetaout\leq1$ \\
%     \vphantom{\Bigg(}polynomial:    &\TempKern$\displaystyle\gamma = \frac{2-\thetaout}{1-\thetaout}$                     &\TempKern$1\leq\thetain+\thetaout<2$
% \end{tabular}
% \begin{align*}
%     p\big(d\big)  \propto  d^{-\gamma} \qquad \gamma  = 
%         1+\displaystyle\frac{1}{\thetain}
%         \vphantom{\Bigg(}\text{constant:}      &\displaystyle\gamma = \frac{1+\thetain}{\thetain}     &0<\thetain+\thetaout\leq1 \\
%         \vphantom{\Bigg(}polynomial:    &\displaystyle\gamma = \frac{2-\thetaout}{1-\thetaout}                     \TempKern1\leq\thetain+\thetaout<2
% \end{align*}
To show this, we will first characterize the \potentiallyImprove{out-degrees \mbox{$d_j^{\text{out}} = \sum_{i=1}^{j-1} x_{ij}^{ }$} 
(connections that a node $j$ makes with previous nodes).}  
\potentiallyImprove{These out-degrees (and the node arrival time $j$) serve as the initial conditions for the growth of the in-degrees \mbox{$d_j^{\text{in}} = \sum_{k=j+1}^{n} x_{jk}^{ }$} 
(connections that node $j$ makes with later nodes).}  



\subsubsection{The out-degrees (connections with previous nodes)}

\potentiallyImprove{The out-degrees do \textit{not} exhibit a power law in this model.}    
\potentiallyImprove{This is because the outcomes of these $x_{ij}^{ }$ (\mbox{$1\leq i < j$}) are conditionally independent given the previous entries $x_{ab}^{ }$ (\mbox{$1\leq a < b < j$}), 
and the sum of independent Bernoulli variables does not exhibit a power-law distribution.}   

Denote these (conditionally) independent probabilities as $p_{ij}^{ }$.  
\potentiallyImprove{In our proof of the sparsity of the model above,} % in Appendix~\ref{appendixProof3Regimes}, 
we used the fact that the sum of these probabilities \mbox{\smash{$\sum_{i=1}^{j-1}p_{ij}^{ }$}} is the expected change in edges at each step $j$.  
\potentiallyImprove{Moreover, as the network grows, this sum does not change much between each step.}  
Thus, the expected out-degree \mbox{\smash{$d_j^{\text{out}} = \sum_{i=1}^{j-1} x_{ij}^{ }$}} of node $j$ is approximately 
\vspace{-12pt}
\def\TempKern{\kern30pt}
% \begin{center}
\begin{align}%[llr]
    \vphantom{\Bigg(}\text{constant:}      &\TempKern\big\langle d_j^{\text{out}} \big\rangle \sim \displaystyle\frac{\alphaP}{1-\big(\thetain+\thetaout\big)}     \kern-2.5cm &0<\thetain+\thetaout<1 \label{eq:dOutConstant}\\
    \vphantom{\Bigg(}\text{logarithmic:}   &\TempKern\big\langle d_j^{\text{out}} \big\rangle \sim \alphaP \log\kern-1pt \big(j\big) + C              \kern-2.5cm &\thetain+\thetaout=1 \label{eq:dOutLogarithmic}\\
    \vphantom{\Bigg(}\text{polynomial:}    &\TempKern\big\langle d_j^{\text{out}} \big\rangle \sim C \times j^{\thetain+\thetaout-1}        \kern-2.5cm &1<\thetain+\thetaout<2 \label{eq:dOutPolynomial}
\end{align}
% \end{center}
with a variance upper-bounded by this average \potentiallyImprove{(as each out-degree is a sum of conditionally independent Bernoulli random variables).}  

\subsubsection{The in-degrees (connections with later nodes)}

For a node $j$ with a given out-degree $d_j^{\text{out}}$, 
the expected in-degree grows according to the difference equation: 
\begin{align}
    \big\langle d_j^{\text{in}}\big\rangle(n+1) - \big\langle d_j^{\text{in}}\big\rangle(n) = \frac{\alphaP + \thetaout d_j^{\text{out}} + \thetain \big\langle d_j^{\text{in}}\big\rangle(n)}{n + \alphaP + \betaP - 1}  \qquad \big\langle d_j^{\text{in}}\big\rangle(j) = 0
\end{align}
 \potentiallyImprove{As this evolution does not depend on the outcome of any other edges in the network,} 
we can write the solution in closed form:
\begin{align}
    \big\langle d_j^{\text{in}}\big\rangle(n) = \frac{\alphaP + \thetaout d_j^{\text{out}}}{\thetain} \Bigg( \frac{\Gamma\big( \alphaP + \betaP + j - 1 \big)}{\Gamma\big( \alphaP + \betaP + \thetain + j - 1 \big)} \frac{\Gamma\big( \alphaP + \betaP + \thetain + n - 1 \big)}{\Gamma\big( \alphaP + \betaP +  n - 1 \big)} - 1\Bigg)
\end{align}
\novo{where $\Gamma$ is the gamma function, which satisfies \mbox{$\Gamma(m)=(m-1)!$} for positive integers $m$.}
% \novo{where is the gamma function.}

For \mbox{$1\ll j < n$}, 
\potentiallyImprove{the ratios of gamma functions can be approximated, 
and the expected degree as a function of $j$ and $n$ is} 
\begin{align}
    \big\langle d_j^{\text{ }}\big\rangle(n) \approx \frac{\alphaP + \thetaout \big\langle d_j^{\text{out}}\big\rangle}{\thetain} \Bigg( \bigg(\frac{n}{j}\bigg)^{\kern-2pt\thetain} - 1\Bigg) + \big\langle d_j^{\text{out}}\big\rangle \label{eq:diTotalAsAFunctionOfN}
\end{align}

\potentiallyImprove{We can extract the power law of the degree distribution from the dependence of the expected degree on the node index $j$.  
Since $\big\langle d_j^{\text{ }}\big\rangle$ is monotonically decreasing in $j$, 
the probability density will be proportional to the reciprocal of the magnitude of the derivative with respect to $j$:}
\begin{align}
    p\big(d\big) \propto \Big| \tfrac{d}{dj} \big\langle d_j^{\text{ }}\big\rangle \Big|^{-1} 
\end{align}
For a power-law degree distribution \mbox{$p\big(d\big) \propto d^{-\gamma}$}, 
the exponent is the negative of the rate of change of \mbox{$\log\kern-1pt\big(p(d)\big)$} with respect to \mbox{$\log\kern-2pt\big(d\big)$}:
\begin{align}
    \gamma = \frac{\tfrac{d}{dj}\log\kern-1pt\Big| \tfrac{d}{dj} \big\langle d_j^{\text{ }}\big\rangle \Big| }{\tfrac{d}{dj} \log\kern-1pt\big\langle d_j^{\text{ }}\big\rangle} = \frac{\big\langle d_j^{\text{ }}\big\rangle \tfrac{d^2}{dj^2}\big\langle d_j^{\text{ }}\big\rangle}{\big(\tfrac{d}{dj}\big\langle d_j^{\text{ }}\big\rangle\big)^{\kern-1pt 2}} \label{eq:ScalingExponentDerivatives}
\end{align}
Substitute the expressions for \mbox{$\big\langle d_j^{\text{out}}\big\rangle$} from equations~\eqref{eq:dOutConstant} and \eqref{eq:dOutPolynomial} into equation~\eqref{eq:diTotalAsAFunctionOfN}.  
\potentiallyImprove{When \mbox{$1\ll j \ll n$},} the dominant term has the following scalings:
% \begin{align}
%     \big\langle d_i^{\text{ }}\big\rangle(n) \propto \begin{cases}
%         n^{\thetain}_{ } i^{-\thetain}_{ } &\kern12pt\vphantom{\Big(} 0<\thetain+\thetaout<1 \\
%         n^{\thetain}_{ } i^{\thetaout - 1}_{ } &\kern12pt\vphantom{\Big(} 1<\thetain+\thetaout<2 \end{cases}
%     % n^{\thetain}_{ } i^{-\thetain}_{ } &\kern1cm 0<\thetain+\thetaout<1 \\
%     % \big\langle d_i^{\text{ }}\big\rangle(n) \propto n^{\thetain}_{ } i^{\thetaout - 1}_{ } &\kern1cm 1<\thetain+\thetaout<2 
% \end{align}
\begin{align}
    \vphantom{\bigg(}\text{constant:}      &\TempKern\big\langle d_j^{\text{ }}\big\rangle(n) \propto n^{\thetain}_{ } j^{-\thetain}_{ }     \kern-2.5cm &0<\thetain+\thetaout<1 \\%\label{eq:dConstant}\\
    \vphantom{\bigg(}\text{polynomial:}    &\TempKern\big\langle d_j^{\text{ }}\big\rangle(n) \propto n^{\thetain}_{ } j^{\thetaout - 1}_{ }        \kern-2.5cm &1<\thetain+\thetaout<2 %\label{eq:dTotalPolynomial}
\end{align}
% When \mbox{$0<\thetain+\thetaout<1$}, the expected out-degree limits to a constant, 
% so the 
Substituting these into equation~\eqref{eq:ScalingExponentDerivatives}, we obtain the following power-law exponents: 
\begin{align}
    \vphantom{\bigg(}\text{constant:}      &\TempKern\gamma = \frac{1+\thetain}{\thetain}     \kern-2.5cm &0<\thetain+\thetaout\leq1 \\
    \vphantom{\bigg(}\text{polynomial:}    &\TempKern\gamma = \frac{2-\thetaout}{1-\thetaout}        \kern-2.5cm &1\leq\thetain+\thetaout<2 
\end{align}
Note that both expressions give the same scaling when \mbox{$\thetain+\thetaout=1$} for the intermediate logarithmic regime.  \\
\hfill\qed

\commentToDo{comment about assumptions for validity of the proof and numerical confirmations...}