\newpage
\section{Proof of Theorems for {\ppaAcron} model}
\label{appendixDAPAProofs}
The Distributed Affine Preferential Attachment ({\ppaAcron}) model (Section~\ref{sec:ourppamodel}) is defined as:
\begin{align}
    x_{ij}^{ } &\sim \text{Bernoulli}\big(p_{ij}^{ }\big) \label{eq:PPAbernoulliAppendix} \\
    p_{ij}^{ } &= \frac{\alphaP + \thetain d_i^{\text{in}} + \thetaout d_i^{\text{out}}}{j-2+\alphaP +\betaP} \label{eq:PPAprobAppendix}\\
    d_i^{\text{in}} &= \sum_{\BoxNodeSS{}=i+1}^{j-1} x_{i\BoxNodeSS{}}^{ }  \quad\quad
    d_i^{\text{out}} = \sum_{\BoxNodeSS{}=1}^{i-1} x_{\BoxNodeSS{}i}^{ } \label{eq:PPAdoutAppendix}    
\end{align}
where \mbox{$x_{ij} = 1$} (\mbox{$x_{ij} = 0$}) indicates an edge (no edge) between nodes $i$ and $j$.

% This model exhibits three sparsity regimes (depending on $\thetain$ and $\thetaout$) and a flexible power law \novo{(depending on $\thetain$ for the ).} 
\novo{This model exhibits three sparsity regimes (depending on $\thetain$ and $\thetaout$) and a flexible power law (depending on $\thetain$ for the constant average degree regime and on $\thetaout$ for the polynomial degree regime). 
For the logarithmic average degree regime, 
which is at the transition between the constant and polynomial regimes, 
the dominant dependency 
% for the average degree 
is on the parameter $\alphaP$. 
And the expression for the power-law exponent in this transitional regime  agrees with the expression for both the constant and polynomial regimes. 
} 

\subsection{Proof of Theorem~\ref{thm:PPAPhaseTransition} \thmNamePPAAppendix}
% \label{appendixDAPAProofThm1}
% \subsubsection{Three sparsity regimes}
\label{appendixProof3Regimes}
% \begin{theorem}[\thmNamePPA]
% \label{thm:PPAPhaseTransitionAppendix}
    Our {\ppaAcron} model exhibits three qualitatively different asymptotic behaviors for the average degree $\avgdegree$, depending on the value of ${\thetain+\thetaout}$:\\[-12pt] %
    % depending on the value of ${\thetain+\thetaout}$ 
    % (see Fig.~\ref{fig:PPARegimes}, proof in Appendix~\ref{appendixProof3Regimes}):\\[-12pt]
    %Our {\ppaName} ({\ppaAcron}) model (\cref{eq:PPAprob,eq:PPAdin,eq:PPAdout}). 
% \end{theorem}
\vspace{-6pt}
\def\TempKern{\kern4pt}
\begin{center}
\begin{tabular}{llr}
    \vphantom{\Bigg(}constant:      &\TempKern$\displaystyle\frac{2\kern1pt\alphaP}{1-\big(\thetain+\thetaout\big)}$     &\TempKern$0<\thetain+\thetaout<1$ \\
    \vphantom{\Bigg(}logarithmic:   &\TempKern$2\kern1pt\alphaP \log\big(n\big) + C$                            &\TempKern$\thetain+\thetaout=1$ \\
    \vphantom{\Bigg(}polynomial:    &\TempKern$C \times n^{\thetain+\thetaout-1}$                     &\TempKern$1<\thetain+\thetaout<2$
\end{tabular}
\end{center}
%%%******
% The parameters $\thetain$ and $\thetaout$ correspond to $\HubName$ and $\PathName$ causal arrows, respectively. 
% If one uses the ordering of the nodes to orient the edges of the growing network, 
% {\hub} arrows refer to the \mbox{in-degree} 
% of the node $\BoxNodeS{}$ of the dyad \mbox{\dyadpair{\BoxNodeS{}}{j}} being decided 
% (\ie, dyads of the type \mbox{\dyadpair{\BoxNodeS{}}{i}}, where \mbox{$\BoxNodeS{}<i$}). 
% Whereas {\transitive} arrows refer to the \mbox{out-degree} of the node $\BoxNodeS{}$ 
% (\ie, dyads of the type \mbox{\dyadpair{i}{\BoxNodeS{}}}, where \mbox{$i<\BoxNodeS{}$}). 
% \footnote{Albeit not necessary, 
% due to the ordering of the nodes in the growing network,
% the presence of a dyad (\ie, an edge) can be thought as an arrow with the newer node as the tail and the older node as the head, or likewise as a direct edge from the newer node to the older node. 
% {\hub} and {\transitive} describe how dyads with different tail nodes (\ie, newer nodes) can directly influence each other, 
% and the case where the dyads that have the same tail node directly influence each other is described by {\forward} \textit{or} {\backward}.\label{footnotedirection}} 
\novo{
% Albeit not necessary, 
% due to the ordering of the nodes in the growing network,
% the presence of a dyad (\ie, an edge) can be thought as an arrow with the newer node as the tail and the older node as the head, or likewise as a direct edge from the newer node to the older node. 
The parameters $\thetain$ and $\thetaout$ correspond to $\HubName$ and $\PathName$ causal arrows, respectively.  
If one uses the ordering of the nodes to orient the edges of the growing network, 
{\hub} arrows refer to the \mbox{in-degree} 
of the node $\BoxNodeS{}$ of the dyad \mbox{\dyadpair{\BoxNodeS{}}{j}} being decided 
(\ie, dyads of the type \mbox{\dyadpair{\BoxNodeS{}}{i}}, where \mbox{$\BoxNodeS{}<i$}). 
Whereas {\transitive} arrows refer to the \mbox{out-degree} of the node $\BoxNodeS{}$ 
(\ie, dyads of the type \mbox{\dyadpair{i}{\BoxNodeS{}}}, where \mbox{$i<\BoxNodeS{}$}). 
% The parameters $\thetain$ and $\thetaout$ correspond to $\HubName$ and $\PathName$ causal arrows, respectively. 
% These arrows are associated with the parameters $\thetain$ and $\thetaout$, respectively. 
}
\novo{However, orienting the edges is not necessary, and our theorems refer to the undirected degrees of the nodes.}
% {\hub} and {\transitive} describe how dyads with different tail nodes (\ie, newer nodes) can directly influence each other, 
% and the case where the dyads that have the same tail node directly influence each other is described by {\forward} \textit{or} {\backward}.

% \novo{Note that this model has a remarkable degree of parallelization: it can be generated $\mathcal{O}(n)$ in time, where $n$ is the number of nodes in the network, in contrast to the $\mathcal{O}(n^2)$ time need .}
% This leads to a remarkable degree of parallelizability 

\novo{We now derive the expressions for the average degree in the three regimes, 
starting with the constant regime.} 
 
\def\logTIGHT{\log\kern-1pt}
\def\timesLOOSE{\kern1pt\times\kern1pt}
\def\ConstOne{C_1^{ }}
\def\ConstTwo{C_2^{ }}
\subsubsection{Constant degree regime (when: \protect$0\leq\thetain +\thetaout <1$)}
% ***maybe quick comment that both thetas equal zero is ER
In this regime, the average degree converges to a constant: 
\begin{equation}
    \avgdegree = \frac{2\kern1pt\alphaP}{1-(\thetain+\thetaout)}  + \littleO{1} \label{eq:PPAavgdegreeSumThetaLess1}
\end{equation}

\potentiallyRemove{For a node $j$, its in-degree $\din_j$ and out-degree $\dout_j$ are}
\potentiallyRemove{
\begin{align}
\din_j = \sum_{k=j+1}^{n} x_{jk} \kern1cm \text{and} \kern1cm \dout_j = \sum_{i=1}^{j-1} x_{ij}
\end{align}
}
After node $n$ has decided all its connections, 
the total number of edges in the network is
\begin{align}
    E(n) = \sum_{i=1}^{n} \din_i = \sum_{i=1}^n \dout_i
\end{align}
The expected number of edges added at each step\footnote{To simplify notation, here, we use $n$ for both the step/iteration of the model and the number of nodes.} is
%(indeed, although this model is parallelizable, one can always simulate it sequentially with a single node arriving at each step).} $n+1$ is
\begin{align}
    % \big\langle E(n+1) - E(n) | E(n) \big\rangle 
     \big\langle E(n+1) - E(n)  \big\rangle 
    &= \sum_{i=1}^{n} \frac{\alphaP + \thetain \din_i + \thetaout \dout_i}{n + \alphaP + \betaP - 1} \nonumber \\
    &= \frac{\alphaP n +\big(\thetain + \thetaout\big) E(n)}{n + \alphaP+ \betaP - 1} \label{eq:EDotOfN}
\end{align}
We make an ansatz of constant average degree 
\begin{align}
    \big\langle E(n) \big\rangle = \ConstOne \timesLOOSE n + g(n) \label{eq:ConstantDegreeAnsatz}
\end{align}
where ${g(n) = \littleO{n}}$ is subdominant.  

We will first solve for $\ConstOne$ to obtain the asymptotic average degree ${\langle d \rangle = 2\ConstOne}$, 
then we will verify our assumption that ${g(n) = \littleO{n}}$.  

Taking the expectation of \eqref{eq:EDotOfN}, 
\begin{align}
    \big\langle E(n+1) \big\rangle - \big\langle E(n) \big\rangle &= \frac{\alphaP n +\big(\thetain + \thetaout\big) \big\langle E(n) \big\rangle}{n + \alphaP + \betaP - 1} \label{eq:ConstantDegreeAfterExpectation}
\end{align}
using our ansatz \eqref{eq:ConstantDegreeAnsatz},
\begin{align}
     g(n+1) - g(n) + \underbrace{\ConstOne = \Bigg( \alphaP + \big(\thetain + \thetaout\big) \bigg(\ConstOne}_{\text{equate these constant terms}} + \frac{g(n)}{n} \bigg) \Bigg) \timesLOOSE \frac{n}{n + \alphaP + \betaP - 1} \label{eq:ConstantDegreeAfterAnsatz}
\end{align}
% **
and equating the $\bigTh{1}$ (constant) terms to solve for $\ConstOne$, 
\begin{align}
    \ConstOne &= \alphaP + \big(\thetain + \thetaout\big) \ConstOne \\
    &= \frac{\alphaP}{1-\big(\thetain + \thetaout\big)} \label{eq:ConstantDegreeSolveForC}
\end{align}
we obtain the asymptotic average degree claimed in \eqref{eq:PPAavgdegreeSumThetaLess1}.  

To verify our ansatz ${g(n) = \littleO{n}}$, substitute \eqref{eq:ConstantDegreeSolveForC} into \eqref{eq:ConstantDegreeAfterAnsatz}
\begin{align}
    \underbrace{g(n+1) - g(n) = \frac{\big(\thetain + \thetaout\big) g(n)}{n}}_{\text{equate these dominant terms}} - \frac{\ConstOne\big(\alphaP+\betaP-1\big)}{n} + \biggerO{\tfrac{g(n)}{n^2}}
\end{align}
to conclude that ${g(n) = \bigO{n^{\thetain+\thetaout}}}$.  

So our ansatz ${g(n) = \littleO{n}}$ is valid for ${\thetain+\thetaout<1}$, 
which incidentally is precisely when equation~\eqref{eq:PPAavgdegreeSumThetaLess1} is physically meaningful.  

% and separating the $\bigO{1}$ terms from the $\littleO{1}$ terms, we have
% \begin{align}
%     \bigO{1}:& \qquad C = \alphaP + \big(\thetain + \thetaout\big) C \label{eq:ConstantDegreeCTerms}\\
%     \bigO{1/n}:& \qquad g(n+1) - g(n) = -\frac{\alpha+\beta-1}{n} + \big(\thetain + \thetaout\big) \frac{g(n)}{n} + \bigO{n^{-2}}\label{eq:ConstantDegreeGTerms}
% \end{align}

\subsubsection{Logarithmic degree regime (when: \protect$\thetain + \thetaout=1$)}
As ${\thetain + \thetaout \rightarrow 1}$, the average degree predicted by \eqref{eq:PPAavgdegreeSumThetaLess1} diverges, 
and when ${\thetain + \thetaout = 1}$, the average degree is no longer bounded.  
Instead, it grows logarithmically in $n$:
\begin{equation}
    % \avgdegree = \alpha\logTIGHT\big(n\big) \timesLOOSE \Big(1+\littleO{1}\Big) \label{eq:PPAavgdegreeSumThetaEqual1}
    \avgdegree = 2\kern1pt\alphaP\logTIGHT\big(n\big) + C + \littleO{1} \label{eq:PPAavgdegreeSumThetaEqual1}
\end{equation}


Similar to equation~\eqref{eq:ConstantDegreeAnsatz},
we make an ansatz but now of logarithmic average degree 
\begin{align}
    \big\langle E(n) \big\rangle = \ConstOne \timesLOOSE n \log n + g(n) \label{eq:LogDegreeAnsatz}
\end{align}
where ${g(n) = \littleO{n \log n}}$ is subdominant.  
% The expected change in number of edges is given by

The change in ${n \log n}$ is approximately
\begin{align}
\big(n+1\big)\logTIGHT\big(n+1\big) - n\logTIGHT\big(n\big)=\logTIGHT\big(n\big) + 1 + \biggerO{\tfrac{1}{n}}.  
\end{align}
Substituting this into equation~\eqref{eq:ConstantDegreeAfterExpectation}, %${n\logTIGHT\big(1+\frac{1}{n}\big)=1+\littleO{1}}$
\begin{align}
     % g(n+1) - g(n) + \ConstOne \timesLOOSE \Bigg( \logTIGHT\big(n+1) + n\logTIGHT\bigg(\frac{n+1}{n}\bigg) \Bigg) = \Bigg( \alpha + \big(\thetain + \thetaout\big) \bigg(\ConstOne\kern1pt\logTIGHT\big(n\big) + \frac{g(n)}{n} \bigg) \Bigg) \times \frac{n}{n + \alpha + \beta - 1} \\
     g(n+1) - g(n) + \underbrace{\ConstOne \timesLOOSE \bigg( \logTIGHT\big(n) + 1 \bigg) = \Bigg( \alphaP + \big(\thetain + \thetaout\big) \bigg(\ConstOne\kern1pt\logTIGHT\big(n\big)}_{\text{equate these logarithmic and constant terms}} + \frac{g(n)}{n} \bigg) \Bigg) \timesLOOSE \bigg(1+\biggerO{\tfrac{1}{n}}\bigg)% \timesLOOSE \frac{n}{n + \alpha + \beta - 1} 
     \label{eq:LogDegreeAfterAnsatz}
\end{align}
% where we have used ${\big(n+1\big)\logTIGHT\big(n+1\big) - n\logTIGHT\big(n\big)=\logTIGHT\big(n\big) + 1 + \littleO{1}}$.  
Equating the logarithmic terms, we recover the condition that ${\thetain + \thetaout = 1}$.  
And equating the constant terms, we can solve for the constant ${\ConstOne=\alphaP}$.  

To verify our ansatz ${g(n) = \littleO{n \log n}}$, we consider the {lower-order} terms: 
\begin{align}
    g(n+1) - g(n) = \frac{g(n)}{n} + \biggerO{\tfrac{\log n}{n}}
\end{align}
The solution can be written as ${g(n) = C\timesLOOSE n + f(n)}$, where ${f(n) = \littleO{n}}$.  

Note that $C$ is not determined by the asymptotic balance.  
This suggests that different instances of networks generated with the same parameters may converge to different values of $C$.  
This is similar to the situation with the classic P\'olya urn \citep{eggenberger1923statistik}, where any asymptotic ratio is equally stable, resulting in a distribution over these ratios for any fixed set of parameters \citep{mahmoud2008polya, pekoz2019polya}.  


\subsubsection{Sub-linear degree regime (when: \protect$1<\thetain +\thetaout<2$)}
When ${1<\thetain + \thetaout < 2}$, the average degree grows as a (sublinear) power of $n$:
\begin{equation}
    \avgdegree \propto C \kern1pt n^{\rho}, \qquad \rho=\thetain +\thetaout-1\label{eq:PPAavgdegreeSumThetaGreater1}
\end{equation}

Again, we make the appropriate ansatz: 
\begin{align}
    \big\langle E(n) \big\rangle = \ConstOne \timesLOOSE n^{1+\rho}_{ } + g(n) \label{eq:SublinearDegreeAnsatz}
\end{align}
where ${g(n) = \littleO{n^{1+\rho}_{ }}}$ is subdominant.  
% The expected change in number of edges is given by
The change in ${n^{1+\rho}_{ }}$ is approximately
\begin{align}
\big(n+1\big)^{1+\rho}_{ } - n^{1+\rho}_{ }=\big(1+\rho\big)n^{\rho}_{ } + \biggerO{n^{\rho-1}_{ }}.  
\end{align}

Substituting this into equation~\eqref{eq:ConstantDegreeAfterExpectation}, 
\begin{align}
     g(n+1) - g(n) + \underbrace{\ConstOne \timesLOOSE \big(1+\rho\big)n^{\rho}_{ } = \Bigg( \alphaP + \big(\thetain + \thetaout\big) \bigg(\ConstOne n^{\rho}_{ }}_{\text{equate these $\bigO{n^{\rho}}$ terms}} + \frac{g(n)}{n} \bigg) \Bigg) \timesLOOSE \bigg(1+\biggerO{\tfrac{1}{n}}\bigg)
     \label{eq:SublinearDegreeAfterAnsatz}
\end{align}
and equating the dominant $\bigO{n^{\rho}}$ terms, we can solve for the exponent ${\rho=\thetain + \thetaout -1}$.  

Note that this does not fix $\ConstOne$.  
To see why, let us attempt to verify our ansatz ${g(n) = \littleO{n^{1+\rho}_{ }}}$.  
We again equate the remaining {lower-order} terms: 
\begin{align}
    g(n+1) - g(n) = \big(1+\rho\big) \frac{g(n)}{n} + \biggerO{n^{\rho - 1}_{ }}
\end{align}
In this case, it seems as though our ansatz is not verified, with $g(n)$ being the same order as the ``dominant'' part of the solution: ${g(n) = \ConstTwo\timesLOOSE n^{1+\rho}_{ } + \littleO{n^{1+\rho}_{ }}}$.  
However, this is in fact not a contradiction --- this is the asymptotic analysis telling us that the original constant $\ConstOne$ itself is not determined.  

Recapitulating the sequence of results:\\[-12pt]
\begin{itemize}
    \item When $\thetain + \thetaout < 1$, the average degree asymptotes to a fixed constant. 
    \item When $\thetain + \thetaout = 1$, the average degree grows logarithmically in $n$, but with an arbitrary additive constant.
    \item When $\thetain + \thetaout > 1$, the average degree grows as a sublinear power of $n$, with an arbitrary multiplicative constant.
\end{itemize}
\hfill\qed







\subsection{Proof of Theorem~\ref{thm:PPAPhaseTransitiondegdist} \thmNamePPAAppendixdegdist}
\label{appendix:dapapowerlawproof}
% \subsection{Adjustable power-law}
% In the {\ppaAcron} model, the in-degrees \mbox{$d_i^{\text{in}} = \sum_{k=i+1}^{j-1} x_{ik}^{ }$} 
% (connections that node $i$ makes with later nodes) 
% exhibit a power-law (depending on $\thetain$):
% \begin{align*}
%     p\big(d\big)  \propto  d^{-\gamma} \qquad \gamma  =  1+\displaystyle\frac{1}{\thetain}
% \end{align*}
In the {\ppaAcron} model, the asymptotic distribution of node degrees exhibits a power-law tail %(depending on either $\thetain$ or $\thetaout$):
\mbox{$p(d) \propto d^{-\gamma}$}, where the scaling exponent depends on either $\thetain$ or $\thetaout$: %\\
\def\TempKern{\kern30pt}
\begin{align}
    \vphantom{\bigg(}\text{constant:}      &\TempKern\gamma = \frac{1+\thetain}{\thetain}     \kern-2.5cm &0<\thetain+\thetaout\leq1 \\
    \vphantom{\bigg(}\text{polynomial:}    &\TempKern\gamma = \frac{2-\thetaout}{1-\thetaout}        \kern-2.5cm &1\leq\thetain+\thetaout<2 
\end{align}
%    \def\TempKern{\kern4pt}
%    \begin{tabular}{llr}
%     \vphantom{\Bigg(}\text{constant:}      &\TempKern$\displaystyle\gamma = \frac{1+\thetain}{\thetain}$     &\TempKern$0<\thetain+\thetaout\leq1$ \\
%     \vphantom{\Bigg(}polynomial:    &\TempKern$\displaystyle\gamma = \frac{2-\thetaout}{1-\thetaout}$                     &\TempKern$1\leq\thetain+\thetaout<2$
% \end{tabular}
% \begin{align*}
%     p\big(d\big)  \propto  d^{-\gamma} \qquad \gamma  = 
%         1+\displaystyle\frac{1}{\thetain}
%         \vphantom{\Bigg(}\text{constant:}      &\displaystyle\gamma = \frac{1+\thetain}{\thetain}     &0<\thetain+\thetaout\leq1 \\
%         \vphantom{\Bigg(}polynomial:    &\displaystyle\gamma = \frac{2-\thetaout}{1-\thetaout}                     \TempKern1\leq\thetain+\thetaout<2
% \end{align*}
To show this, we will first characterize the out-degrees \mbox{$d_j^{\text{out}} = \sum_{i=1}^{j-1} x_{ij}^{ }$} 
(connections that a node $j$ makes with previous nodes).  
These out-degrees (and the node arrival time $j$) serve as the initial conditions for the growth of the in-degrees \mbox{$d_j^{\text{in}} = \sum_{k=j+1}^{n} x_{jk}^{ }$} 
(connections that node $j$ makes with later nodes).  


\subsubsection{The out-degrees (connections with previous nodes)}
The out-degrees do \textit{not} exhibit a power law in this model.  
This is because the outcomes of these $x_{ij}^{ }$ (\mbox{$1\leq i < j$}) are conditionally independent given the previous entries $x_{ab}^{ }$ (\mbox{$1\leq a < b < j$}), 
and the sum of independent Bernoulli variables does not exhibit a power-law distribution.  

Denote these (conditionally) independent probabilities as $p_{ij}^{ }$.  
In the proof of the sparsity of the model in Appendix~\ref{appendixProof3Regimes}, 
we used the fact that the sum of these probabilities \mbox{\smash{$\sum_{i=1}^{j-1}p_{ij}^{ }$}} is the expected change in edges at each step $j$.  
Moreover, as the network grows, this sum does not change much between each step.  
Thus, the expected out-degree \mbox{\smash{$d_j^{\text{out}} = \sum_{i=1}^{j-1} x_{ij}^{ }$}} of node $j$ is approximately 
\vspace{-12pt}
\def\TempKern{\kern30pt}
% \begin{center}
\begin{align}%[llr]
    \vphantom{\Bigg(}\text{constant:}      &\TempKern\big\langle d_j^{\text{out}} \big\rangle \sim \displaystyle\frac{\alphaP}{1-\big(\thetain+\thetaout\big)}     \kern-2.5cm &0<\thetain+\thetaout<1 \label{eq:dOutConstant}\\
    \vphantom{\Bigg(}\text{logarithmic:}   &\TempKern\big\langle d_j^{\text{out}} \big\rangle \sim \alphaP \log\kern-1pt \big(j\big) + C              \kern-2.5cm &\thetain+\thetaout=1 \label{eq:dOutLogarithmic}\\
    \vphantom{\Bigg(}\text{polynomial:}    &\TempKern\big\langle d_j^{\text{out}} \big\rangle \sim C \times j^{\thetain+\thetaout-1}        \kern-2.5cm &1<\thetain+\thetaout<2 \label{eq:dOutPolynomial}
\end{align}
% \end{center}
with a variance upper-bounded by this average (as they are the sum of independent Bernoulli random variables).  

\subsubsection{The in-degrees (connections with later nodes)}
For a node $j$ with a given out-degree $d_j^{\text{out}}$, 
the expected in-degree grows according to the difference equation: 
\begin{align}
    \big\langle d_j^{\text{in}}\big\rangle(n+1) - \big\langle d_j^{\text{in}}\big\rangle(n) = \frac{\alphaP + \thetaout d_j^{\text{out}} + \thetain \big\langle d_j^{\text{in}}\big\rangle(n)}{n + \alphaP + \betaP - 1}  \qquad \big\langle d_j^{\text{in}}\big\rangle(j) = 0
\end{align}
As this evolution does not depend on the outcome of any other edges in the network, 
we can write the solution in closed form:
\begin{align}
    \big\langle d_j^{\text{in}}\big\rangle(n) = \frac{\alphaP + \thetaout d_j^{\text{out}}}{\thetain} \Bigg( \frac{\Gamma\big( \alphaP + \betaP + j - 1 \big)}{\Gamma\big( \alphaP + \betaP + \thetain + j - 1 \big)} \frac{\Gamma\big( \alphaP + \betaP + \thetain + n - 1 \big)}{\Gamma\big( \alphaP + \betaP +  n - 1 \big)} - 1\Bigg)
\end{align}
For \mbox{$1\ll j < n$}, the ratios of gamma functions can be approximated, and the expected degree as a function of $j$ and $n$ is
\begin{align}
    \big\langle d_j^{\text{ }}\big\rangle(n) \approx \frac{\alphaP + \thetaout \big\langle d_j^{\text{out}}\big\rangle}{\thetain} \Bigg( \bigg(\frac{n}{j}\bigg)^{\kern-2pt\thetain} - 1\Bigg) + \big\langle d_j^{\text{out}}\big\rangle \label{eq:diTotalAsAFunctionOfN}
\end{align}

We can extract the power law of the degree distribution from the dependence of the expected degree on the node index $j$.  
Since $\big\langle d_j^{\text{ }}\big\rangle$ is monotonically decreasing in $j$, 
the probability density will be proportional to the reciprocal of the magnitude of the derivative with respect to $j$:
\begin{align}
    p\big(d\big) \propto \Big| \tfrac{d}{dj} \big\langle d_j^{\text{ }}\big\rangle \Big|^{-1} 
\end{align}
For a power-law degree distribution \mbox{$p\big(d\big) \propto d^{-\gamma}$}, 
the exponent is the negative of the rate of change of \mbox{$\log\kern-1pt\big(p(d)\big)$} with respect to \mbox{$\log\kern-2pt\big(d\big)$}:
\begin{align}
    \gamma = \frac{\tfrac{d}{dj}\log\kern-1pt\Big| \tfrac{d}{dj} \big\langle d_j^{\text{ }}\big\rangle \Big| }{\tfrac{d}{dj} \log\kern-1pt\big\langle d_j^{\text{ }}\big\rangle} = \frac{\big\langle d_j^{\text{ }}\big\rangle \tfrac{d^2}{dj^2}\big\langle d_j^{\text{ }}\big\rangle}{\big(\tfrac{d}{dj}\big\langle d_j^{\text{ }}\big\rangle\big)^{\kern-1pt 2}} \label{eq:ScalingExponentDerivatives}
\end{align}
Substitute the expressions for \mbox{$\big\langle d_j^{\text{out}}\big\rangle$} from equations~\eqref{eq:dOutConstant} and \eqref{eq:dOutPolynomial} into equation~\eqref{eq:diTotalAsAFunctionOfN}.  
When \mbox{$1\ll j \ll n$}, the dominant term has the following scalings:
% \begin{align}
%     \big\langle d_i^{\text{ }}\big\rangle(n) \propto \begin{cases}
%         n^{\thetain}_{ } i^{-\thetain}_{ } &\kern12pt\vphantom{\Big(} 0<\thetain+\thetaout<1 \\
%         n^{\thetain}_{ } i^{\thetaout - 1}_{ } &\kern12pt\vphantom{\Big(} 1<\thetain+\thetaout<2 \end{cases}
%     % n^{\thetain}_{ } i^{-\thetain}_{ } &\kern1cm 0<\thetain+\thetaout<1 \\
%     % \big\langle d_i^{\text{ }}\big\rangle(n) \propto n^{\thetain}_{ } i^{\thetaout - 1}_{ } &\kern1cm 1<\thetain+\thetaout<2 
% \end{align}
\begin{align}
    \vphantom{\bigg(}\text{constant:}      &\TempKern\big\langle d_j^{\text{ }}\big\rangle(n) \propto n^{\thetain}_{ } j^{-\thetain}_{ }     \kern-2.5cm &0<\thetain+\thetaout<1 \\%\label{eq:dConstant}\\
    \vphantom{\bigg(}\text{polynomial:}    &\TempKern\big\langle d_j^{\text{ }}\big\rangle(n) \propto n^{\thetain}_{ } j^{\thetaout - 1}_{ }        \kern-2.5cm &1<\thetain+\thetaout<2 %\label{eq:dTotalPolynomial}
\end{align}
% When \mbox{$0<\thetain+\thetaout<1$}, the expected out-degree limits to a constant, 
% so the 
Substituting these into equation~\eqref{eq:ScalingExponentDerivatives}, we obtain the following power-law exponents: 
\begin{align}
    \vphantom{\bigg(}\text{constant:}      &\TempKern\gamma = \frac{1+\thetain}{\thetain}     \kern-2.5cm &0<\thetain+\thetaout\leq1 \\
    \vphantom{\bigg(}\text{polynomial:}    &\TempKern\gamma = \frac{2-\thetaout}{1-\thetaout}        \kern-2.5cm &1\leq\thetain+\thetaout<2 
\end{align}
Notice that both expressions give the same scaling when \mbox{$\thetain+\thetaout=1$} for the intermediate logarithmic regime.  \\
\hfill\qed


