\documentclass{article}

\usepackage[utf8]{inputenc} % allow utf-8 input
\usepackage[T1]{fontenc}    % use 8-bit T1 fonts
\usepackage{booktabs}       % professional-quality tables
\usepackage{amsfonts}       % blackboard math symbols
\usepackage{nicefrac}       % compact symbols for 1/2, etc.
\usepackage{graphicx}
\usepackage{amsmath,amssymb,amsfonts}
\usepackage{tikz}
\usepackage[dvipsnames]{xcolor}

\usetikzlibrary{arrows, chains, fit, quotes, matrix,calc, positioning, backgrounds,tikzmark}
\usepackage{tkz-graph}

\title{}

\date{} 

\author{}

\begin{document}

\maketitle

\begin{center}

\begin{tikzpicture}
[
roundsqnode/.style={rectangle, align=center, rounded corners=1ex, draw=green!60, fill=green!5, very thick, minimum size=5mm},
roundrecnode/.style={rectangle, rounded corners=1ex, draw=blue!60, very thick, minimum size=5mm, align=center},
roundnode/.style={circle, draw=green!60, very thick, minimum size=3mm},
squarednode/.style={rectangle, align=center, draw=blue!30, fill=blue!5, very thick, minimum size=5mm},
squarednodepri/.style={rectangle, align=center, draw=gray!50, fill=gray!5, very thick, minimum size=5mm},
]

\node[squarednode] (user) {\footnotesize{User ($\mathcal{S},\mathcal{A},\theta$)}\\\footnotesize{$\pi_{\theta}\sim p(\pi|\theta)$}};

\node[squarednodepri] (userpri) [right=70pt of user] {\footnotesize{User ($\mathcal{S}^\prime,\mathcal{A}^\prime,\theta^\prime$)}\\\footnotesize{$\pi_{\theta^\prime}\sim p(\pi|\theta^\prime)$}};

\node[roundsqnode] (lowerrect) [below=70pt of user] {\footnotesize{\sf AS} \\ (${\rm h}_\psi,{\rm g}_\phi,\mathcal{M}$)};

\node[roundsqnode,fill=red!5,draw=red!60] (usermlowerrect) [right=80pt of lowerrect] {\footnotesize{\sf AS$^\prime$} \\ (${\rm h}_{\psi}^\prime,{\rm g}_{\phi}^{\prime}$)};

\node[roundsqnode, minimum width=23mm, minimum height=48mm, fill=none, draw=green!60, dashed] (environment) [below=-35pt of user] {};

\node[align=center, yshift = -15mm, xshift =-15mm,rotate=90] at (user) (env) {\footnotesize{\sf Env}};

\node[roundsqnode, minimum width=25mm, minimum height=48mm, fill=none, draw=red!60, dashed] (environmentpri) [below=-35pt of userpri] {};

\node[align=center, yshift = -15mm, xshift =15mm,rotate=90] at (userpri) (env) {\footnotesize{\sf Env$^\prime$}};

\node[align=center, yshift =+1.3mm, xshift = -3mm] at (userpri.south) (statepri) {};

\node[align=center, yshift=-1.3mm, xshift = -2.2mm] at (usermlowerrect.north) (AIpri) {};

\node[align=center, yshift =+1.3mm, xshift = +2.5mm] at (userpri.south) (actionpri) {};

\node[align=center, yshift=-1.3mm, xshift = +3.2mm] at (usermlowerrect.north) (AIprirecomm) {};

\draw[-latex',very thick] (statepri) -- (AIpri); 

\node[align=center, yshift = -17mm, xshift = -7mm,rotate=-90] at (userpri) (observationpri) {\scriptsize{$\mathbf{o}^\prime=(\mathbf{s}^\prime,\mathbf{a}^\prime)\in\mathcal{D}^{\prime\sf C}$}};

\draw[-latex',very thick] (AIprirecomm) -- (actionpri); 

\node[align=center, yshift = -17mm, xshift = +6mm,rotate=-90] at (userpri) (actionprim) {\scriptsize{$\mathbf{a}^\prime={\rm g}_{\phi}^\prime(\mathcal{D}^{\prime\sf T})$}};

\draw[-latex',very thick] (user.south) -- (lowerrect.north);

\node[align=center, yshift = -17mm, xshift = 3mm, rotate=-90] at (user) (observation) {\scriptsize $\mathbf{o}=(\mathbf{s},\mathbf{a})\in\mathcal{D}$};

\draw[-latex',dashed,very thick] (lowerrect.east)--(usermlowerrect.west); 

\node[align=center, yshift = 3mm, xshift =-24mm, rotate=0] at (usermlowerrect) (gradientn) {$\omega=\left(\psi,\phi\right)$};

\end{tikzpicture}
\end{center}

\end{document}