% \begin{table*}
%     \centering
%     % \small
%     \caption{Recommendation performance comparison. The highest results are boldfaced while the runners-up are underlined. Units of numbers are percentage (\%). All models are trained ten times with different random seeds. Reported numbers are averaged over ten runs. $^\star$ denotes statistical significance on a paired t-test with $\text{p-value} < 0.05$. }
%     % On MovieLens, where models' performance vary, \ourmethod's numbers are statistically significant on some metrics, e.g., the statistically significant gap between \ourmethod\ and ADDVAE on R@10, N@10 and N@50.\looseness=-1}
%     \label{tab:recom_result}
%     \scalebox{1}{
%     % \begin{tabular}{c@{\hskip 0.04in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.2in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.2in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c}
%     \begin{tabular}{c
%                     c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c 
%                     c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c 
%                     c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c}
%         \toprule
%         \multirow{3}{*}{\textbf{Model}} & \multicolumn{4}{c}{\textbf{CiteULike-a}} & \multicolumn{4}{c}{\textbf{Cell Phones}} & \multicolumn{4}{c}{\textbf{MovieLens}}\\
%         \cmidrule(lr){2-5}\cmidrule(lr){6-9}\cmidrule(lr){10-13}
%         & Recall & Recall & NDCG & NDCG & Recall & Recall & NDCG & NDCG & Recall & Recall & NDCG & NDCG\\
%         & @10 & @50 & @10 & @50 & @10 & @50 & @10 & @50 & @10 & @50 & @10 & @50\\
%         \midrule
%         MDCVAE & 22.43 & 38.72 & 20.97 & 26.45 & 4.34 & 9.60 & 3.38 & 4.87 & 14.03 & 29.75 & 11.98 & 18.13\\
%         TopicVAE & 17.00 & 37.78 & 17.54 & 23.84 & 5.31 & 11.59 & 4.23 & 6.00 & 14.27 & 31.90 & 13.01 & 19.54\\
%         RecVAE & 21.46 & 38.39 & 22.43 & 27.27 & 3.77 & 8.79 & 2.92 & 4.34 & \textbf{14.45} & 32.78 & 13.02 & \underline{19.80}\\
%         MacridVAE & 21.92 & 43.00 & 22.95 & 29.21 & 5.82 & 11.96 & 4.84 & 6.58 & 14.25 & 32.28 & 12.74 & 19.49\\
%         SEM-MacridVAE & 22.25 & 42.52 & 23.42 & 29.41 & 5.13 & 10.91 & 4.23 & 5.88 & 14.17 & 31.59 & \textbf{13.36} & 19.77\\
%         ADDVAE & \underline{23.44} & \underline{43.89} & \underline{24.12} & \underline{30.23} & 5.76 & 11.96 & 4.90 & 6.65 & 14.01 & \underline{32.95} & 12.62 & 19.63\\
%         VALID & 22.50 & 43.44 & 23.24 & 29.43 & \underline{6.18} & \underline{12.61} & \underline{5.21} & \underline{7.01} & 14.22 & 31.91 & 12.99 & 19.60\\
%         \midrule
%         \ourmethod & $\textbf{24.10}^\star$ & $\textbf{45.26}^\star$ & $\textbf{24.68}^\star$ & $\textbf{30.93}^\star$ & $\textbf{6.63}^\star$ & $\textbf{13.65}^\star$ & $\textbf{5.35}^\star$ & $\textbf{7.35}^\star$ & \underline{14.36} & $\textbf{33.22}^\star$ & \underline{13.08} & $\textbf{20.05}^\star$\\
%         \bottomrule
%     \end{tabular}
%     }
% \end{table*}

% \begin{table*}
%     \centering
%     % \small
%     \caption{Recommendation performance comparison. The highest results are boldfaced while the runners-up are underlined. Units of numbers are percentage (\%). All models are trained ten times with different random seeds. Reported numbers are averaged over ten runs. $^\star$ denotes statistical significance on a paired t-test with $\text{p-value} < 0.05$. }
%     % On MovieLens, where models' performance vary, \ourmethod's numbers are statistically significant on some metrics, e.g., the statistically significant gap between \ourmethod\ and ADDVAE on R@10, N@10 and N@50.\looseness=-1}
%     \label{tab:recom_result}
%     \scalebox{0.9}{
%     % \begin{tabular}{c@{\hskip 0.04in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.2in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.2in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c}
%     \begin{tabular}{c
%                     c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c 
%                     c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c 
%                     c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c
%                     c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c}
%         \toprule
%         \multirow{3}{*}{\textbf{Model}} & \multicolumn{4}{c}{\textbf{CiteULike-a}} & \multicolumn{4}{c}{\textbf{Cell Phones}} & \multicolumn{4}{c}{\textbf{Video Games}} & \multicolumn{4}{c}{\textbf{MovieLens}}\\
%         \cmidrule(lr){2-5}\cmidrule(lr){6-9}\cmidrule(lr){10-13}\cmidrule(lr){14-17}
%         % & Recall & Recall & NDCG & NDCG & Recall & Recall & NDCG & NDCG & Recall & Recall & NDCG & NDCG & Recall & Recall & NDCG & NDCG\\
%         & R@10 & R@50 & N@10 & N@50 & R@10 & R@50 & N@10 & N@50 & R@10 & R@50 & N@10 & N@50 & R@10 & R@50 & N@10 & N@50\\
%         % & @10 & @50 & @10 & @50 & @10 & @50 & @10 & @50 & @10 & @50 & @10 & @50 & @10 & @50 & @10 & @50\\
%         \midrule
%         MDCVAE & 22.43 & 38.72 & 20.97 & 26.45 & 4.34 & 9.60 & 3.38 & 4.87 & 5.90 & 14.21 & 3.84 & 5.98 & 14.03 & 29.75 & 11.98 & 18.13\\
%         TopicVAE & 17.00 & 37.78 & 17.54 & 23.84 & 5.31 & 11.59 & 4.23 & 6.00 & - & - & - & - & 14.27 & 31.90 & 13.01 & 19.54\\
%         RecVAE & 21.46 & 38.39 & 22.43 & 27.27 & 3.77 & 8.79 & 2.92 & 4.34 & 6.93 & 18.02 & 4.33 & 7.15 & \textbf{14.45} & 32.78 & 13.02 & \underline{19.80}\\
%         MacridVAE & 21.92 & 43.00 & 22.95 & 29.21 & 5.82 & 11.96 & 4.84 & 6.58 & 7.95 & 20.02 & 5.14 & 8.22 & 14.25 & 32.28 & 12.74 & 19.49\\
%         SEM-MacridVAE & 22.25 & 42.52 & 23.42 & 29.41 & 5.13 & 10.91 & 4.23 & 5.88 & 6.82 & 17.30 & 4.31 & 7.01 & 14.17 & 31.59 & \textbf{13.36} & 19.77\\
%         ADDVAE & 23.44 & \underline{43.89} & 24.12 & 30.23 & 5.76 & 11.96 & 4.90 & 6.65 & 8.09 & 20.11 & 5.21 & 8.30 & 14.01 & \underline{32.95} & 12.62 & 19.63\\
%         VALID & 22.50 & 43.44 & 23.24 & 29.43 & \underline{6.18} & \underline{12.61} & \underline{5.21} & \underline{7.01} & \underline{8.50} & \underline{20.61} & \underline{5.43} & \underline{8.60} & 14.22 & 31.91 & 12.99 & 19.60\\
%         FacetVAE & \underline{23.53} & 43.85 & \textbf{24.68} & \underline{30.43} & 5.52 & 11.60 & 4.53 & 6.25 & 7.64 & 19.50 & 4.92 & 7.96 & 13.97 & 31.89 & 12.68 & 19.33\\
%         \midrule
%         \ourmethod & $\textbf{24.10}^\star$ & $\textbf{45.26}^\star$ & $\textbf{24.68}$ & $\textbf{30.93}^\star$ & $\textbf{6.63}^\star$ & $\textbf{13.65}^\star$ & $\textbf{5.35}^\star$ & $\textbf{7.35}^\star$ & $\textbf{8.78}^\star$ & $\textbf{21.39}^\star$ & $\textbf{5.63}^\star$ & $\textbf{8.86}^\star$ & \underline{14.36} & $\textbf{33.22}^\star$ & \underline{13.08} & $\textbf{20.05}^\star$\\
%         \bottomrule
%     \end{tabular}
%     }
% \end{table*}


% \begin{table*}
%     \centering
%     % \small
%     \caption{Recommendation performance comparison. The highest results are boldfaced while the runners-up are underlined. Units of numbers are percentage (\%). All models are trained ten times with different random seeds. Reported numbers are averaged over ten runs. $^\star$ denotes statistical significance on a paired t-test with $\text{p-value} < 0.05$. }
%     % On MovieLens, where models' performance vary, \ourmethod's numbers are statistically significant on some metrics, e.g., the statistically significant gap between \ourmethod\ and ADDVAE on R@10, N@10 and N@50.\looseness=-1}
%     \label{tab:recom_result}
%     \scalebox{0.9}{
%     % \begin{tabular}{c@{\hskip 0.04in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.2in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.2in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c}
%     \begin{tabular}{c
%                     c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c 
%                     c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c 
%                     c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c
%                     c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c}
%         \toprule
%         \multirow{3}{*}{\textbf{Model}} & \multicolumn{4}{c}{\textbf{CiteULike-a}} & \multicolumn{4}{c}{\textbf{Cell Phones}} & \multicolumn{4}{c}{\textbf{Video Games}} & \multicolumn{4}{c}{\textbf{MovieLens}}\\
%         \cmidrule(lr){2-5}\cmidrule(lr){6-9}\cmidrule(lr){10-13}\cmidrule(lr){14-17}
%         % & Recall & Recall & NDCG & NDCG & Recall & Recall & NDCG & NDCG & Recall & Recall & NDCG & NDCG & Recall & Recall & NDCG & NDCG\\
%         & R@10 & R@50 & N@10 & N@50 & R@10 & R@50 & N@10 & N@50 & R@10 & R@50 & N@10 & N@50 & R@10 & R@50 & N@10 & N@50\\
%         % & @10 & @50 & @10 & @50 & @10 & @50 & @10 & @50 & @10 & @50 & @10 & @50 & @10 & @50 & @10 & @50\\
%         \midrule
%         MDCVAE & 22.43 & 38.72 & 20.97 & 26.45 & 4.34 & 9.60 & 3.38 & 4.87 & 5.90 & 14.21 & 3.84 & 5.98 & 14.03 & 29.75 & 11.98 & 18.13\\
%         TopicVAE & 17.00 & 37.78 & 17.54 & 23.84 & 5.31 & 11.59 & 4.23 & 6.00 & - & - & - & - & 14.27 & 31.90 & 13.01 & 19.54\\
%         RecVAE & 21.46 & 38.39 & 22.43 & 27.27 & 3.77 & 8.79 & 2.92 & 4.34 & 6.93 & 18.02 & 4.33 & 7.15 & \textbf{14.45} & 32.78 & 13.02 & \underline{19.80}\\
%         MacridVAE & 21.92 & 43.00 & 22.95 & 29.21 & 5.82 & 11.96 & 4.84 & 6.58 & 7.95 & 20.02 & 5.14 & 8.22 & 14.25 & 32.28 & 12.74 & 19.49\\
%         SEM-MacridVAE & 22.25 & 42.52 & 23.42 & 29.41 & 5.13 & 10.91 & 4.23 & 5.88 & 6.82 & 17.30 & 4.31 & 7.01 & 14.17 & 31.59 & \textbf{13.36} & 19.77\\
%         ADDVAE & 23.44 & \underline{43.89} & 24.12 & 30.23 & 5.76 & 11.96 & 4.90 & 6.65 & 8.09 & 20.11 & 5.21 & 8.30 & 14.01 & \underline{32.95} & 12.62 & 19.63\\
%         VALID & 22.50 & 43.44 & 23.24 & 29.43 & \underline{6.18} & \underline{12.61} & \underline{5.21} & \underline{7.01} & \underline{8.50} & \underline{20.61} & \underline{5.43} & \underline{8.60} & 14.22 & 31.91 & 12.99 & 19.60\\
%         FacetVAE & \underline{23.53} & 43.85 & \textbf{24.68} & \underline{30.43} & 5.52 & 11.60 & 4.53 & 6.25 & 7.64 & 19.50 & 4.92 & 7.96 & 13.97 & 31.89 & 12.68 & 19.33\\
%         \midrule
%         \ourmethod & $\textbf{24.10}^\star$ & $\textbf{45.26}^\star$ & $\textbf{24.68}$ & $\textbf{30.93}^\star$ & $\textbf{6.63}^\star$ & $\textbf{13.65}^\star$ & $\textbf{5.35}^\star$ & $\textbf{7.35}^\star$ & $\textbf{8.78}^\star$ & $\textbf{21.39}^\star$ & $\textbf{5.63}^\star$ & $\textbf{8.86}^\star$ & \underline{14.36} & $\textbf{33.22}^\star$ & \underline{13.08} & $\textbf{20.05}^\star$\\
%         \bottomrule
%     \end{tabular}
%     }
% \end{table*}

% TKDE version
% Main recommendation-performance table.
% The float stacks two tabulars that share one caption and label: the upper
% one reports the @10 cut-offs (R@10 / N@10) and the lower one the @50 cut-offs
% (R@50 / N@50), each over the same four datasets.
% Every baseline cell carries a blue superscript giving \ourmethod's relative
% change with respect to that cell (negative where the baseline is better).
\begin{table*}[t]
    \centering
    \caption{Recommendation performance comparison. The highest results are boldfaced while the runners-up are underlined. Reported numbers are percentages averaged over ten runs. Blue superscripts denote \ourmethod's relative improvements over the baselines. $^\star$ denotes statistical significance on a paired t-test with $\text{p-value} < 5 \times 10^{-2}$.}
    \label{tab:recom_result}
    % The trailing `%' after the opening brace and after \end{tabular} keeps the
    % line ends from becoming spurious spaces inside the scaled box.
    \scalebox{1}{%
    \begin{tabular}{l
                    l@{\hskip 0.1in}l
                    l@{\hskip 0.1in}l
                    l@{\hskip 0.1in}l
                    l@{\hskip 0.1in}l}
        \toprule
        \multirow{2}{*}{\textbf{Model}} & \multicolumn{2}{c}{\textbf{CiteULike-a}} & \multicolumn{2}{c}{\textbf{Cell Phones}} & \multicolumn{2}{c}{\textbf{Video Games}} & \multicolumn{2}{c}{\textbf{MovieLens}}\\
        \cmidrule(lr){2-3}\cmidrule(lr){4-5}\cmidrule(lr){6-7}\cmidrule(lr){8-9}
        & R@10 & N@10 & R@10 & N@10 & R@10 & N@10 & R@10 & N@10\\
        \midrule
        MDCVAE & 22.43$^{\textcolor{blue}{+7.8\%}}$ & 20.97$^{\textcolor{blue}{+17.8\%}}$ & 4.34$^{\textcolor{blue}{+53.5\%}}$ & 3.38$^{\textcolor{blue}{+58.3\%}}$ & 5.90$^{\textcolor{blue}{+51.2\%}}$ & 3.84$^{\textcolor{blue}{+50.0\%}}$ & 14.03$^{\textcolor{blue}{+2.4\%}}$ & 11.98$^{\textcolor{blue}{+9.7\%}}$\\
        TopicVAE & 17.00$^{\textcolor{blue}{+42.2\%}}$ & 17.54$^{\textcolor{blue}{+40.8\%}}$ & 5.31$^{\textcolor{blue}{+25.4\%}}$ & 4.23$^{\textcolor{blue}{+26.5\%}}$ & 6.87$^{\textcolor{blue}{+29.8\%}}$ & 4.37$^{\textcolor{blue}{+31.8\%}}$ & 14.27$^{\textcolor{blue}{+0.6\%}}$ & 13.01$^{\textcolor{blue}{+1.0\%}}$\\
        RecVAE & 21.46$^{\textcolor{blue}{+12.6\%}}$ & 22.43$^{\textcolor{blue}{+10.1\%}}$ & 3.77$^{\textcolor{blue}{+76.7\%}}$ & 2.92$^{\textcolor{blue}{+83.2\%}}$ & 6.93$^{\textcolor{blue}{+28.7\%}}$ & 4.33$^{\textcolor{blue}{+33.0\%}}$ & \textbf{14.45}$^{\textcolor{blue}{-0.6\%}}$ & 13.02$^{\textcolor{blue}{+0.9\%}}$\\
        MacridVAE & 21.92$^{\textcolor{blue}{+10.3\%}}$ & 22.95$^{\textcolor{blue}{+7.6\%}}$ & 5.82$^{\textcolor{blue}{+14.4\%}}$ & 4.84$^{\textcolor{blue}{+10.5\%}}$ & 7.95$^{\textcolor{blue}{+12.2\%}}$ & 5.14$^{\textcolor{blue}{+12.1\%}}$ & 14.25$^{\textcolor{blue}{+0.8\%}}$ & 12.74$^{\textcolor{blue}{+3.1\%}}$\\
        SEM-MacridVAE & 22.91$^{\textcolor{blue}{+5.5\%}}$ & 23.85$^{\textcolor{blue}{+3.6\%}}$ & 5.39$^{\textcolor{blue}{+23.6\%}}$ & 4.32$^{\textcolor{blue}{+23.8\%}}$ & 7.61$^{\textcolor{blue}{+17.2\%}}$ & 4.87$^{\textcolor{blue}{+18.3\%}}$ & 14.17$^{\textcolor{blue}{+1.3\%}}$ & \textbf{13.36}$^{\textcolor{blue}{-1.6\%}}$\\
        ADDVAE & 23.44$^{\textcolor{blue}{+3.1\%}}$ & 24.12$^{\textcolor{blue}{+2.4\%}}$ & 5.76$^{\textcolor{blue}{+15.6\%}}$ & 4.90$^{\textcolor{blue}{+9.2\%}}$ & 8.09$^{\textcolor{blue}{+10.3\%}}$ & 5.21$^{\textcolor{blue}{+10.6\%}}$ & 14.01$^{\textcolor{blue}{+2.5\%}}$ & 12.62$^{\textcolor{blue}{+4.1\%}}$\\
        ELSA & 21.23$^{\textcolor{blue}{+13.8\%}}$ & 22.25$^{\textcolor{blue}{+11.0\%}}$ & \underline{6.21}$^{\textcolor{blue}{+7.2\%}}$ & 4.75$^{\textcolor{blue}{+12.6\%}}$ & 7.39$^{\textcolor{blue}{+20.7\%}}$ & 4.63$^{\textcolor{blue}{+24.4\%}}$ & 13.35$^{\textcolor{blue}{+7.6\%}}$ & 12.26$^{\textcolor{blue}{+7.2\%}}$\\
        VALID & 22.50$^{\textcolor{blue}{+7.4\%}}$ & 23.24$^{\textcolor{blue}{+6.3\%}}$ & 6.18$^{\textcolor{blue}{+7.8\%}}$ & \underline{5.21}$^{\textcolor{blue}{+2.7\%}}$ & \underline{8.48}$^{\textcolor{blue}{+5.2\%}}$ & \underline{5.39}$^{\textcolor{blue}{+6.9\%}}$ & 14.22$^{\textcolor{blue}{+1.0\%}}$ & 12.99$^{\textcolor{blue}{+1.2\%}}$\\
        FacetVAE & \underline{23.53}$^{\textcolor{blue}{+2.7\%}}$ & \underline{24.68}$^{\textcolor{blue}{+0.1\%}}$ & 5.52$^{\textcolor{blue}{+20.7\%}}$ & 4.53$^{\textcolor{blue}{+18.1\%}}$ & 7.64$^{\textcolor{blue}{+16.8\%}}$ & 4.92$^{\textcolor{blue}{+17.1\%}}$ & 13.97$^{\textcolor{blue}{+2.8\%}}$ & 12.68$^{\textcolor{blue}{+3.6\%}}$\\
        \midrule
        % A star is attached only where the p-value in the row below is under 5e-2.
        \ourmethod & $\textbf{24.17}^\star$ & $\textbf{24.70}$ & $\textbf{6.66}^\star$ & $\textbf{5.35}^\star$ & $\textbf{8.92}^\star$ & $\textbf{5.76}^\star$ & \underline{14.36} & \underline{13.14}\\
        p-value & $2.2 \times 10^{-4}$ & $7.7 \times 10^{-1}$ & $6.6 \times 10^{-5}$ & $3.2 \times 10^{-2}$ & $6.6 \times 10^{-4}$ & $1.1 \times 10^{-4}$ & $4.4 \times 10^{-1}$ & $5.9 \times 10^{-2}$\\
        \bottomrule
    \end{tabular}%
    }
    
    % Lower half: same layout for the @50 cut-offs, scaled slightly down.
    \scalebox{0.97}{%
    \begin{tabular}{l
                    l@{\hskip 0.1in}l
                    l@{\hskip 0.1in}l
                    l@{\hskip 0.1in}l
                    l@{\hskip 0.1in}l}
        \toprule
        \multirow{2}{*}{\textbf{Model}} & \multicolumn{2}{c}{\textbf{CiteULike-a}} & \multicolumn{2}{c}{\textbf{Cell Phones}} & \multicolumn{2}{c}{\textbf{Video Games}} & \multicolumn{2}{c}{\textbf{MovieLens}}\\
        \cmidrule(lr){2-3}\cmidrule(lr){4-5}\cmidrule(lr){6-7}\cmidrule(lr){8-9}
        & R@50 & N@50 & R@50 & N@50 & R@50 & N@50 & R@50 & N@50\\
        \midrule
        MDCVAE & 38.72$^{\textcolor{blue}{+17.1\%}}$ & 26.45$^{\textcolor{blue}{+17.0\%}}$ & 9.60$^{\textcolor{blue}{+42.4\%}}$ & 4.87$^{\textcolor{blue}{+50.9\%}}$ & 14.21$^{\textcolor{blue}{+51.9\%}}$ & 5.98$^{\textcolor{blue}{+50.5\%}}$ & 29.75$^{\textcolor{blue}{+11.5\%}}$ & 18.13$^{\textcolor{blue}{+10.8\%}}$\\
        TopicVAE & 37.78$^{\textcolor{blue}{+20.1\%}}$ & 23.84$^{\textcolor{blue}{+29.8\%}}$ & 11.59$^{\textcolor{blue}{+17.9\%}}$ & 6.00$^{\textcolor{blue}{+22.5\%}}$ & 17.94$^{\textcolor{blue}{+20.3\%}}$ & 7.22$^{\textcolor{blue}{+24.7\%}}$ & 31.90$^{\textcolor{blue}{+4.0\%}}$ & 19.54$^{\textcolor{blue}{+2.8\%}}$\\
        RecVAE & 38.39$^{\textcolor{blue}{+18.2\%}}$ & 27.27$^{\textcolor{blue}{+13.5\%}}$ & 8.79$^{\textcolor{blue}{+55.5\%}}$ & 4.34$^{\textcolor{blue}{+69.4\%}}$ & 18.02$^{\textcolor{blue}{+19.8\%}}$ & 7.15$^{\textcolor{blue}{+25.9\%}}$ & 32.78$^{\textcolor{blue}{+1.2\%}}$ & \underline{19.80}$^{\textcolor{blue}{+1.5\%}}$\\
        MacridVAE & 43.00$^{\textcolor{blue}{+5.5\%}}$ & 29.21$^{\textcolor{blue}{+5.9\%}}$ & 11.96$^{\textcolor{blue}{+14.3\%}}$ & 6.58$^{\textcolor{blue}{+11.7\%}}$ & 20.02$^{\textcolor{blue}{+7.8\%}}$ & 8.22$^{\textcolor{blue}{+9.5\%}}$ & 32.28$^{\textcolor{blue}{+2.8\%}}$ & 19.49$^{\textcolor{blue}{+3.1\%}}$\\
        SEM-MacridVAE & 43.14$^{\textcolor{blue}{+5.1\%}}$ & 29.87$^{\textcolor{blue}{+3.6\%}}$ & 11.75$^{\textcolor{blue}{+16.3\%}}$ & 6.12$^{\textcolor{blue}{+20.1\%}}$ & 19.01$^{\textcolor{blue}{+13.5\%}}$ & 7.80$^{\textcolor{blue}{+15.4\%}}$ & 31.59$^{\textcolor{blue}{+5.0\%}}$ & 19.77$^{\textcolor{blue}{+1.6\%}}$\\
        ADDVAE & \underline{43.89}$^{\textcolor{blue}{+3.3\%}}$ & 30.23$^{\textcolor{blue}{+2.3\%}}$ & 11.96$^{\textcolor{blue}{+14.3\%}}$ & 6.65$^{\textcolor{blue}{+10.5\%}}$ & 20.11$^{\textcolor{blue}{+7.3\%}}$ & 8.30$^{\textcolor{blue}{+8.4\%}}$ & \underline{32.95}$^{\textcolor{blue}{+0.7\%}}$ & 19.63$^{\textcolor{blue}{+2.3\%}}$\\
        ELSA & 41.20$^{\textcolor{blue}{+10.1\%}}$ & 28.32$^{\textcolor{blue}{+9.3\%}}$ & \underline{13.05}$^{\textcolor{blue}{+4.8\%}}$ & 6.72$^{\textcolor{blue}{+9.4\%}}$ & 19.91$^{\textcolor{blue}{+8.4\%}}$ & 7.81$^{\textcolor{blue}{+15.2\%}}$ & 31.95$^{\textcolor{blue}{+3.8\%}}$ & 19.13$^{\textcolor{blue}{+5.0\%}}$\\
        VALID & 43.44$^{\textcolor{blue}{+4.4\%}}$ & 29.43$^{\textcolor{blue}{+5.1\%}}$ & 12.61$^{\textcolor{blue}{+8.4\%}}$ & \underline{7.01}$^{\textcolor{blue}{+4.9\%}}$ & \underline{20.61}$^{\textcolor{blue}{+4.7\%}}$ & \underline{8.56}$^{\textcolor{blue}{+5.1\%}}$ & 31.91$^{\textcolor{blue}{+4.0\%}}$ & 19.60$^{\textcolor{blue}{+2.5\%}}$\\
        FacetVAE & 43.85$^{\textcolor{blue}{+3.4\%}}$ & \underline{30.43}$^{\textcolor{blue}{+1.7\%}}$ & 11.60$^{\textcolor{blue}{+17.8\%}}$ & 6.25$^{\textcolor{blue}{+17.6\%}}$ & 19.50$^{\textcolor{blue}{+10.7\%}}$ & 7.96$^{\textcolor{blue}{+13.1\%}}$ & 31.89$^{\textcolor{blue}{+4.0\%}}$ & 19.33$^{\textcolor{blue}{+3.9\%}}$\\
        \midrule
        \ourmethod & $\textbf{45.36}^\star$ & $\textbf{30.94}^\star$ & $\textbf{13.67}^\star$ & $\textbf{7.35}^\star$ & $\textbf{21.58}^\star$ & $\textbf{9.00}^\star$ & $\textbf{33.18}^\star$ & $\textbf{20.09}^\star$\\
        p-value & $2.5 \times 10^{-3}$ & $7.8 \times 10^{-3}$ & $2.8 \times 10^{-3}$ & $2.3 \times 10^{-4}$ & $2.8 \times 10^{-6}$ & $1.1 \times 10^{-8}$ & $3.8 \times 10^{-2}$ & $3.2 \times 10^{-2}$\\
        \bottomrule
    \end{tabular}%
    }
\end{table*}
% Sixteen-column layout of the recommendation results: all four metrics
% (R@10, R@50, N@10, N@50) side by side for each of the four datasets.
% NOTE(review): the numbers here differ from the table labelled
% tab:recom_result (e.g. \ourmethod's R@10 on CiteULike-a is 24.10 here and
% 24.17 there), and this layout matches the commented-out drafts earlier in the
% file -- confirm whether this float is still meant to be typeset.
\begin{table*}
    \centering
    % \small
    \caption{Recommendation performance comparison. The highest results are boldfaced while the runners-up are underlined. Units of numbers are percentage (\%). All models are trained ten times with different random seeds. Reported numbers are averaged over ten runs. $^\star$ denotes statistical significance on a paired t-test with $\text{p-value} < 0.05$. }
    % On MovieLens, where models' performance vary, \ourmethod's numbers are statistically significant on some metrics, e.g., the statistically significant gap between \ourmethod\ and ADDVAE on R@10, N@10 and N@50.\looseness=-1}
    % This label used to be tab:recom_result, which the preceding table already
    % defines; the clash made LaTeX report a multiply-defined label. A distinct
    % key lets \ref{tab:recom_result} resolve to the preceding table only.
    \label{tab:recom_result_full}
    % The trailing `%' after the opening brace and after \end{tabular} keeps the
    % line ends from becoming spurious spaces inside the scaled box.
    \scalebox{0.9}{%
    % \begin{tabular}{c@{\hskip 0.04in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.2in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.2in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c}
    \begin{tabular}{c
                    c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c
                    c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c
                    c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c
                    c@{\hskip 0.03in}c@{\hskip 0.03in}c@{\hskip 0.03in}c}
        \toprule
        % The header has two live rows (dataset names, then metric names), so
        % the Model cell spans two rows.
        \multirow{2}{*}{\textbf{Model}} & \multicolumn{4}{c}{\textbf{CiteULike-a}} & \multicolumn{4}{c}{\textbf{Cell Phones}} & \multicolumn{4}{c}{\textbf{Video Games}} & \multicolumn{4}{c}{\textbf{MovieLens}}\\
        \cmidrule(lr){2-5}\cmidrule(lr){6-9}\cmidrule(lr){10-13}\cmidrule(lr){14-17}
        % & Recall & Recall & NDCG & NDCG & Recall & Recall & NDCG & NDCG & Recall & Recall & NDCG & NDCG & Recall & Recall & NDCG & NDCG\\
        & R@10 & R@50 & N@10 & N@50 & R@10 & R@50 & N@10 & N@50 & R@10 & R@50 & N@10 & N@50 & R@10 & R@50 & N@10 & N@50\\
        % & @10 & @50 & @10 & @50 & @10 & @50 & @10 & @50 & @10 & @50 & @10 & @50 & @10 & @50 & @10 & @50\\
        \midrule
        MDCVAE & 22.43 & 38.72 & 20.97 & 26.45 & 4.34 & 9.60 & 3.38 & 4.87 & 5.90 & 14.21 & 3.84 & 5.98 & 14.03 & 29.75 & 11.98 & 18.13\\
        TopicVAE & 17.00 & 37.78 & 17.54 & 23.84 & 5.31 & 11.59 & 4.23 & 6.00 & - & - & - & - & 14.27 & 31.90 & 13.01 & 19.54\\
        RecVAE & 21.46 & 38.39 & 22.43 & 27.27 & 3.77 & 8.79 & 2.92 & 4.34 & 6.93 & 18.02 & 4.33 & 7.15 & \textbf{14.45} & 32.78 & 13.02 & \underline{19.80}\\
        MacridVAE & 21.92 & 43.00 & 22.95 & 29.21 & 5.82 & 11.96 & 4.84 & 6.58 & 7.95 & 20.02 & 5.14 & 8.22 & 14.25 & 32.28 & 12.74 & 19.49\\
        SEM-MacridVAE & 22.25 & 42.52 & 23.42 & 29.41 & 5.13 & 10.91 & 4.23 & 5.88 & 6.82 & 17.30 & 4.31 & 7.01 & 14.17 & 31.59 & \textbf{13.36} & 19.77\\
        ADDVAE & 23.44 & \underline{43.89} & 24.12 & 30.23 & 5.76 & 11.96 & 4.90 & 6.65 & 8.09 & 20.11 & 5.21 & 8.30 & 14.01 & \underline{32.95} & 12.62 & 19.63\\
        VALID & 22.50 & 43.44 & 23.24 & 29.43 & \underline{6.18} & \underline{12.61} & \underline{5.21} & \underline{7.01} & \underline{8.50} & \underline{20.61} & \underline{5.43} & \underline{8.60} & 14.22 & 31.91 & 12.99 & 19.60\\
        FacetVAE & \underline{23.53} & 43.85 & \textbf{24.68} & \underline{30.43} & 5.52 & 11.60 & 4.53 & 6.25 & 7.64 & 19.50 & 4.92 & 7.96 & 13.97 & 31.89 & 12.68 & 19.33\\
        \midrule
        \ourmethod & $\textbf{24.10}^\star$ & $\textbf{45.26}^\star$ & $\textbf{24.68}$ & $\textbf{30.93}^\star$ & $\textbf{6.63}^\star$ & $\textbf{13.65}^\star$ & $\textbf{5.35}^\star$ & $\textbf{7.35}^\star$ & $\textbf{8.78}^\star$ & $\textbf{21.39}^\star$ & $\textbf{5.63}^\star$ & $\textbf{8.86}^\star$ & \underline{14.36} & $\textbf{33.22}^\star$ & \underline{13.08} & $\textbf{20.05}^\star$\\
        \bottomrule
    \end{tabular}%
    }
\end{table*}
