% Two side-by-side tables in one full-width float: IPUMS on the left,
% Criteo on the right. Each compares training without the regularization
% term ($w_R = 0$) against the best weight $w_R$ found in the search set $W$,
% for the PLWFA and BLWFA column groups and several bag sizes.
\begin{table*}[ht]
\captionsetup{font=small,labelfont=small}
% ---- Left half: IPUMS ----
\begin{minipage}{0.48\textwidth}
\centering
\caption{Effect of adding the regularization term $\mathcal{R}(h, \mathcal{S}, \mathcal{T})$ to the loss on performance for the IPUMS dataset. So that the extra regularization term has a significant impact, the hyperparameter search for its weight $w_R$ is done over the range $W = \{10^{-5}, 5\times 10^{-5}, 10^{-4}, 5\times 10^{-4}, 10^{-3}, 5\times 10^{-3}, 10^{-2}\}$.}
\label{tab:reg_term_train_ipums}
\scriptsize
% No vertical rules: booktabs rules add vertical padding that would leave
% gaps in them. Column groups are marked with trimmed \cmidrule's instead.
\begin{tabular}{lrrrr}
\toprule
% NOTE(review): the corner header reads "Dataset" although PLWFA/BLWFA look
% like method names -- confirm the intended label.
Dataset &\multicolumn{2}{c}{PLWFA} &\multicolumn{2}{c}{BLWFA} \\
\cmidrule(lr){2-3}\cmidrule(lr){4-5}
\diagbox{\textbfne{Bag Size}}{\textbfne{Method}} &$w_R = 0$ &best $w_R \in W$ &$w_R = 0$ &best $w_R \in W$ \\
\midrule
8 &1.15 $\pm$ 0.00 &1.23 $\pm$ 0.01 &1.14 $\pm$ 0.00 &1.23 $\pm$ 0.01 \\
32 &1.18 $\pm$ 0.00 &1.32 $\pm$ 0.02 &1.16 $\pm$ 0.00 &1.32 $\pm$ 0.02 \\
128 &1.25 $\pm$ 0.01 &1.38 $\pm$ 0.03 &1.22 $\pm$ 0.00 &1.38 $\pm$ 0.03 \\
256 &1.29 $\pm$ 0.01 &1.42 $\pm$ 0.02 &1.25 $\pm$ 0.01 &1.42 $\pm$ 0.02 \\
\bottomrule
\end{tabular}
\end{minipage}
\hfill
% ---- Right half: Criteo ----
\begin{minipage}{0.48\textwidth}
\centering
\caption{Effect of adding the regularization term $\mathcal{R}(h, \mathcal{S}, \mathcal{T})$ to the loss on performance for the Criteo dataset. So that the extra regularization term has a significant impact, the hyperparameter search for its weight $w_R$ is done over the range $W = \{10^{-5}, 5\times 10^{-5}, 10^{-4}, 5\times 10^{-4}, 10^{-3}, 5\times 10^{-3}, 10^{-2}\}$.}
\label{tab:reg_term_train_criteo}
\scriptsize
% Same layout as the IPUMS table so the two halves read consistently.
\begin{tabular}{lrrrr}
\toprule
% NOTE(review): the corner header reads "Dataset" although PLWFA/BLWFA look
% like method names -- confirm the intended label.
Dataset &\multicolumn{2}{c}{PLWFA} &\multicolumn{2}{c}{BLWFA} \\
\cmidrule(lr){2-3}\cmidrule(lr){4-5}
\diagbox{\textbfne{Bag Size}}{\textbfne{Method}} &$w_R = 0$ &best $w_R \in W$ &$w_R = 0$ &best $w_R \in W$ \\
\midrule
64 &204.71 $\pm$ 2.6 &256.11 $\pm$ 4.45 &204.62 $\pm$ 2.4 &255.23 $\pm$ 4.57 \\
128 &226.39 $\pm$ 2.9 &264.97 $\pm$ 3.61 &226.33 $\pm$ 2.9 &264.45 $\pm$ 3.50 \\
256 &240.55 $\pm$ 3.3 &279.45 $\pm$ 2.06 &240.39 $\pm$ 3.2 &279.48 $\pm$ 2.06 \\
512 &254.46 $\pm$ 5.5 &291.38 $\pm$ 2.44 &254.36 $\pm$ 5.5 &290.96 $\pm$ 2.46 \\
\bottomrule
\end{tabular}
\end{minipage}
\end{table*}

