\begin{table*}[ht]
\centering
\caption{Test accuracy comparison (\%). Results are averaged over the last 5 rounds; higher is better, and the best result in each row is shown in bold.}
\label{tab:comparison_acc}
\begin{tabular}{|l|c|c|c|c|c|c|}
\hline
\textbf{Dataset} & {\boldmath$\alpha$} & \textbf{FedAvg} & \textbf{FedProx} & \textbf{FedSophia} & \textbf{FedNew} & \textbf{FedNewton} \\ \hline
\multirow{3}{*}{\textbf{MNIST}} & 0.1 & 85.27 & 85.49 & 89.37 & 89.30 & \textbf{94.50} \\
 & 0.5 & 93.60 & 93.56 & 93.82 & 93.78 & \textbf{97.82} \\
 & 10 & 94.79 & 94.71 & 94.37 & 94.32 & \textbf{97.86} \\
\hline
\multirow{3}{*}{\textbf{Fashion-MNIST}} & 0.1 & 76.36 & 76.81 & 77.62 & 77.89 & \textbf{82.32} \\
 & 0.5 & 84.41 & 84.38 & 84.90 & 84.86 & \textbf{89.11} \\
 & 10 & 86.52 & 86.44 & 86.38 & 86.31 & \textbf{89.24} \\
\hline
\multirow{3}{*}{\textbf{CIFAR-10}} & 0.1 & 77.98 & 78.14 & 80.87 & 81.04 & \textbf{86.35} \\
 & 0.5 & 83.35 & 83.33 & 83.68 & 83.60 & \textbf{87.51} \\
 & 10 & 85.22 & 85.17 & 84.83 & 84.75 & \textbf{87.93} \\
\hline
\end{tabular}
\end{table*}

\begin{table*}[ht]
\centering
\caption{Comparison of average training time per round (seconds) and peak GPU memory usage (MB). Results are averaged across all $\alpha$ settings. Lower is better.}
\label{tab:resources}
\begin{tabular}{|l|c|c|c|c|c|c|}
\hline
\textbf{Dataset} & \textbf{Metric} & \textbf{FedAvg} & \textbf{FedProx} & \textbf{FedSophia} & \textbf{FedNew} & \textbf{FedNewton} \\ \hline
\multirow{2}{*}{\textbf{MNIST}} & Time (s) & 57.89 & 55.71 & 54.15 & \textbf{53.34} & 69.05 \\
 & GPU (MB) & 1507.91 & 1507.85 & 1508.08 & 1508.08 & \textbf{1463.39} \\ \hline
\multirow{2}{*}{\textbf{Fashion-MNIST}} & Time (s) & 55.91 & 53.97 & \textbf{53.29} & 53.39 & 68.96 \\
 & GPU (MB) & 1507.91 & 1507.78 & 1508.08 & 1508.08 & \textbf{1463.39} \\ \hline
\multirow{2}{*}{\textbf{CIFAR-10}} & Time (s) & 68.60 & 65.57 & 55.62 & \textbf{52.18} & 90.18 \\
 & GPU (MB) & 1482.33 & 1482.33 & 1482.45 & 1482.45 & \textbf{1438.89} \\ \hline
\end{tabular}
\end{table*}

