% Auto-generated significance vs random_25
% Table: paired comparison of each method against the random_25 baseline.
% Columns: number of pairs (N), mean Delta-Q, p-value, and Cohen's d.
% Method identifiers contain underscores, which must be written as \_ in text
% mode (a bare _ outside math raises "Missing $ inserted").
% Signed values are set in math mode so the sign renders as a true minus
% rather than a text hyphen.
% NOTE(review): an exact two-tailed sign-flip test with N=12 has 2^12 = 4096
% sign assignments, so its smallest attainable p is 2/4096 (about 0.0005).
% The 0.0002 entry presumably comes from Monte Carlo resampling -- confirm
% against the generating script.
\begin{table}[t]
\floatconts{tab:significance}{\caption{Paired significance vs random\_25 baseline (two-tailed sign-flip test); $N$=pairs per method.}}{
\begin{tabular}{lcccc}
\toprule
Method & $N$ & $\Delta Q$ (mean) & $p$-value & Cohen's $d$ \\
\midrule
hybrid\_no\_silence\_prompt\_proxy & 12 & $-0.184$ & 0.0008 & $-1.46$ \\
hybrid\_ours & 12 & $-0.003$ & 0.9300 & $-0.02$ \\
phrase\_boundary & 12 & $-0.068$ & 0.0862 & $-0.54$ \\
random\_10 & 12 & $-0.388$ & 0.0002 & $-3.03$ \\
tension\_only & 12 & $-0.325$ & 0.0006 & $-2.22$ \\
weak\_beats & 12 & $-0.389$ & 0.0005 & $-3.28$ \\
\bottomrule
\end{tabular}
}
\end{table}