% Please add the following required packages to your document preamble:
% \usepackage{booktabs}
% \usepackage{float}  % provides the [H] placement specifier used by this table
% Per-language breakdown of the TTS training data (speech hours and token counts).
% The [H] placement specifier is provided by the float package, which must be
% loaded in the preamble in addition to booktabs.
\begin{table}[H]
  \centering
  \caption{TTS training data of text-to-token LLM with 12.5\,Hz speech tokenizer. Tokens measured in billions.}
  \label{tab:tts-breakdown}
  % Text column is left-aligned and numeric columns are right-aligned so that
  % digits line up; @{} strips the outer column padding so the booktabs rules
  % end flush with the table content.
  \begin{tabular}{@{}lrrrr@{}}
    \toprule
    Language & Speech Hours & Speech Tokens & Text Tokens & Total Tokens \\
    \midrule
    Chinese & 94,980 & 4.27B & 1.18B & 5.45B \\
    % NOTE(review): the rounded parts sum to 2.48B (1.92 + 0.56); the 2.49B
    % total presumably comes from unrounded counts -- confirm against the data.
    English & 42,726 & 1.92B & 0.56B & 2.49B \\
    \bottomrule
  \end{tabular}
\end{table}