\begin{table}[t]
  \centering
  \small
  \setlength{\tabcolsep}{6pt}
  \begin{tabular}{llllll}
    \toprule
    Model & Family & Size (B) & Tokens (T) & FLOPs (1E21) & OpenLLM metric \\
    \midrule
    baichuan-inc/Baichuan-7B & Baichuan & — & 1.20 & — & No \\
    baichuan-inc/Baichuan2-7B-Base & Baichuan & 7 & 2.60 & 109.20 & No \\
    baichuan-inc/Baichuan2-7B-Chat & Baichuan & 7 & 2.60 & 109.20 & No \\
    deepseek-ai/DeepSeek-V3 & DeepSeek & 684.5 & 14.80 & 60783.60 & No \\
    deepseek-ai/deepseek-coder-1.3b-base & DeepSeek-Coder & 1.3 & 2.00 & 15.60 & No \\
    deepseek-ai/deepseek-coder-1.3b-instruct & DeepSeek-Coder & 1.3 & 2.00 & 15.60 & No \\
    deepseek-ai/deepseek-coder-33b-base & DeepSeek-Coder & 33.3 & 2.00 & 396.00 & No \\
    deepseek-ai/deepseek-coder-33b-instruct & DeepSeek-Coder & 33.3 & 2.00 & 399.60 & No \\
    deepseek-ai/deepseek-coder-6.7b-base & DeepSeek-Coder & 6.7 & 2.00 & 80.40 & No \\
    deepseek-ai/deepseek-coder-6.7b-instruct & DeepSeek-Coder & 6.7 & 2.00 & 80.40 & No \\
    deepseek-ai/deepseek-coder-7b-base-v1.5 & DeepSeek-Coder & 6.9 & 2.00 & 82.80 & No \\
    deepseek-ai/deepseek-coder-7b-instruct-v1.5 & DeepSeek-Coder & 6.9 & 2.00 & 82.80 & No \\
    deepseek-ai/DeepSeek-R1 & DeepSeek-R1 & 684.5 & 14.80 & 60783.60 & No \\
    deepseek-ai/DeepSeek-R1-Distill-Llama-70B & DeepSeek-R1 & 70.6 & 15.00 & 6354.00 & Yes \\
    deepseek-ai/DeepSeek-R1-Distill-Llama-8B & DeepSeek-R1 & 8 & 15.00 & 720.00 & Yes \\
    deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B & DeepSeek-R1 & 1.8 & 18.00 & 194.40 & Yes \\
    deepseek-ai/DeepSeek-R1-Distill-Qwen-14B & DeepSeek-R1 & 14.8 & 18.00 & 1598.40 & Yes \\
    deepseek-ai/DeepSeek-R1-Distill-Qwen-32B & DeepSeek-R1 & 32.8 & 18.00 & 3542.40 & Yes \\
    deepseek-ai/DeepSeek-R1-Distill-Qwen-7B & DeepSeek-R1 & 7.6 & 18.00 & 820.80 & Yes \\
    LGAI-EXAONE/EXAONE-3.5-32B-Instruct & Exaone & 32 & 6.50 & 1248.00 & Yes \\
    LGAI-EXAONE/EXAONE-Deep-32B & Exaone & 32 & 6.50 & 1248.00 & No \\
    openai/gpt-oss-120b & GPT-OSS & 120.4 & — & — & No \\
    openai/gpt-oss-20b & GPT-OSS & 21.5 & — & — & No \\
    google/gemma-1.1-2b-it & Gemma & 2.5 & 3.00 & 45.00 & Yes \\
    google/gemma-1.1-7b-it & Gemma & 8.5 & 6.00 & 306.00 & Yes \\
    google/gemma-7b & Gemma & 8.5 & 6.00 & 252.00 & Yes \\
    google/gemma-7b-it & Gemma & 8.5 & 2.00 & 102.00 & Yes \\
    google/gemma-2-27b & Gemma-2 & 27.2 & 13.00 & 2121.60 & Yes \\
    google/gemma-2-27b-it & Gemma-2 & 27.2 & 13.00 & 2121.60 & Yes \\
    google/gemma-2-2b & Gemma-2 & 2.6 & 2.00 & 31.20 & Yes \\
    google/gemma-2-2b-it & Gemma-2 & 2.6 & 2.00 & 31.20 & Yes \\
    google/gemma-2-9b & Gemma-2 & 9.2 & 8.00 & 441.60 & Yes \\
    google/gemma-2-9b-it & Gemma-2 & 9.2 & 8.00 & 441.60 & Yes \\
    google/gemma-2b & Gemma-2 & 2.5 & 6.00 & 72.00 & Yes \\
    google/gemma-2b-it & Gemma-2 & 2.5 & 6.00 & 90.00 & Yes \\
    google/gemma-3-12b-it & Gemma-3 & 12.2 & 12.00 & 878.40 & No \\
    google/gemma-3-12b-pt & Gemma-3 & 12.2 & 12.00 & 878.40 & No \\
    google/gemma-3-27b-it & Gemma-3 & 27.4 & 14.00 & 2301.60 & No \\
    google/gemma-3-4b-it & Gemma-3 & 4.3 & 4.00 & 103.20 & No \\
    google/gemma-3-4b-pt & Gemma-3 & 4.3 & 4.00 & 103.20 & No \\
    ibm-granite/granite-3.1-2b-base & Granite & 2.5 & 12.00 & 180.00 & Yes \\
    ibm-granite/granite-3.1-2b-instruct & Granite & 2.5 & 12.00 & 180.00 & Yes \\
    ibm-granite/granite-3.1-8b-base & Granite & 8.2 & 12.00 & 590.40 & Yes \\
    ibm-granite/granite-3.1-8b-instruct & Granite & 8.2 & 12.00 & 590.40 & Yes \\
    ibm-granite/granite-3.2-2b-instruct & Granite & 2.5 & 12.00 & 180.00 & Yes \\
    ibm-granite/granite-3.2-8b-instruct & Granite & 8.2 & 12.00 & 590.40 & Yes \\
    ibm-granite/granite-3.3-2b-base & Granite & 2.5 & 12.00 & 180.00 & No \\
    ibm-granite/granite-3.3-2b-instruct & Granite & 2.5 & 12.00 & 180.00 & No \\
    ibm-granite/granite-3.3-8b-base & Granite & 8.2 & 12.00 & 590.40 & No \\
    ibm-granite/granite-3.3-8b-instruct & Granite & 8.2 & 12.00 & 590.40 & No \\
    moonshotai/Kimi-K2-Instruct & Kimi & 1000 & 15.50 & 93000.00 & No \\
    meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8 & Llama & 401.6 & 22.00 & 53011.20 & No \\
    meta-llama/Llama-4-Scout-17B-16E-Instruct & Llama & 108.6 & 40.00 & 26064.00 & No \\
    meta-llama/llama3\_8B\_o4-mini-2025-04-16 & Llama & — & — & — & No \\
    meta-llama/Llama-2-13b-hf & Llama-2 & 13 & 2.00 & 156.00 & Yes \\
    meta-llama/Llama-2-70b-hf & Llama-2 & 69 & 2.00 & 840.00 & Yes \\
    meta-llama/Llama-2-7b-hf & Llama-2 & 6.7 & 2.00 & 84.00 & Yes \\
    meta-llama/Llama-3.1-70B & Llama-3 & 70.6 & 15.00 & 6354.00 & Yes \\
    meta-llama/Llama-3.2-1B & Llama-3 & 1.2 & 9.00 & 64.80 & Yes \\
    meta-llama/Llama-3.2-3B & Llama-3 & 3.2 & 9.00 & 172.80 & Yes \\
    meta-llama/Llama-3.3-70B-Instruct & Llama-3 & 70.6 & 15.00 & 6354.00 & Yes \\
    meta-llama/Meta-Llama-3-70B & Llama-3 & 70.6 & 15.00 & 6300.00 & Yes \\
    meta-llama/Meta-Llama-3-70B-Instruct & Llama-3 & 70.6 & 15.00 & 6354.00 & Yes \\
    meta-llama/Meta-Llama-3-8B & Llama-3 & 8 & 15.00 & 720.00 & Yes \\
    meta-llama/Meta-Llama-3-8B-Instruct & Llama-3 & 8 & 15.00 & 720.00 & Yes \\
    mistralai/Mistral-7B-Instruct-v0.2 & Mistral & 7.2 & — & — & Yes \\
    mistralai/Mixtral-8x7B-Instruct-v0.1 & Mistral & 46.7 & — & — & Yes \\
    Qwen/Qwen-14B & Qwen & 14.2 & 3.00 & 252.00 & No \\
    Qwen/Qwen-72B & Qwen & 72.3 & 3.00 & 1296.00 & No \\
    Qwen/Qwen-7B & Qwen & 7.7 & 2.40 & 100.80 & No \\
    Qwen/Qwen1.5-1.8B & Qwen1.5 & 1.8 & 2.40 & 25.92 & Yes \\
    Qwen/Qwen1.5-110B & Qwen1.5 & 111.2 & 7.00 & 4670.40 & Yes \\
    Qwen/Qwen1.5-14B & Qwen1.5 & 14.2 & 4.00 & 336.00 & Yes \\
    Qwen/Qwen1.5-32B & Qwen1.5 & 32.5 & 4.00 & 768.00 & Yes \\
    Qwen/Qwen1.5-4B & Qwen1.5 & 4 & 2.40 & 57.60 & Yes \\
    Qwen/Qwen1.5-72B & Qwen1.5 & 72.3 & 3.00 & 1296.00 & No \\
    Qwen/Qwen1.5-7B & Qwen1.5 & 7.7 & 4.00 & 168.00 & Yes \\
    Qwen/Qwen2.5-0.5B & Qwen2.5 & 0.5 & 18.00 & 54.00 & Yes \\
    Qwen/Qwen2.5-1.5B & Qwen2.5 & 1.5 & 18.00 & 162.00 & Yes \\
    Qwen/Qwen2.5-14B & Qwen2.5 & 14.8 & 18.00 & 1598.40 & Yes \\
    Qwen/Qwen2.5-32B & Qwen2.5 & 32.8 & 18.00 & 3542.40 & Yes \\
    Qwen/Qwen2.5-3B & Qwen2.5 & 3.1 & 18.00 & 334.80 & Yes \\
    Qwen/Qwen2.5-72B & Qwen2.5 & 72.7 & 18.00 & 7851.60 & Yes \\
    Qwen/Qwen2.5-7B & Qwen2.5 & 7.6 & 18.00 & 820.80 & Yes \\
    Qwen/Qwen3-0.6B & Qwen3 & 0.8 & 36.00 & 172.80 & No \\
    Qwen/Qwen3-1.7B & Qwen3 & 2 & 36.00 & 432.00 & No \\
    Qwen/Qwen3-14B & Qwen3 & 14.8 & 36.00 & 3196.80 & No \\
    Qwen/Qwen3-235B-A22B-Thinking-2507 & Qwen3 & 235.1 & 36.00 & 50781.60 & No \\
    Qwen/Qwen3-32B & Qwen3 & 32.8 & 36.00 & 7084.80 & No \\
    Qwen/Qwen3-4B & Qwen3 & 4 & 36.00 & 864.00 & No \\
    Qwen/Qwen3-8B & Qwen3 & 8.2 & 36.00 & 1771.20 & No \\
    01-ai/Yi-1.5-34B & Yi & 34.4 & 3.60 & 743.04 & Yes \\
    01-ai/Yi-1.5-34B-Chat & Yi & 34.4 & 3.60 & 743.04 & Yes \\
    01-ai/Yi-1.5-6B & Yi & 6.1 & 3.60 & 131.76 & Yes \\
    01-ai/Yi-1.5-6B-Chat & Yi & 6.1 & 3.60 & 131.76 & Yes \\
    01-ai/Yi-1.5-9B & Yi & 8.8 & 3.60 & 190.08 & Yes \\
    01-ai/Yi-34B & Yi & 34.4 & 3.10 & 639.84 & Yes \\
    01-ai/Yi-6B & Yi & 6.1 & 3.10 & 113.46 & Yes \\
    01-ai/Yi-Coder-1.5B & Yi & 1.5 & 2.40 & 21.60 & No \\
    01-ai/Yi-Coder-1.5B-Chat & Yi & 1.5 & 2.40 & 21.60 & No \\
    01-ai/Yi-Coder-9B & Yi & 8.8 & 2.40 & 126.72 & No \\
    01-ai/Yi-Coder-9B-Chat & Yi & 8.8 & 2.40 & 126.72 & Yes \\
    tiiuae/Falcon3-10B-Base & falcon & 10.3 & 14.00 & 865.20 & Yes \\
    tiiuae/Falcon3-7B-Base & falcon & 7.5 & 14.00 & 630.00 & Yes \\
    tiiuae/falcon-11B & falcon & 11.1 & 5.00 & 333.00 & Yes \\
    tiiuae/falcon-40b & falcon & 41.8 & 1.00 & 240.00 & Yes \\
    tiiuae/falcon-7b & falcon & 7.2 & 1.50 & 63.00 & Yes \\
    gpt-4.1-2025-04-14 & gpt-4.1-2025-04-14 & — & — & — & No \\
    gpt-4.1-mini-2025-04-14 & gpt-4.1-mini-2025-04-14 & — & — & — & No \\
    gpt-4.1-nano-2025-04-14 & gpt-4.1-nano-2025-04-14 & — & — & — & No \\
    o4-mini-2025-04-16 & o4-mini-2025-04-16 & — & — & — & No \\
    microsoft/Phi-3-medium-128k-instruct & phi & 14 & 4.80 & 403.20 & Yes \\
    microsoft/Phi-3-medium-4k-instruct & phi & 14 & 4.80 & 403.20 & Yes \\
    microsoft/Phi-3-mini-128k-instruct & phi & 3.8 & 4.90 & 111.72 & Yes \\
    microsoft/Phi-3-mini-4k-instruct & phi & 3.8 & 4.90 & 111.72 & Yes \\
    microsoft/phi-1\_5 & phi & 1.4 & 0.15 & 1.17 & Yes \\
    microsoft/phi-4 & phi & 14.7 & 9.80 & 864.36 & Yes \\
    bigcode/starcoderbase & starcoder & 15.5 & 1.00 & 93.00 & No \\
    bigcode/starcoderbase-1b & starcoder & 15.5 & 1.00 & 6.00 & No \\
    bigcode/starcoderbase-3b & starcoder & 15.5 & 1.00 & 18.00 & No \\
    bigcode/starcoderbase-7b & starcoder & 15.5 & 1.00 & 42.00 & No \\
    bigcode/starcoder2-15b & starcoder2 & 16 & 4.30 & 387.00 & Yes \\
    bigcode/starcoder2-3b & starcoder2 & 3 & 3.30 & 59.40 & Yes \\
    bigcode/starcoder2-7b & starcoder2 & 7.2 & 3.70 & 155.40 & Yes \\
    \bottomrule
  \end{tabular}
  \caption{Models sorted by family then name, with size, pretraining tokens, training FLOPs, and whether an OpenLLM average metric exists (non-NA).}
  \label{tab:model_scaling_summary}
\end{table}