model_name,thinking_mode,model_family,instruction_tuned,source,AGIEval,AI2D,ARC-C,ARC-E,BBEH,BBH,BLINK,Bird-SQL,BoolQ,COCO-caption,ChartQA,CountBenchVQA,DROP,DocVQA,ECLeKTic,FACTS-Grounding,GMMLU-Lite,GPQA-Diamond,GSM8K,Global-MMLU-Lite,HellaSwag,HiddenMath,HumanEval,IFEval_strict_prompt,InfoVQA,LiveCodeBench,MATH,MBPP,MMLU,MMLU-Pro,MMMU,MMMU-val,N2C,NQ,OK-VQA,PIQA,ReMI,RealWorldQA,SIQA,SimpleQA,SpatialSenseVQA,TQA,TallyQA,TextVQA,VQAv2,WMT24++,WinoGrande
Google/Gemma-3-1B,Non-thinking,Gemma,Yes,Gemma3 Report Table 6 (Instruction fine-tuned),,,,,,,,6.4,,,,,,,,36.4,,19.2,,34.2,,15.8,,,,1.9,48.0,,,14.7,,,,,,,,,,2.2,,,,,,,
Google/Gemma-3-4B,Non-thinking,Gemma,Yes,Gemma3 Report Table 6 (Instruction fine-tuned),,,,,,,,36.3,,,,,,,,70.1,,30.8,,54.5,,43.0,,,,12.6,75.6,,,43.6,,48.8,,,,,,,,4.0,,,,,,,
Google/Gemma-3-12B,Non-thinking,Gemma,Yes,Gemma3 Report Table 6 (Instruction fine-tuned),,,,,,,,47.9,,,,,,,,75.8,,40.9,,69.5,,54.5,,,,24.6,83.8,,,60.6,,59.6,,,,,,,,6.3,,,,,,,
Google/Gemma-3-27B,Non-thinking,Gemma,Yes,Gemma3 Report Table 6 (Instruction fine-tuned),,,,,,,,54.4,,,,,,,,74.9,,42.4,,75.1,,60.3,,,,29.7,89.0,,,67.5,,64.9,,,,,,,,10.0,,,,,,,
Google/Gemma-3-1B,Non-thinking,Gemma,No,"Gemma3 Report Table 9 (Factuality, reasoning)",,,38.4,73.0,,28.4,,,63.2,,,,42.4,,,,,,,,62.3,,,,,,,,,,,,,9.48,,73.8,,,48.9,,,39.8,,,,,58.2
Google/Gemma-3-4B,Non-thinking,Gemma,No,"Gemma3 Report Table 9 (Factuality, reasoning)",,,56.2,82.4,,50.9,,,72.3,,,,60.1,,,,,,,,77.2,,,,,,,,,,,,,20.0,,79.6,,,51.9,,,65.8,,,,,64.7
Google/Gemma-3-12B,Non-thinking,Gemma,No,"Gemma3 Report Table 9 (Factuality, reasoning)",,,68.9,88.3,,72.6,,,78.8,,,,72.2,,,,,,,,84.2,,,,,,,,,,,,,31.4,,81.8,,,53.4,,,78.2,,,,,74.3
Google/Gemma-3-27B,Non-thinking,Gemma,No,"Gemma3 Report Table 9 (Factuality, reasoning)",,,70.6,89.0,,77.7,,,82.4,,,,77.2,,,,,,,,85.6,,,,,,,,,,,,,36.1,,83.3,,,54.9,,,85.5,,,,,78.8
Google/Gemma-3-4B,Non-thinking,Gemma,No,Gemma3 Report Table 10 (STEM + code),42.1,,,,,,,,,,,,,,,,,15.0,38.4,,,,36.0,,,,24.2,46.0,59.6,29.2,,,,,,,,,,,,,,,,,
Google/Gemma-3-12B,Non-thinking,Gemma,No,Gemma3 Report Table 10 (STEM + code),57.4,,,,,,,,,,,,,,,,,25.4,71.0,,,,45.7,,,,43.3,60.4,74.5,45.3,,,,,,,,,,,,,,,,,
Google/Gemma-3-27B,Non-thinking,Gemma,No,Gemma3 Report Table 10 (STEM + code),66.2,,,,,,,,,,,,,,,,,24.3,82.6,,,,48.8,,,,50.0,65.6,78.6,52.2,,,,,,,,,,,,,,,,,
Google/Gemma-3-4B,Non-thinking,Gemma,No,Gemma3 Report Table 11 (Multimodal),,63.2,,,,,38.0,,,102.0,63.6,26.1,,72.8,,,,,,,,,,,44.1,,,,,,39.2,,,,51.0,,27.3,45.5,,,50.9,,42.5,58.9,63.9,,
Google/Gemma-3-12B,Non-thinking,Gemma,No,Gemma3 Report Table 11 (Multimodal),,75.2,,,,,35.9,,,111.0,74.7,17.8,,82.3,,,,,,,,,,,54.8,,,,,,50.3,,,,58.7,,38.5,52.2,,,60.0,,51.8,66.5,71.2,,
Google/Gemma-3-27B,Non-thinking,Gemma,No,Gemma3 Report Table 11 (Multimodal),,79.0,,,,,39.6,,,116.0,76.3,68.0,,85.6,,,,,,,,,,,59.4,,,,,,56.1,,,,60.2,,44.8,53.9,,,59.4,,54.3,68.6,72.9,,
Google/Gemma-3-1B,Non-thinking,Gemma,Yes,Gemma3 Report Table 18 (Instruction fine-tuned extended),,,,,7.2,39.1,,,,,,,,,1.4,,34.2,,62.8,,,15.0,41.5,80.2,,5.0,48.0,35.2,38.8,,,,56.0,,,,,,,,,,,,,35.9,
Google/Gemma-3-4B,Non-thinking,Gemma,Yes,Gemma3 Report Table 18 (Instruction fine-tuned extended),,,,,11.0,72.2,,,,,,,,,4.6,,54.5,,89.2,,,42.0,71.3,90.2,,23.0,75.6,63.2,58.1,,,,70.3,,,,,,,,,,,,,46.8,
Google/Gemma-3-12B,Non-thinking,Gemma,Yes,Gemma3 Report Table 18 (Instruction fine-tuned extended),,,,,16.3,85.7,,,,,,,,,10.3,,69.5,,94.4,,,51.0,85.4,88.9,,32.0,83.8,73.0,71.9,,,,80.7,,,,,,,,,,,,,51.6,
Google/Gemma-3-27B,Non-thinking,Gemma,Yes,Gemma3 Report Table 18 (Instruction fine-tuned extended),,,,,19.3,87.6,,,,,,,,,16.7,,75.1,,95.9,,,56.0,87.8,90.4,,39.0,89.0,74.4,76.9,,,,84.5,,,,,,,,,,,,,53.4,
