name, params   , params_without_lm_head
6xs2,   3416064,              196608
6xs ,   4254720,              230400
5xs ,   5160960,              331776
5xs2,   6085632,              451584
5xs1,   7028736,              589824
4xs ,   7225344,              786432
4xs2,   8239104,              995328
4xs1,  11427840,             1769472
3xs ,  11870208,             2211840
3xs2,  14278656,             3010560
3xs1,  16809984,             3932160
xxs ,  17596416,             4718592
xxs3,  20459520,             5971968
xxs2,  26628096,             8921088
xxs4,  33386496,            12460032
xxs1,  36986880,            14450688
xs  ,  39395328,            16859136
xs3 ,  41803776,            19267584
xs2 ,  50921472,            25165824
xs1 ,  54067200,            28311552
s   ,  57212928,            31457280
s3  ,  94887936,            59473920
s2  , 109412352,            70778880
s1  , 116490240,            77856768
base, 123568128,            84934656
m5  , 160677888,           115605504
m4  , 202506240,           150994944
m3  , 215089152,           163577856
m2  , 227672064,           176160768
m1  , 240254976,           188743680
m   , 252837888,           201326592
