{"model.embed_tokens.weight": {"1": 0.1872449517250061, "4": 0.049085766077041626, "16": 0.012410925701260567, "64": 0.0034904039930552244, "256": 0.0010781697928905487, "1024": 0.00022433836420532316}, "model.layers.0.self_attn.q_proj.weight": {"1": 1.3060595989227295, "4": 0.19219553470611572, "16": 0.04924020543694496, "64": 0.01352609507739544, "256": 0.0037227727007120848, "1024": 0.0010042368667200208}, "model.layers.0.self_attn.k_proj.weight": {"1": 1.0959824323654175, "4": 0.1654554009437561, "16": 0.062375202775001526, "64": 0.018143590539693832, "256": 0.00734570762142539, "1024": 0.0008075623773038387}, "model.layers.0.self_attn.v_proj.weight": {"1": 0.8513705730438232, "4": 0.2546165883541107, "16": 0.05559617653489113, "64": 0.014795097522437572, "256": 0.005049324594438076, "1024": 0.001017183531075716}, "model.layers.0.self_attn.o_proj.weight": {"1": 0.5920318961143494, "4": 0.16358418762683868, "16": 0.04062434285879135, "64": 0.010934748686850071, "256": 0.0032264627516269684, "1024": 0.000882311025634408}, "model.layers.0.mlp.gate_proj.weight": {"1": 0.5003015398979187, "4": 0.13072475790977478, "16": 0.03308006003499031, "64": 0.009808240458369255, "256": 0.0027292354498058558, "1024": 0.0006323813577182591}, "model.layers.0.mlp.up_proj.weight": {"1": 0.6119828820228577, "4": 0.1697164624929428, "16": 0.040871135890483856, "64": 0.01218860037624836, "256": 0.0033318966161459684, "1024": 0.0008061904227361083}, "model.layers.0.mlp.down_proj.weight": {"1": 0.5908914804458618, "4": 0.14011292159557343, "16": 0.043735213577747345, "64": 0.011009978130459785, "256": 0.0035361910704523325, "1024": 0.0013727066107094288}, "model.layers.0.input_layernorm.weight": {"1": 0.4738501310348511, "4": 0.14169608056545258, "16": 0.014581792056560516, "64": 0.0074495431035757065, "256": 0.0015356196090579033, "1024": 0.00022686815646011382}, "model.layers.0.post_attention_layernorm.weight": {"1": 0.47849997878074646, "4": 0.12109509855508804, "16": 0.034169480204582214, "64": 0.008233116008341312, "256": 0.002686685649678111, "1024": 0.0006051332456991076}, "model.layers.1.self_attn.q_proj.weight": {"1": 1.2168666124343872, "4": 0.2709379494190216, "16": 0.058410391211509705, "64": 0.019076835364103317, "256": 0.010753662325441837, "1024": 0.000990239204838872}, "model.layers.1.self_attn.k_proj.weight": {"1": 0.9678229689598083, "4": 0.21932175755500793, "16": 0.061507679522037506, "64": 0.04154621437191963, "256": 0.009392709471285343, "1024": 0.0014150830684229732}, "model.layers.1.self_attn.v_proj.weight": {"1": 1.0305049419403076, "4": 0.24838997423648834, "16": 0.07442227005958557, "64": 0.01948435977101326, "256": 0.0050799669697880745, "1024": 0.001304387697018683}, "model.layers.1.self_attn.o_proj.weight": {"1": 0.5714910626411438, "4": 0.15580879151821136, "16": 0.03655983507633209, "64": 0.011686297133564949, "256": 0.003261346835643053, "1024": 0.0007899889023974538}, "model.layers.1.mlp.gate_proj.weight": {"1": 0.6694284081459045, "4": 0.17192642390727997, "16": 0.03896550461649895, "64": 0.012654687277972698, "256": 0.0034997740294784307, "1024": 0.0008197391289286315}, "model.layers.1.mlp.up_proj.weight": {"1": 0.6661015748977661, "4": 0.1749904453754425, "16": 0.04075003042817116, "64": 0.013015583157539368, "256": 0.003469703020527959, "1024": 0.000833883008453995}, "model.layers.1.mlp.down_proj.weight": {"1": 0.3263966143131256, "4": 0.08322221785783768, "16": 0.02154417149722576, "64": 0.005717473104596138, "256": 0.001392371952533722, "1024": 0.00034457436413504183}, "model.layers.1.input_layernorm.weight": {"1": 0.19460071623325348, "4": 0.3991505801677704, "16": 0.007106480188667774, "64": 0.005655960645526648, "256": 0.006141518708318472, "1024": 0.0012440383434295654}, "model.layers.1.post_attention_layernorm.weight": {"1": 0.7878860235214233, "4": 0.15586301684379578, "16": 0.03268919140100479, "64": 0.01218967605382204, "256": 0.003977062646299601, "1024": 0.0007590317400172353}, "model.layers.2.self_attn.q_proj.weight": {"1": 0.4244611859321594, "4": 0.08467923849821091, "16": 0.014219628646969795, "64": 0.00440400093793869, "256": 0.0015135875437408686, "1024": 0.0003035320551134646}, "model.layers.2.self_attn.k_proj.weight": {"1": 0.40694260597229004, "4": 0.08615344762802124, "16": 0.02527979202568531, "64": 0.010853790678083897, "256": 0.0017465968849137425, "1024": 0.0005157631821930408}, "model.layers.2.self_attn.v_proj.weight": {"1": 1.609889030456543, "4": 0.3612678647041321, "16": 0.10825937241315842, "64": 0.02996230125427246, "256": 0.006905697751790285, "1024": 0.001843231380917132}, "model.layers.2.self_attn.o_proj.weight": {"1": 0.5610947012901306, "4": 0.15751326084136963, "16": 0.03821280226111412, "64": 0.012131699360907078, "256": 0.0030988254584372044, "1024": 0.000831343699246645}, "model.layers.2.mlp.gate_proj.weight": {"1": 0.6202041506767273, "4": 0.1528172641992569, "16": 0.03554849326610565, "64": 0.011704945005476475, "256": 0.0029400079511106014, "1024": 0.0007664148579351604}, "model.layers.2.mlp.up_proj.weight": {"1": 0.6646523475646973, "4": 0.1765413135290146, "16": 0.03841168060898781, "64": 0.01381018664687872, "256": 0.003990102093666792, "1024": 0.0009085725178010762}, "model.layers.2.mlp.down_proj.weight": {"1": 0.4663757383823395, "4": 0.13408838212490082, "16": 0.030456500127911568, "64": 0.010174193419516087, "256": 0.0026657707057893276, "1024": 0.0008417621138505638}, "model.layers.2.input_layernorm.weight": {"1": 0.866866946220398, "4": 0.06819209456443787, "16": 0.030828488990664482, "64": 0.016848403960466385, "256": 0.004676977172493935, "1024": 0.0014809033600613475}, "model.layers.2.post_attention_layernorm.weight": {"1": 0.7155081629753113, "4": 0.1661609560251236, "16": 0.04050455614924431, "64": 0.013475185260176659, "256": 0.0034400210715830326, "1024": 0.0008707455708645284}, "model.layers.3.self_attn.q_proj.weight": {"1": 0.6401786208152771, "4": 0.1377042680978775, "16": 0.02861805073916912, "64": 0.01761784590780735, "256": 0.003556528128683567, "1024": 0.001393196522258222}, "model.layers.3.self_attn.k_proj.weight": {"1": 0.7044132351875305, "4": 0.10607139766216278, "16": 0.026981381699442863, "64": 0.014675316400825977, "256": 0.0038627057801932096, "1024": 0.0014501003315672278}, "model.layers.3.self_attn.v_proj.weight": {"1": 0.9553114175796509, "4": 0.29857051372528076, "16": 0.07737858593463898, "64": 0.021596349775791168, "256": 0.005041223950684071, "1024": 0.0014605384785681963}, "model.layers.3.self_attn.o_proj.weight": {"1": 0.4238573908805847, "4": 0.1398557722568512, "16": 0.030419116839766502, "64": 0.0106623824685812, "256": 0.002417018637061119, "1024": 0.0007211036863736808}, "model.layers.3.mlp.gate_proj.weight": {"1": 0.5497511625289917, "4": 0.1695123016834259, "16": 0.03483586758375168, "64": 0.013030493631958961, "256": 0.003096511587500572, "1024": 0.0009450488723814487}, "model.layers.3.mlp.up_proj.weight": {"1": 0.5284126996994019, "4": 0.15482278168201447, "16": 0.03677472844719887, "64": 0.012865104712545872, "256": 0.0025920651387423277, "1024": 0.0007668387261219323}, "model.layers.3.mlp.down_proj.weight": {"1": 0.4182348847389221, "4": 0.12633340060710907, "16": 0.027396185323596, "64": 0.008671143092215061, "256": 0.0021822478156536818, "1024": 0.000639149162452668}, "model.layers.3.input_layernorm.weight": {"1": 2.2457211017608643, "4": 1.1068700551986694, "16": 0.012575426138937473, "64": 0.04478492587804794, "256": 0.013761029578745365, "1024": 0.016842832788825035}, "model.layers.3.post_attention_layernorm.weight": {"1": 0.5637004375457764, "4": 0.16370519995689392, "16": 0.03888850659132004, "64": 0.012172361835837364, "256": 0.002969269175082445, "1024": 0.0012515606358647346}, "model.layers.4.self_attn.q_proj.weight": {"1": 0.4148421287536621, "4": 0.14753076434135437, "16": 0.034799642860889435, "64": 0.019023386761546135, "256": 0.0033456177916377783, "1024": 0.0007448042742908001}, "model.layers.4.self_attn.k_proj.weight": {"1": 0.4788739085197449, "4": 0.20432917773723602, "16": 0.055640727281570435, "64": 0.01754802279174328, "256": 0.002156671369448304, "1024": 0.0007925624959170818}, "model.layers.4.self_attn.v_proj.weight": {"1": 0.8480332493782043, "4": 0.22024483978748322, "16": 0.05287407338619232, "64": 0.014507673680782318, "256": 0.003384025301784277, "1024": 0.0009257029159925878}, "model.layers.4.self_attn.o_proj.weight": {"1": 0.3714883327484131, "4": 0.12007464468479156, "16": 0.026084432378411293, "64": 0.007610519416630268, "256": 0.001986015820875764, "1024": 0.0005153439706191421}, "model.layers.4.mlp.gate_proj.weight": {"1": 0.5212664008140564, "4": 0.16459216177463531, "16": 0.030147289857268333, "64": 0.00949886254966259, "256": 0.002349565736949444, "1024": 0.000544208160135895}, "model.layers.4.mlp.up_proj.weight": {"1": 0.47854921221733093, "4": 0.1443224847316742, "16": 0.02918342687189579, "64": 0.008920338936150074, "256": 0.0022759123239666224, "1024": 0.0005786492838524282}, "model.layers.4.mlp.down_proj.weight": {"1": 0.3781452178955078, "4": 0.11725841462612152, "16": 0.024628259241580963, "64": 0.007079390808939934, "256": 0.00192646577488631, "1024": 0.0005041769472882152}, "model.layers.4.input_layernorm.weight": {"1": 0.0677705705165863, "4": 0.5888911485671997, "16": 0.003537491662427783, "64": 0.04299971088767052, "256": 0.001135612721554935, "1024": 0.00021123660553712398}, "model.layers.4.post_attention_layernorm.weight": {"1": 0.3761127293109894, "4": 0.1672838032245636, "16": 0.02262909896671772, "64": 0.00869202520698309, "256": 0.001920394948683679, "1024": 0.00046240835217759013}, "model.layers.5.self_attn.q_proj.weight": {"1": 0.5345194935798645, "4": 0.14677999913692474, "16": 0.03443271294236183, "64": 0.003994664642959833, "256": 0.001603713259100914, "1024": 0.00047698296839371324}, "model.layers.5.self_attn.k_proj.weight": {"1": 0.3173857629299164, "4": 0.21411767601966858, "16": 0.024723149836063385, "64": 0.00523968692868948, "256": 0.0010724797612056136, "1024": 0.0004587113799061626}, "model.layers.5.self_attn.v_proj.weight": {"1": 0.8365506529808044, "4": 0.22977663576602936, "16": 0.05654868111014366, "64": 0.014772862195968628, "256": 0.003951997496187687, "1024": 0.001084434799849987}, "model.layers.5.self_attn.o_proj.weight": {"1": 0.33377760648727417, "4": 0.10609377920627594, "16": 0.021689999848604202, "64": 0.006399915087968111, "256": 0.0017054626950994134, "1024": 0.00045910532935522497}, "model.layers.5.mlp.gate_proj.weight": {"1": 0.28938254714012146, "4": 0.11853143572807312, "16": 0.01758355088531971, "64": 0.0046549211256206036, "256": 0.0017009610310196877, "1024": 0.00034371973015367985}, "model.layers.5.mlp.up_proj.weight": {"1": 0.39452770352363586, "4": 0.13208268582820892, "16": 0.026365987956523895, "64": 0.006965764798223972, "256": 0.0018967532087117434, "1024": 0.0004477992479223758}, "model.layers.5.mlp.down_proj.weight": {"1": 0.3268343210220337, "4": 0.10189282894134521, "16": 0.022241678088903427, "64": 0.005864099133759737, "256": 0.0016881551127880812, "1024": 0.00045519694685935974}, "model.layers.5.input_layernorm.weight": {"1": 0.021885456517338753, "4": 0.19328920543193817, "16": 0.0013847730588167906, "64": 0.0005373531021177769, "256": 9.298442455474287e-05, "1024": 0.00010451040725456551}, "model.layers.5.post_attention_layernorm.weight": {"1": 0.4824332892894745, "4": 0.11359746754169464, "16": 0.020535564050078392, "64": 0.006890307646244764, "256": 0.0017588033806532621, "1024": 0.0004107890126761049}, "model.layers.6.self_attn.q_proj.weight": {"1": 0.744517982006073, "4": 0.15264682471752167, "16": 0.03242383152246475, "64": 0.008283613249659538, "256": 0.0029708819929510355, "1024": 0.00044735168921761215}, "model.layers.6.self_attn.k_proj.weight": {"1": 0.6540988087654114, "4": 0.11009804159402847, "16": 0.02071375399827957, "64": 0.007355881854891777, "256": 0.0016642531845718622, "1024": 0.0003495026030577719}, "model.layers.6.self_attn.v_proj.weight": {"1": 0.6456158757209778, "4": 0.17726287245750427, "16": 0.03990720957517624, "64": 0.010606219060719013, "256": 0.0027437361422926188, "1024": 0.0006907291826792061}, "model.layers.6.self_attn.o_proj.weight": {"1": 0.2938341498374939, "4": 0.09231749922037125, "16": 0.02123769372701645, "64": 0.005502426531165838, "256": 0.0014520578552037477, "1024": 0.0004205932200420648}, "model.layers.6.mlp.gate_proj.weight": {"1": 0.3513147830963135, "4": 0.12961885333061218, "16": 0.02800876460969448, "64": 0.006585357710719109, "256": 0.0018041393486782908, "1024": 0.00043754311627708375}, "model.layers.6.mlp.up_proj.weight": {"1": 0.3854585587978363, "4": 0.12833808362483978, "16": 0.028183981776237488, "64": 0.006883422844111919, "256": 0.0017629018984735012, "1024": 0.0004295702965464443}, "model.layers.6.mlp.down_proj.weight": {"1": 0.33309659361839294, "4": 0.09837573021650314, "16": 0.024342497810721397, "64": 0.00589849753305316, "256": 0.0016581305535510182, "1024": 0.0004326024209149182}, "model.layers.6.input_layernorm.weight": {"1": 0.6758300065994263, "4": 0.09491206705570221, "16": 0.020635321736335754, "64": 0.02047666534781456, "256": 0.003675037296488881, "1024": 0.0017697170842438936}, "model.layers.6.post_attention_layernorm.weight": {"1": 0.33993303775787354, "4": 0.16163258254528046, "16": 0.030007805675268173, "64": 0.004949161782860756, "256": 0.0014113755896687508, "1024": 0.0005721592460758984}, "model.layers.7.self_attn.q_proj.weight": {"1": 0.3260212540626526, "4": 0.12501074373722076, "16": 0.028857892379164696, "64": 0.012048237025737762, "256": 0.002577864332124591, "1024": 0.0006305079441517591}, "model.layers.7.self_attn.k_proj.weight": {"1": 0.49233266711235046, "4": 0.16972845792770386, "16": 0.04886690527200699, "64": 0.013225012458860874, "256": 0.0025924991350620985, "1024": 0.0004424657381605357}, "model.layers.7.self_attn.v_proj.weight": {"1": 0.5622943043708801, "4": 0.16729064285755157, "16": 0.04261491820216179, "64": 0.008934615179896355, "256": 0.002609182382002473, "1024": 0.0005580971483141184}, "model.layers.7.self_attn.o_proj.weight": {"1": 0.27279654145240784, "4": 0.0812150314450264, "16": 0.020258363336324692, "64": 0.004812887869775295, "256": 0.001453760894946754, "1024": 0.0003957805165555328}, "model.layers.7.mlp.gate_proj.weight": {"1": 0.38962051272392273, "4": 0.10898399353027344, "16": 0.034172531217336655, "64": 0.009912396781146526, "256": 0.0027040622662752867, "1024": 0.0004233859071973711}, "model.layers.7.mlp.up_proj.weight": {"1": 0.3596349060535431, "4": 0.10351096838712692, "16": 0.027947572991251945, "64": 0.007146873977035284, "256": 0.001831834320910275, "1024": 0.00038446299731731415}, "model.layers.7.mlp.down_proj.weight": {"1": 0.3073596954345703, "4": 0.08490654826164246, "16": 0.022149227559566498, "64": 0.005822197534143925, "256": 0.0015026993351057172, "1024": 0.0003863975580316037}, "model.layers.7.input_layernorm.weight": {"1": 0.027606645599007607, "4": 0.026326127350330353, "16": 0.013065768405795097, "64": 0.00446332385763526, "256": 0.00016650866018608212, "1024": 4.4738888391293585e-05}, "model.layers.7.post_attention_layernorm.weight": {"1": 0.6462825536727905, "4": 0.09340481460094452, "16": 0.042564671486616135, "64": 0.012928461655974388, "256": 0.0027008356992155313, "1024": 0.0003391522914171219}, "model.layers.8.self_attn.q_proj.weight": {"1": 0.1879602074623108, "4": 0.05949018523097038, "16": 0.022372962906956673, "64": 0.005063088145107031, "256": 0.0019807936623692513, "1024": 0.00027023942675441504}, "model.layers.8.self_attn.k_proj.weight": {"1": 0.17242620885372162, "4": 0.14001280069351196, "16": 0.03859521821141243, "64": 0.010171754285693169, "256": 0.0018521694000810385, "1024": 0.0005506540765054524}, "model.layers.8.self_attn.v_proj.weight": {"1": 0.46529778838157654, "4": 0.12887752056121826, "16": 0.03259881213307381, "64": 0.008198417723178864, "256": 0.002289755968376994, "1024": 0.0005319461924955249}, "model.layers.8.self_attn.o_proj.weight": {"1": 0.2909315228462219, "4": 0.07481379806995392, "16": 0.02048298344016075, "64": 0.004979618359357119, "256": 0.0013433436397463083, "1024": 0.0003380755370017141}, "model.layers.8.mlp.gate_proj.weight": {"1": 0.36732542514801025, "4": 0.11791378259658813, "16": 0.03274893760681152, "64": 0.006741228513419628, "256": 0.001522111240774393, "1024": 0.00034465669887140393}, "model.layers.8.mlp.up_proj.weight": {"1": 0.3441968560218811, "4": 0.08974543958902359, "16": 0.025019435212016106, "64": 0.005609885789453983, "256": 0.001618524082005024, "1024": 0.0003540816833265126}, "model.layers.8.mlp.down_proj.weight": {"1": 0.29532307386398315, "4": 0.07032281905412674, "16": 0.020533567294478416, "64": 0.004976313095539808, "256": 0.0013586872955784202, "1024": 0.00036919722333550453}, "model.layers.8.input_layernorm.weight": {"1": 1.6007912158966064, "4": 0.218120276927948, "16": 0.03250131756067276, "64": 0.021449988707900047, "256": 0.012115150690078735, "1024": 0.0002244621719000861}, "model.layers.8.post_attention_layernorm.weight": {"1": 0.20323894917964935, "4": 0.044045060873031616, "16": 0.011250670999288559, "64": 0.002632135758176446, "256": 0.0007617253577336669, "1024": 0.0001288335188291967}, "model.layers.9.self_attn.q_proj.weight": {"1": 0.18865253031253815, "4": 0.05593262240290642, "16": 0.03078932873904705, "64": 0.004358484875410795, "256": 0.0017838393105193973, "1024": 0.0003739351232070476}, "model.layers.9.self_attn.k_proj.weight": {"1": 0.2508668601512909, "4": 0.16742409765720367, "16": 0.03238840401172638, "64": 0.006624463014304638, "256": 0.002133245812729001, "1024": 0.0003927682409994304}, "model.layers.9.self_attn.v_proj.weight": {"1": 0.38396093249320984, "4": 0.08840285241603851, "16": 0.02630688063800335, "64": 0.007009223103523254, "256": 0.001641712966375053, "1024": 0.00047179937246255577}, "model.layers.9.self_attn.o_proj.weight": {"1": 0.2782389521598816, "4": 0.06617625802755356, "16": 0.020301789045333862, "64": 0.004754474852234125, "256": 0.0013065729290246964, "1024": 0.00036406496656127274}, "model.layers.9.mlp.gate_proj.weight": {"1": 0.2715241312980652, "4": 0.06829781830310822, "16": 0.017305294051766396, "64": 0.004047010559588671, "256": 0.0012879016576334834, "1024": 0.00034688872983679175}, "model.layers.9.mlp.up_proj.weight": {"1": 0.2514065206050873, "4": 0.05738002806901932, "16": 0.019593164324760437, "64": 0.003905521472916007, "256": 0.0010396699653938413, "1024": 0.00029421006911434233}, "model.layers.9.mlp.down_proj.weight": {"1": 0.21465705335140228, "4": 0.053292110562324524, "16": 0.013880177401006222, "64": 0.003686765441671014, "256": 0.0010538152419030666, "1024": 0.0003658342466223985}, "model.layers.9.input_layernorm.weight": {"1": 0.19568119943141937, "4": 0.084781713783741, "16": 0.020511433482170105, "64": 0.00566010270267725, "256": 0.0006372606148943305, "1024": 0.00015235082537401468}, "model.layers.9.post_attention_layernorm.weight": {"1": 0.41517403721809387, "4": 0.046315211802721024, "16": 0.02214682847261429, "64": 0.004133013542741537, "256": 0.0014345067320391536, "1024": 0.00033291999716311693}, "model.layers.10.self_attn.q_proj.weight": {"1": 0.2788296639919281, "4": 0.0773957371711731, "16": 0.010363949462771416, "64": 0.0030646563973277807, "256": 0.003083780873566866, "1024": 0.0009093895205296576}, "model.layers.10.self_attn.k_proj.weight": {"1": 0.9526179432868958, "4": 0.20706792175769806, "16": 0.04109947010874748, "64": 0.011265179142355919, "256": 0.007841085083782673, "1024": 0.0022610498126596212}, "model.layers.10.self_attn.v_proj.weight": {"1": 0.6439330577850342, "4": 0.16220052540302277, "16": 0.04174812510609627, "64": 0.011153444647789001, "256": 0.0027448295149952173, "1024": 0.0008012137841433287}, "model.layers.10.self_attn.o_proj.weight": {"1": 0.2704717516899109, "4": 0.06289540231227875, "16": 0.017533812671899796, "64": 0.004567396827042103, "256": 0.0011656585847958922, "1024": 0.00037083803908899426}, "model.layers.10.mlp.gate_proj.weight": {"1": 0.26097407937049866, "4": 0.050002772361040115, "16": 0.013259146362543106, "64": 0.0035239134449511766, "256": 0.0009877332486212254, "1024": 0.00031209594453684986}, "model.layers.10.mlp.up_proj.weight": {"1": 0.17965932190418243, "4": 0.051170915365219116, "16": 0.01200967188924551, "64": 0.0030884856823831797, "256": 0.0007927697151899338, "1024": 0.0002335394819965586}, "model.layers.10.mlp.down_proj.weight": {"1": 0.15525971353054047, "4": 0.04412863031029701, "16": 0.011213497258722782, "64": 0.0028254466596990824, "256": 0.0007829443202354014, "1024": 0.00023269394296221435}, "model.layers.10.input_layernorm.weight": {"1": 1.4147294759750366, "4": 0.06426876783370972, "16": 0.06723158806562424, "64": 0.010888725519180298, "256": 0.007732268422842026, "1024": 0.0005045831203460693}, "model.layers.10.post_attention_layernorm.weight": {"1": 0.21214190125465393, "4": 0.0528077594935894, "16": 0.01019451767206192, "64": 0.0030639113392680883, "256": 0.001334568252786994, "1024": 0.00027659395709633827}, "model.layers.11.self_attn.q_proj.weight": {"1": 0.06337587535381317, "4": 0.05216663330793381, "16": 0.00582223292440176, "64": 0.0014331276761367917, "256": 0.0010095088509842753, "1024": 0.00012688299466390163}, "model.layers.11.self_attn.k_proj.weight": {"1": 0.1460721343755722, "4": 0.08399676531553268, "16": 0.015184937976300716, "64": 0.0019883227068930864, "256": 0.0017332581337541342, "1024": 0.00019793346291407943}, "model.layers.11.self_attn.v_proj.weight": {"1": 0.5587217807769775, "4": 0.1532893031835556, "16": 0.0399056151509285, "64": 0.009075991809368134, "256": 0.0024549849331378937, "1024": 0.0007088732672855258}, "model.layers.11.self_attn.o_proj.weight": {"1": 0.18450212478637695, "4": 0.050389714539051056, "16": 0.012594163417816162, "64": 0.0032839030027389526, "256": 0.0008236755966208875, "1024": 0.0002664200437720865}, "model.layers.11.mlp.gate_proj.weight": {"1": 0.16097579896450043, "4": 0.04185688495635986, "16": 0.011161678470671177, "64": 0.002660974860191345, "256": 0.0006629283307120204, "1024": 0.00019164809782523662}, "model.layers.11.mlp.up_proj.weight": {"1": 0.17191174626350403, "4": 0.04561521112918854, "16": 0.01143976952880621, "64": 0.0027803669217973948, "256": 0.0007614955538883805, "1024": 0.000195037413504906}, "model.layers.11.mlp.down_proj.weight": {"1": 0.14068742096424103, "4": 0.036029424518346786, "16": 0.00961409043520689, "64": 0.0025038293097168207, "256": 0.0006530752289108932, "1024": 0.00018757169891614467}, "model.layers.11.input_layernorm.weight": {"1": 0.024668317288160324, "4": 0.0034047579392790794, "16": 0.004071925766766071, "64": 0.0022170355077832937, "256": 7.932291919132695e-05, "1024": 1.6496329408255406e-05}, "model.layers.11.post_attention_layernorm.weight": {"1": 0.15092810988426208, "4": 0.04184328392148018, "16": 0.010539641603827477, "64": 0.002580617554485798, "256": 0.0005277132731862366, "1024": 0.00014393558376468718}, "model.layers.12.self_attn.q_proj.weight": {"1": 0.4021790623664856, "4": 0.0627371147274971, "16": 0.01580428145825863, "64": 0.006645865272730589, "256": 0.003297575516626239, "1024": 0.0002312921133125201}, "model.layers.12.self_attn.k_proj.weight": {"1": 0.3863478899002075, "4": 0.034280311316251755, "16": 0.01808745041489601, "64": 0.006027436815202236, "256": 0.0019148248247802258, "1024": 0.00019927367975469679}, "model.layers.12.self_attn.v_proj.weight": {"1": 0.6375876665115356, "4": 0.15440979599952698, "16": 0.03773845359683037, "64": 0.01031513512134552, "256": 0.002533173654228449, "1024": 0.0007046884275041521}, "model.layers.12.self_attn.o_proj.weight": {"1": 0.188748300075531, "4": 0.043922122567892075, "16": 0.012810759246349335, "64": 0.003286614315584302, "256": 0.0008578463457524776, "1024": 0.0002988885098602623}, "model.layers.12.mlp.gate_proj.weight": {"1": 0.14646750688552856, "4": 0.03423390910029411, "16": 0.009169417433440685, "64": 0.0023566572926938534, "256": 0.0006080997409299016, "1024": 0.00017200833826791495}, "model.layers.12.mlp.up_proj.weight": {"1": 0.13665902614593506, "4": 0.0330548956990242, "16": 0.009251508861780167, "64": 0.0023179345298558474, "256": 0.0005642078467644751, "1024": 0.00015811545017641038}, "model.layers.12.mlp.down_proj.weight": {"1": 0.10975432395935059, "4": 0.029384544119238853, "16": 0.0073015643283724785, "64": 0.0018836208619177341, "256": 0.0005144544411450624, "1024": 0.00019289235933683813}, "model.layers.12.input_layernorm.weight": {"1": 0.2977684438228607, "4": 0.01771450601518154, "16": 0.004196750931441784, "64": 0.0009507364593446255, "256": 0.0024012362118810415, "1024": 0.00013892058632336557}, "model.layers.12.post_attention_layernorm.weight": {"1": 0.13899248838424683, "4": 0.0315777063369751, "16": 0.008585482835769653, "64": 0.002399084623903036, "256": 0.0005362462252378464, "1024": 0.00016128504648804665}, "model.layers.13.self_attn.q_proj.weight": {"1": 0.08680626004934311, "4": 0.03412797302007675, "16": 0.006689957808703184, "64": 0.001340039074420929, "256": 0.0005714558647014201, "1024": 6.622300134040415e-05}, "model.layers.13.self_attn.k_proj.weight": {"1": 0.13117624819278717, "4": 0.021004335954785347, "16": 0.00614705728366971, "64": 0.0014182785525918007, "256": 0.0007570398738607764, "1024": 8.320329652633518e-05}, "model.layers.13.self_attn.v_proj.weight": {"1": 0.6115657687187195, "4": 0.1402696669101715, "16": 0.038131412118673325, "64": 0.009172213263809681, "256": 0.0024590352550148964, "1024": 0.0007499047787860036}, "model.layers.13.self_attn.o_proj.weight": {"1": 0.28232669830322266, "4": 0.07074056565761566, "16": 0.018423503264784813, "64": 0.00466281408444047, "256": 0.001430431380867958, "1024": 0.0006452660309150815}, "model.layers.13.mlp.gate_proj.weight": {"1": 0.10519444197416306, "4": 0.023850005120038986, "16": 0.006025173235684633, "64": 0.0014815147733315825, "256": 0.0004121582896914333, "1024": 0.0001257017720490694}, "model.layers.13.mlp.up_proj.weight": {"1": 0.10538439452648163, "4": 0.02712659351527691, "16": 0.006630315445363522, "64": 0.0017912712646648288, "256": 0.0004351865209173411, "1024": 0.00012099332525394857}, "model.layers.13.mlp.down_proj.weight": {"1": 0.08800069242715836, "4": 0.021007437258958817, "16": 0.005471148993819952, "64": 0.0013568714493885636, "256": 0.00040271427133120596, "1024": 0.00014723659842275083}, "model.layers.13.input_layernorm.weight": {"1": 0.18491198122501373, "4": 0.021390501409769058, "16": 0.026830893009901047, "64": 0.0018858681432902813, "256": 0.0015669127460569143, "1024": 0.0001780284073902294}, "model.layers.13.post_attention_layernorm.weight": {"1": 0.09637398272752762, "4": 0.025483127683401108, "16": 0.005954418797045946, "64": 0.0018213653238490224, "256": 0.0004560486995615065, "1024": 8.157001138897613e-05}, "model.layers.14.self_attn.q_proj.weight": {"1": 0.0881500318646431, "4": 0.017685912549495697, "16": 0.005791556090116501, "64": 0.0020728078670799732, "256": 0.0006918216240592301, "1024": 0.00014263979392126203}, "model.layers.14.self_attn.k_proj.weight": {"1": 0.11108745634555817, "4": 0.019338350743055344, "16": 0.010665415786206722, "64": 0.001480087055824697, "256": 0.0005536475800909102, "1024": 0.00013816962018609047}, "model.layers.14.self_attn.v_proj.weight": {"1": 0.6088870167732239, "4": 0.13691532611846924, "16": 0.036723729223012924, "64": 0.009642858058214188, "256": 0.002109955996274948, "1024": 0.0006423416780307889}, "model.layers.14.self_attn.o_proj.weight": {"1": 0.11042728275060654, "4": 0.028575921431183815, "16": 0.006736906245350838, "64": 0.001829109387472272, "256": 0.00046153401490300894, "1024": 0.0001451637945137918}, "model.layers.14.mlp.gate_proj.weight": {"1": 0.07063962519168854, "4": 0.01698547974228859, "16": 0.004366951994597912, "64": 0.0011305814841762185, "256": 0.0003116439620498568, "1024": 9.345284342998639e-05}, "model.layers.14.mlp.up_proj.weight": {"1": 0.057763177901506424, "4": 0.01663588359951973, "16": 0.0035473578609526157, "64": 0.0009473561076447368, "256": 0.00024859371478669345, "1024": 7.877853204263374e-05}, "model.layers.14.mlp.down_proj.weight": {"1": 0.09393829107284546, "4": 0.02226046472787857, "16": 0.006779473274946213, "64": 0.0017077645752578974, "256": 0.0004776057612616569, "1024": 0.00018699985230341554}, "model.layers.14.input_layernorm.weight": {"1": 0.04752838611602783, "4": 0.006947109010070562, "16": 0.001293282606638968, "64": 0.0001787915243767202, "256": 6.697780190734193e-05, "1024": 3.5424207453615963e-05}, "model.layers.14.post_attention_layernorm.weight": {"1": 0.07143907994031906, "4": 0.015965839847922325, "16": 0.004233693238347769, "64": 0.0013412388507276773, "256": 0.0002447825390845537, "1024": 7.422650378430262e-05}, "model.layers.15.self_attn.q_proj.weight": {"1": 0.0821196436882019, "4": 0.015984851866960526, "16": 0.005007769912481308, "64": 0.001749542891047895, "256": 0.0002871657779905945, "1024": 9.75803704932332e-05}, "model.layers.15.self_attn.k_proj.weight": {"1": 0.07397767156362534, "4": 0.02220071852207184, "16": 0.005878673866391182, "64": 0.0017887384165078402, "256": 0.0002976347168441862, "1024": 0.00013786868657916784}, "model.layers.15.self_attn.v_proj.weight": {"1": 0.246751070022583, "4": 0.06285376101732254, "16": 0.015204056166112423, "64": 0.004211129620671272, "256": 0.0010113805765286088, "1024": 0.0002992439840454608}, "model.layers.15.self_attn.o_proj.weight": {"1": 0.0712454691529274, "4": 0.017326179891824722, "16": 0.004162069875746965, "64": 0.0011526538291946054, "256": 0.0003148310643155128, "1024": 0.00012076532584615052}, "model.layers.15.mlp.gate_proj.weight": {"1": 0.045468635857105255, "4": 0.010950091294944286, "16": 0.0025912669952958822, "64": 0.0007378553855232894, "256": 0.00019522479851730168, "1024": 7.285273022716865e-05}, "model.layers.15.mlp.up_proj.weight": {"1": 0.046039704233407974, "4": 0.010554411448538303, "16": 0.0025578534696251154, "64": 0.0007368801161646843, "256": 0.00020413615857250988, "1024": 7.731385267106816e-05}, "model.layers.15.mlp.down_proj.weight": {"1": 0.029180502519011497, "4": 0.008169776760041714, "16": 0.0018297474598512053, "64": 0.0005215237615630031, "256": 0.00018139369785785675, "1024": 9.099959424929693e-05}, "model.layers.15.input_layernorm.weight": {"1": 0.06203458830714226, "4": 0.024793287739157677, "16": 0.003255364252254367, "64": 0.002105953637510538, "256": 0.0002703401551116258, "1024": 0.00012161985068814829}, "model.layers.15.post_attention_layernorm.weight": {"1": 0.041638296097517014, "4": 0.012411798350512981, "16": 0.0028245856519788504, "64": 0.0007795020355843008, "256": 0.00019049856928177178, "1024": 5.2521969337249175e-05}, "model.norm.weight": {"1": 0.0, "4": 0.0, "16": 1.3479660299748307e-14, "64": 2.2084845887823668e-13, "256": 3.477050895470124e-12, "1024": 5.953768728028663e-11}}