{"model.embed_tokens.weight": {"1": 0.32232680916786194, "4": 0.07750754803419113, "16": 0.04576542600989342, "64": 0.027462726458907127, "256": 0.027342870831489563, "1024": 0.027548952028155327}, "model.layers.0.self_attn.q_proj.weight": {"1": 1.3500385284423828, "4": 0.25823262333869934, "16": 0.17141403257846832, "64": 0.08959326148033142, "256": 0.1104671061038971, "1024": 0.1123402863740921}, "model.layers.0.self_attn.k_proj.weight": {"1": 1.6048723459243774, "4": 0.2808077335357666, "16": 0.19688278436660767, "64": 0.12097541987895966, "256": 0.11737098544836044, "1024": 0.12960976362228394}, "model.layers.0.self_attn.v_proj.weight": {"1": 1.3169474601745605, "4": 0.2970869541168213, "16": 0.17137503623962402, "64": 0.10187435150146484, "256": 0.09664688259363174, "1024": 0.0963672399520874}, "model.layers.0.self_attn.o_proj.weight": {"1": 0.9480679631233215, "4": 0.23088935017585754, "16": 0.1339050829410553, "64": 0.08260361850261688, "256": 0.08332116901874542, "1024": 0.08383065462112427}, "model.layers.0.mlp.gate_proj.weight": {"1": 0.8124935030937195, "4": 0.18112537264823914, "16": 0.09261034429073334, "64": 0.06097523123025894, "256": 0.061448805034160614, "1024": 0.061142317950725555}, "model.layers.0.mlp.up_proj.weight": {"1": 0.9261950254440308, "4": 0.22411300241947174, "16": 0.12060408294200897, "64": 0.07330713421106339, "256": 0.07287626713514328, "1024": 0.07334652543067932}, "model.layers.0.mlp.down_proj.weight": {"1": 0.9805135130882263, "4": 0.20778842270374298, "16": 0.11408251523971558, "64": 0.07059960067272186, "256": 0.07421520352363586, "1024": 0.0727822333574295}, "model.layers.0.input_layernorm.weight": {"1": 1.3625133037567139, "4": 0.09153713285923004, "16": 0.17999213933944702, "64": 0.09191139787435532, "256": 0.05466154217720032, "1024": 0.05575861036777496}, "model.layers.0.post_attention_layernorm.weight": {"1": 0.8370009660720825, "4": 0.19825805723667145, "16": 0.11728063225746155, "64": 0.0790310949087143, "256": 0.07894056290388107, "1024": 0.07931707054376602}, "model.layers.1.self_attn.q_proj.weight": {"1": 2.6082353591918945, "4": 0.3341374099254608, "16": 0.14528211951255798, "64": 0.08812040835618973, "256": 0.0813942700624466, "1024": 0.08269510418176651}, "model.layers.1.self_attn.k_proj.weight": {"1": 1.6444464921951294, "4": 0.3653080463409424, "16": 0.1444951593875885, "64": 0.07732823491096497, "256": 0.07279130071401596, "1024": 0.07484626024961472}, "model.layers.1.self_attn.v_proj.weight": {"1": 1.623691201210022, "4": 0.2783695161342621, "16": 0.13626377284526825, "64": 0.07380760461091995, "256": 0.07783577591180801, "1024": 0.07364192605018616}, "model.layers.1.self_attn.o_proj.weight": {"1": 0.9237194061279297, "4": 0.19867511093616486, "16": 0.10532794892787933, "64": 0.06348342448472977, "256": 0.06341864913702011, "1024": 0.06277807801961899}, "model.layers.1.mlp.gate_proj.weight": {"1": 0.9117048382759094, "4": 0.21750126779079437, "16": 0.11040829867124557, "64": 0.06604158133268356, "256": 0.06324805319309235, "1024": 0.06332586705684662}, "model.layers.1.mlp.up_proj.weight": {"1": 0.956207811832428, "4": 0.2221977263689041, "16": 0.11581895500421524, "64": 0.0664791688323021, "256": 0.06569960713386536, "1024": 0.06436017900705338}, "model.layers.1.mlp.down_proj.weight": {"1": 0.3719816207885742, "4": 0.08904346078634262, "16": 0.04489539563655853, "64": 0.0246950201690197, "256": 0.0220313910394907, "1024": 0.022297536954283714}, "model.layers.1.input_layernorm.weight": {"1": 1.663440227508545, "4": 0.5189417600631714, "16": 0.062469545751810074, "64": 0.0354030504822731, "256": 0.02131732553243637, "1024": 0.013075679540634155}, "model.layers.1.post_attention_layernorm.weight": {"1": 0.9977421760559082, "4": 0.27819183468818665, "16": 0.12926271557807922, "64": 0.08066956698894501, "256": 0.08386816829442978, "1024": 0.08165418356657028}, "model.layers.2.self_attn.q_proj.weight": {"1": 0.6825031042098999, "4": 0.12626051902770996, "16": 0.09006702154874802, "64": 0.07101888954639435, "256": 0.08096563816070557, "1024": 0.08387573063373566}, "model.layers.2.self_attn.k_proj.weight": {"1": 1.1649589538574219, "4": 0.2394658327102661, "16": 0.09315314143896103, "64": 0.06385555118322372, "256": 0.07079046219587326, "1024": 0.06788843870162964}, "model.layers.2.self_attn.v_proj.weight": {"1": 2.0657429695129395, "4": 0.3944760859012604, "16": 0.18063883483409882, "64": 0.0823751837015152, "256": 0.07505479454994202, "1024": 0.07188498228788376}, "model.layers.2.self_attn.o_proj.weight": {"1": 0.8908814787864685, "4": 0.1700006127357483, "16": 0.09785330295562744, "64": 0.05628357455134392, "256": 0.05344598367810249, "1024": 0.05248701572418213}, "model.layers.2.mlp.gate_proj.weight": {"1": 0.8242954015731812, "4": 0.1778024137020111, "16": 0.09391631931066513, "64": 0.058896396309137344, "256": 0.05305957421660423, "1024": 0.052949633449316025}, "model.layers.2.mlp.up_proj.weight": {"1": 0.9796479940414429, "4": 0.20086218416690826, "16": 0.09889490902423859, "64": 0.06356076151132584, "256": 0.0580347515642643, "1024": 0.057172585278749466}, "model.layers.2.mlp.down_proj.weight": {"1": 0.6705122590065002, "4": 0.14779241383075714, "16": 0.0803675651550293, "64": 0.0479443334043026, "256": 0.04410150274634361, "1024": 0.04372663423418999}, "model.layers.2.input_layernorm.weight": {"1": 8.079272270202637, "4": 0.03469689562916756, "16": 0.1561630517244339, "64": 0.3803986608982086, "256": 0.26930248737335205, "1024": 0.3487485647201538}, "model.layers.2.post_attention_layernorm.weight": {"1": 1.2303216457366943, "4": 0.16717782616615295, "16": 0.10440030694007874, "64": 0.0881137102842331, "256": 0.07493994385004044, "1024": 0.07712850719690323}, "model.layers.3.self_attn.q_proj.weight": {"1": 0.72869873046875, "4": 0.2273235321044922, "16": 0.10768016427755356, "64": 0.10422291606664658, "256": 0.09981834143400192, "1024": 0.09906350076198578}, "model.layers.3.self_attn.k_proj.weight": {"1": 0.7594853043556213, "4": 0.2444625347852707, "16": 0.1050882488489151, "64": 0.10922327637672424, "256": 0.10324512422084808, "1024": 0.10226906836032867}, "model.layers.3.self_attn.v_proj.weight": {"1": 1.0493693351745605, "4": 0.28369998931884766, "16": 0.1386188566684723, "64": 0.06366076320409775, "256": 0.05894775316119194, "1024": 0.056698787957429886}, "model.layers.3.self_attn.o_proj.weight": {"1": 0.6176233291625977, "4": 0.14228995144367218, "16": 0.07604245096445084, "64": 0.042391009628772736, "256": 0.04115058481693268, "1024": 0.04007018730044365}, "model.layers.3.mlp.gate_proj.weight": {"1": 0.7012240886688232, "4": 0.16906273365020752, "16": 0.0997336357831955, "64": 0.053042907267808914, "256": 0.04822886735200882, "1024": 0.048076435923576355}, "model.layers.3.mlp.up_proj.weight": {"1": 0.6509116291999817, "4": 0.16462171077728271, "16": 0.08824946731328964, "64": 0.04506710171699524, "256": 0.04315740987658501, "1024": 0.04188267141580582}, "model.layers.3.mlp.down_proj.weight": {"1": 0.5033785700798035, "4": 0.1305154711008072, "16": 0.0777755007147789, "64": 0.03994850441813469, "256": 0.03659544885158539, "1024": 0.0369560532271862}, "model.layers.3.input_layernorm.weight": {"1": 6.994138240814209, "4": 0.054808441549539566, "16": 0.023428576067090034, "64": 0.34555259346961975, "256": 0.040866319090127945, "1024": 0.03605581074953079}, "model.layers.3.post_attention_layernorm.weight": {"1": 0.8027821183204651, "4": 0.19337154924869537, "16": 0.1140492856502533, "64": 0.06158854812383652, "256": 0.060477469116449356, "1024": 0.06003616750240326}, "model.layers.4.self_attn.q_proj.weight": {"1": 0.5184328556060791, "4": 0.08562090992927551, "16": 0.07881193608045578, "64": 0.03392678126692772, "256": 0.038409288972616196, "1024": 0.037606995552778244}, "model.layers.4.self_attn.k_proj.weight": {"1": 0.4179142117500305, "4": 0.13714098930358887, "16": 0.07005492597818375, "64": 0.04015309736132622, "256": 0.04291198030114174, "1024": 0.04068977013230324}, "model.layers.4.self_attn.v_proj.weight": {"1": 0.7848964333534241, "4": 0.18816757202148438, "16": 0.11514222621917725, "64": 0.05236425623297691, "256": 0.04491252452135086, "1024": 0.04377495497465134}, "model.layers.4.self_attn.o_proj.weight": {"1": 0.4868355095386505, "4": 0.12459343671798706, "16": 0.07146456837654114, "64": 0.039235200732946396, "256": 0.03568486124277115, "1024": 0.03526982665061951}, "model.layers.4.mlp.gate_proj.weight": {"1": 0.5762957334518433, "4": 0.15107545256614685, "16": 0.08182340860366821, "64": 0.05010489746928215, "256": 0.044946782290935516, "1024": 0.04473213478922844}, "model.layers.4.mlp.up_proj.weight": {"1": 0.5631811022758484, "4": 0.14164073765277863, "16": 0.0825345441699028, "64": 0.04394209757447243, "256": 0.038016289472579956, "1024": 0.03827757388353348}, "model.layers.4.mlp.down_proj.weight": {"1": 0.44902941584587097, "4": 0.11907932907342911, "16": 0.06492813676595688, "64": 0.038220956921577454, "256": 0.03341846913099289, "1024": 0.034170545637607574}, "model.layers.4.input_layernorm.weight": {"1": 0.18468426167964935, "4": 0.06480280309915543, "16": 0.010920238681137562, "64": 0.004751862958073616, "256": 0.00800806749612093, "1024": 0.01746591180562973}, "model.layers.4.post_attention_layernorm.weight": {"1": 0.573096513748169, "4": 0.15382333099842072, "16": 0.07805518060922623, "64": 0.05773007124662399, "256": 0.052085988223552704, "1024": 0.050576359033584595}, "model.layers.5.self_attn.q_proj.weight": {"1": 0.6495600342750549, "4": 0.16757260262966156, "16": 0.0961330309510231, "64": 0.06843677908182144, "256": 0.06442105770111084, "1024": 0.05503802374005318}, "model.layers.5.self_attn.k_proj.weight": {"1": 0.5777522921562195, "4": 0.1150604635477066, "16": 0.052912723273038864, "64": 0.06067715585231781, "256": 0.054162006825208664, "1024": 0.041682783514261246}, "model.layers.5.self_attn.v_proj.weight": {"1": 0.8703118562698364, "4": 0.24867862462997437, "16": 0.10931508243083954, "64": 0.05852301046252251, "256": 0.04465110972523689, "1024": 0.04487717151641846}, "model.layers.5.self_attn.o_proj.weight": {"1": 0.3845295310020447, "4": 0.10193096101284027, "16": 0.05552142113447189, "64": 0.032915081828832626, "256": 0.02888673171401024, "1024": 0.02955164946615696}, "model.layers.5.mlp.gate_proj.weight": {"1": 0.27929019927978516, "4": 0.09089851379394531, "16": 0.05437644571065903, "64": 0.04438379779458046, "256": 0.034195832908153534, "1024": 0.03573903441429138}, "model.layers.5.mlp.up_proj.weight": {"1": 0.41520020365715027, "4": 0.11392731219530106, "16": 0.06509867310523987, "64": 0.043464068323373795, "256": 0.03493938967585564, "1024": 0.036572862416505814}, "model.layers.5.mlp.down_proj.weight": {"1": 0.35867640376091003, "4": 0.09207993000745773, "16": 0.05082494765520096, "64": 0.032619304955005646, "256": 0.027884995564818382, "1024": 0.028643643483519554}, "model.layers.5.input_layernorm.weight": {"1": 0.02516085095703602, "4": 0.22085411846637726, "16": 0.20977532863616943, "64": 0.19237388670444489, "256": 0.12805159389972687, "1024": 0.15090221166610718}, "model.layers.5.post_attention_layernorm.weight": {"1": 0.30806607007980347, "4": 0.12242750078439713, "16": 0.06850756704807281, "64": 0.05524902790784836, "256": 0.044001609086990356, "1024": 0.04680413752794266}, "model.layers.6.self_attn.q_proj.weight": {"1": 0.5726140141487122, "4": 0.20656365156173706, "16": 0.08057951927185059, "64": 0.04861833155155182, "256": 0.04617181047797203, "1024": 0.04738301783800125}, "model.layers.6.self_attn.k_proj.weight": {"1": 0.3951157033443451, "4": 0.08622506260871887, "16": 0.05577234923839569, "64": 0.03836217150092125, "256": 0.03602191060781479, "1024": 0.035082340240478516}, "model.layers.6.self_attn.v_proj.weight": {"1": 0.5948916077613831, "4": 0.17472587525844574, "16": 0.081135593354702, "64": 0.04474937915802002, "256": 0.03568437695503235, "1024": 0.036383096128702164}, "model.layers.6.self_attn.o_proj.weight": {"1": 0.3362196981906891, "4": 0.08057449012994766, "16": 0.04891091585159302, "64": 0.028823042288422585, "256": 0.025739209726452827, "1024": 0.026185357943177223}, "model.layers.6.mlp.gate_proj.weight": {"1": 0.3953127861022949, "4": 0.12181805074214935, "16": 0.06434635818004608, "64": 0.03456230089068413, "256": 0.03296225145459175, "1024": 0.03268912807106972}, "model.layers.6.mlp.up_proj.weight": {"1": 0.4129117429256439, "4": 0.11312733590602875, "16": 0.06892205029726028, "64": 0.034022338688373566, "256": 0.031727906316518784, "1024": 0.03146376088261604}, "model.layers.6.mlp.down_proj.weight": {"1": 0.3600001037120819, "4": 0.09435323625802994, "16": 0.053096503019332886, "64": 0.027996238321065903, "256": 0.02650955505669117, "1024": 0.026074888184666634}, "model.layers.6.input_layernorm.weight": {"1": 0.26544907689094543, "4": 0.1466922014951706, "16": 0.11854832619428635, "64": 0.06470448523759842, "256": 0.17171455919742584, "1024": 0.13194388151168823}, "model.layers.6.post_attention_layernorm.weight": {"1": 0.4055179953575134, "4": 0.13305869698524475, "16": 0.07636499404907227, "64": 0.04599494859576225, "256": 0.04604361206293106, "1024": 0.04774435609579086}, "model.layers.7.self_attn.q_proj.weight": {"1": 0.36033153533935547, "4": 0.11922699213027954, "16": 0.07292252779006958, "64": 0.04055357724428177, "256": 0.03216929733753204, "1024": 0.03329532966017723}, "model.layers.7.self_attn.k_proj.weight": {"1": 0.6969581842422485, "4": 0.12169089168310165, "16": 0.08508111536502838, "64": 0.03695768117904663, "256": 0.0302522461861372, "1024": 0.031035587191581726}, "model.layers.7.self_attn.v_proj.weight": {"1": 0.5021153092384338, "4": 0.13429932296276093, "16": 0.06875009834766388, "64": 0.032006245106458664, "256": 0.02946089766919613, "1024": 0.028134193271398544}, "model.layers.7.self_attn.o_proj.weight": {"1": 0.32454726099967957, "4": 0.08200830966234207, "16": 0.04823409020900726, "64": 0.02535255253314972, "256": 0.023652559146285057, "1024": 0.02385566383600235}, "model.layers.7.mlp.gate_proj.weight": {"1": 0.43115234375, "4": 0.09826376289129257, "16": 0.061876080930233, "64": 0.03466640040278435, "256": 0.034229304641485214, "1024": 0.0312579907476902}, "model.layers.7.mlp.up_proj.weight": {"1": 0.42093318700790405, "4": 0.09879418462514877, "16": 0.05934422090649605, "64": 0.030032893642783165, "256": 0.02969173528254032, "1024": 0.028864972293376923}, "model.layers.7.mlp.down_proj.weight": {"1": 0.33018994331359863, "4": 0.0829804316163063, "16": 0.0503644123673439, "64": 0.02539565972983837, "256": 0.02447950467467308, "1024": 0.024151818826794624}, "model.layers.7.input_layernorm.weight": {"1": 0.5929185748100281, "4": 0.016016993671655655, "16": 0.009052523411810398, "64": 0.03554142639040947, "256": 0.014844928868114948, "1024": 0.026122616603970528}, "model.layers.7.post_attention_layernorm.weight": {"1": 1.3024258613586426, "4": 0.09841741621494293, "16": 0.080252505838871, "64": 0.048610664904117584, "256": 0.04723803326487541, "1024": 0.04395316541194916}, "model.layers.8.self_attn.q_proj.weight": {"1": 0.29094162583351135, "4": 0.09943092614412308, "16": 0.04529315605759621, "64": 0.023153409361839294, "256": 0.029088620096445084, "1024": 0.029874851927161217}, "model.layers.8.self_attn.k_proj.weight": {"1": 0.6864627599716187, "4": 0.13046039640903473, "16": 0.04484208673238754, "64": 0.03293709084391594, "256": 0.035291656851768494, "1024": 0.03418515622615814}, "model.layers.8.self_attn.v_proj.weight": {"1": 0.44906505942344666, "4": 0.12189701944589615, "16": 0.07068412005901337, "64": 0.030108967795968056, "256": 0.02830687165260315, "1024": 0.027666114270687103}, "model.layers.8.self_attn.o_proj.weight": {"1": 0.2962900996208191, "4": 0.07694969326257706, "16": 0.047882143408060074, "64": 0.0248729158192873, "256": 0.022265931591391563, "1024": 0.02256297878921032}, "model.layers.8.mlp.gate_proj.weight": {"1": 0.3152430057525635, "4": 0.09044687449932098, "16": 0.0559023916721344, "64": 0.033188849687576294, "256": 0.030778635293245316, "1024": 0.029132183641195297}, "model.layers.8.mlp.up_proj.weight": {"1": 0.3229168653488159, "4": 0.0855853259563446, "16": 0.052249759435653687, "64": 0.02658921293914318, "256": 0.02407822757959366, "1024": 0.024127837270498276}, "model.layers.8.mlp.down_proj.weight": {"1": 0.2822558283805847, "4": 0.07603177428245544, "16": 0.045478455722332, "64": 0.022993728518486023, "256": 0.021491488441824913, "1024": 0.021242301911115646}, "model.layers.8.input_layernorm.weight": {"1": 0.3980277180671692, "4": 0.11061572283506393, "16": 0.21352097392082214, "64": 0.03961116820573807, "256": 0.04478773847222328, "1024": 0.03652598708868027}, "model.layers.8.post_attention_layernorm.weight": {"1": 0.13235072791576385, "4": 0.15083731710910797, "16": 0.04992637410759926, "64": 0.0503569096326828, "256": 0.05871029198169708, "1024": 0.054717183113098145}, "model.layers.9.self_attn.q_proj.weight": {"1": 0.294830858707428, "4": 0.04401104897260666, "16": 0.051250796765089035, "64": 0.018698066473007202, "256": 0.022011684253811836, "1024": 0.018906762823462486}, "model.layers.9.self_attn.k_proj.weight": {"1": 0.4574751555919647, "4": 0.06876067817211151, "16": 0.0843147337436676, "64": 0.026562171056866646, "256": 0.023101497441530228, "1024": 0.024166114628314972}, "model.layers.9.self_attn.v_proj.weight": {"1": 0.3898225724697113, "4": 0.09465107321739197, "16": 0.054382529109716415, "64": 0.026391953229904175, "256": 0.025145839899778366, "1024": 0.02435254491865635}, "model.layers.9.self_attn.o_proj.weight": {"1": 0.28284120559692383, "4": 0.07748465240001678, "16": 0.04674435779452324, "64": 0.022726941853761673, "256": 0.021046623587608337, "1024": 0.020895585417747498}, "model.layers.9.mlp.gate_proj.weight": {"1": 0.3037087321281433, "4": 0.06524765491485596, "16": 0.03546253219246864, "64": 0.019321013242006302, "256": 0.018604932352900505, "1024": 0.018952859565615654}, "model.layers.9.mlp.up_proj.weight": {"1": 0.2970978617668152, "4": 0.0699574425816536, "16": 0.03877544403076172, "64": 0.017813777551054955, "256": 0.016144316643476486, "1024": 0.01657579094171524}, "model.layers.9.mlp.down_proj.weight": {"1": 0.23709772527217865, "4": 0.06789608299732208, "16": 0.030480120331048965, "64": 0.01758425496518612, "256": 0.016786441206932068, "1024": 0.016610698774456978}, "model.layers.9.input_layernorm.weight": {"1": 0.5838891267776489, "4": 0.03436868265271187, "16": 0.11780451238155365, "64": 0.012812399305403233, "256": 0.01862942986190319, "1024": 0.01685958169400692}, "model.layers.9.post_attention_layernorm.weight": {"1": 0.5043879151344299, "4": 0.07774768769741058, "16": 0.041359324008226395, "64": 0.02625230886042118, "256": 0.029531238600611687, "1024": 0.02768006920814514}, "model.layers.10.self_attn.q_proj.weight": {"1": 0.14900211989879608, "4": 0.07236462831497192, "16": 0.020743180066347122, "64": 0.007142823655158281, "256": 0.003786309389397502, "1024": 0.003671560902148485}, "model.layers.10.self_attn.k_proj.weight": {"1": 0.42979130148887634, "4": 0.22627772390842438, "16": 0.09842410683631897, "64": 0.02048512175679207, "256": 0.011528495699167252, "1024": 0.010877535678446293}, "model.layers.10.self_attn.v_proj.weight": {"1": 0.6861532330513, "4": 0.15625615417957306, "16": 0.0527760274708271, "64": 0.028694352135062218, "256": 0.021755468100309372, "1024": 0.020901978015899658}, "model.layers.10.self_attn.o_proj.weight": {"1": 0.28248998522758484, "4": 0.06686493009328842, "16": 0.031129946932196617, "64": 0.01907726190984249, "256": 0.017970498651266098, "1024": 0.017514344304800034}, "model.layers.10.mlp.gate_proj.weight": {"1": 0.259822279214859, "4": 0.052920326590538025, "16": 0.025524044409394264, "64": 0.016110779717564583, "256": 0.014692689292132854, "1024": 0.014766111969947815}, "model.layers.10.mlp.up_proj.weight": {"1": 0.17582648992538452, "4": 0.049482520669698715, "16": 0.025785310193896294, "64": 0.016938727349042892, "256": 0.015072518028318882, "1024": 0.01508477795869112}, "model.layers.10.mlp.down_proj.weight": {"1": 0.1523008793592453, "4": 0.040823813527822495, "16": 0.022876938804984093, "64": 0.014240655116736889, "256": 0.013124109245836735, "1024": 0.013010903261601925}, "model.layers.10.input_layernorm.weight": {"1": 1.6057647466659546, "4": 0.09091441333293915, "16": 0.02047785371541977, "64": 0.03721952065825462, "256": 0.01139636617153883, "1024": 0.011179346591234207}, "model.layers.10.post_attention_layernorm.weight": {"1": 0.258114218711853, "4": 0.055981751531362534, "16": 0.035422831773757935, "64": 0.02285928651690483, "256": 0.021019645035266876, "1024": 0.021062053740024567}, "model.layers.11.self_attn.q_proj.weight": {"1": 0.25550147891044617, "4": 0.048751845955848694, "16": 0.012143934145569801, "64": 0.011449888348579407, "256": 0.008906230330467224, "1024": 0.007010519504547119}, "model.layers.11.self_attn.k_proj.weight": {"1": 0.3866561949253082, "4": 0.05973345413804054, "16": 0.03038228303194046, "64": 0.02151486650109291, "256": 0.008982028812170029, "1024": 0.007147032301872969}, "model.layers.11.self_attn.v_proj.weight": {"1": 0.4153164029121399, "4": 0.11774295568466187, "16": 0.049508046358823776, "64": 0.02282389998435974, "256": 0.016809474676847458, "1024": 0.016744008287787437}, "model.layers.11.self_attn.o_proj.weight": {"1": 0.16805170476436615, "4": 0.045696791261434555, "16": 0.024013567715883255, "64": 0.014895117841660976, "256": 0.01316488441079855, "1024": 0.012841837480664253}, "model.layers.11.mlp.gate_proj.weight": {"1": 0.14142535626888275, "4": 0.04031422361731529, "16": 0.022732507437467575, "64": 0.013873201794922352, "256": 0.012127918191254139, "1024": 0.01189750712364912}, "model.layers.11.mlp.up_proj.weight": {"1": 0.15531817078590393, "4": 0.04244584962725639, "16": 0.022398196160793304, "64": 0.013104659505188465, "256": 0.01198047399520874, "1024": 0.011856818571686745}, "model.layers.11.mlp.down_proj.weight": {"1": 0.12962739169597626, "4": 0.034799765795469284, "16": 0.017433080822229385, "64": 0.010930691845715046, "256": 0.009571975097060204, "1024": 0.009370970539748669}, "model.layers.11.input_layernorm.weight": {"1": 0.010095915757119656, "4": 0.012284161522984505, "16": 0.041473910212516785, "64": 0.04386681318283081, "256": 0.01134450826793909, "1024": 0.018199462443590164}, "model.layers.11.post_attention_layernorm.weight": {"1": 0.15256810188293457, "4": 0.04311325028538704, "16": 0.02387959137558937, "64": 0.015991058200597763, "256": 0.015655210241675377, "1024": 0.015252199955284595}, "model.layers.12.self_attn.q_proj.weight": {"1": 0.4198363721370697, "4": 0.12743636965751648, "16": 0.04176666587591171, "64": 0.02207248844206333, "256": 0.00960505846887827, "1024": 0.012944699265062809}, "model.layers.12.self_attn.k_proj.weight": {"1": 0.3225225508213043, "4": 0.06017113849520683, "16": 0.04710348695516586, "64": 0.02021433226764202, "256": 0.009587806649506092, "1024": 0.013618435710668564}, "model.layers.12.self_attn.v_proj.weight": {"1": 0.49008888006210327, "4": 0.11955643445253372, "16": 0.042520057410001755, "64": 0.01880744658410549, "256": 0.013189335353672504, "1024": 0.013072171248495579}, "model.layers.12.self_attn.o_proj.weight": {"1": 0.16250231862068176, "4": 0.03836187347769737, "16": 0.019802473485469818, "64": 0.01215620432049036, "256": 0.010417706333100796, "1024": 0.010397038422524929}, "model.layers.12.mlp.gate_proj.weight": {"1": 0.13128383457660675, "4": 0.030940257012844086, "16": 0.01467060949653387, "64": 0.00931678619235754, "256": 0.00830073095858097, "1024": 0.008123017847537994}, "model.layers.12.mlp.up_proj.weight": {"1": 0.12610942125320435, "4": 0.029826994985342026, "16": 0.014489442110061646, "64": 0.009159446693956852, "256": 0.0083418944850564, "1024": 0.008138533681631088}, "model.layers.12.mlp.down_proj.weight": {"1": 0.09509384632110596, "4": 0.023274339735507965, "16": 0.011344789527356625, "64": 0.008016831241548061, "256": 0.006698773708194494, "1024": 0.006793067324906588}, "model.layers.12.input_layernorm.weight": {"1": 0.06683720648288727, "4": 0.014220465905964375, "16": 0.033912625163793564, "64": 0.036594878882169724, "256": 0.0210626982152462, "1024": 0.035387828946113586}, "model.layers.12.post_attention_layernorm.weight": {"1": 0.13656775653362274, "4": 0.03317907825112343, "16": 0.02034989930689335, "64": 0.013716920278966427, "256": 0.012652553617954254, "1024": 0.012739500030875206}, "model.layers.13.self_attn.q_proj.weight": {"1": 0.06048744544386864, "4": 0.02809189260005951, "16": 0.016117844730615616, "64": 0.013119004666805267, "256": 0.012612580321729183, "1024": 0.010332779958844185}, "model.layers.13.self_attn.k_proj.weight": {"1": 0.08322291076183319, "4": 0.02233917824923992, "16": 0.016550293192267418, "64": 0.015507591888308525, "256": 0.013232686556875706, "1024": 0.010791993699967861}, "model.layers.13.self_attn.v_proj.weight": {"1": 0.4656282067298889, "4": 0.11589250713586807, "16": 0.03678624704480171, "64": 0.015339894220232964, "256": 0.010061494074761868, "1024": 0.009110958315432072}, "model.layers.13.self_attn.o_proj.weight": {"1": 0.20804357528686523, "4": 0.051429633051157, "16": 0.019879475235939026, "64": 0.009798755869269371, "256": 0.007297065109014511, "1024": 0.007047827355563641}, "model.layers.13.mlp.gate_proj.weight": {"1": 0.08164666593074799, "4": 0.019186990335583687, "16": 0.008563177660107613, "64": 0.005250766407698393, "256": 0.004690397996455431, "1024": 0.0046109785325825214}, "model.layers.13.mlp.up_proj.weight": {"1": 0.08164769411087036, "4": 0.019819173961877823, "16": 0.009316753596067429, "64": 0.005705669056624174, "256": 0.005213127937167883, "1024": 0.005086576100438833}, "model.layers.13.mlp.down_proj.weight": {"1": 0.06748180091381073, "4": 0.01791725866496563, "16": 0.008352537639439106, "64": 0.004614262375980616, "256": 0.004054047167301178, "1024": 0.0040255081839859486}, "model.layers.13.input_layernorm.weight": {"1": 0.11067476123571396, "4": 0.050245363265275955, "16": 0.0451710969209671, "64": 0.019149230793118477, "256": 0.016848251223564148, "1024": 0.014464292675256729}, "model.layers.13.post_attention_layernorm.weight": {"1": 0.08311104774475098, "4": 0.020665930584073067, "16": 0.011733492836356163, "64": 0.008350277319550514, "256": 0.00805735494941473, "1024": 0.008050279691815376}, "model.layers.14.self_attn.q_proj.weight": {"1": 0.05714922025799751, "4": 0.04940575733780861, "16": 0.029400788247585297, "64": 0.005299882031977177, "256": 0.003767374437302351, "1024": 0.00453852629289031}, "model.layers.14.self_attn.k_proj.weight": {"1": 0.06423240900039673, "4": 0.02755938470363617, "16": 0.014914080500602722, "64": 0.00252514542080462, "256": 0.001430919743143022, "1024": 0.0017205963376909494}, "model.layers.14.self_attn.v_proj.weight": {"1": 0.4145267605781555, "4": 0.10317455232143402, "16": 0.031380753964185715, "64": 0.013342680409550667, "256": 0.007766135036945343, "1024": 0.006785739678889513}, "model.layers.14.self_attn.o_proj.weight": {"1": 0.0825657770037651, "4": 0.022290082648396492, "16": 0.008667394518852234, "64": 0.004958077799528837, "256": 0.004265992436558008, "1024": 0.00414639338850975}, "model.layers.14.mlp.gate_proj.weight": {"1": 0.054715175181627274, "4": 0.014475100673735142, "16": 0.005301153287291527, "64": 0.0028426756616681814, "256": 0.002348666312173009, "1024": 0.0022468618117272854}, "model.layers.14.mlp.up_proj.weight": {"1": 0.04884592071175575, "4": 0.012071606703102589, "16": 0.004446901846677065, "64": 0.002627969952300191, "256": 0.002065841341391206, "1024": 0.0020035775378346443}, "model.layers.14.mlp.down_proj.weight": {"1": 0.06225080415606499, "4": 0.01732095517218113, "16": 0.005384000949561596, "64": 0.00284697487950325, "256": 0.0019451358821243048, "1024": 0.0017987174214795232}, "model.layers.14.input_layernorm.weight": {"1": 0.006877061910927296, "4": 0.011637491174042225, "16": 0.022316012531518936, "64": 0.002547594951465726, "256": 0.003745871130377054, "1024": 0.005005002953112125}, "model.layers.14.post_attention_layernorm.weight": {"1": 0.05679301172494888, "4": 0.01403405424207449, "16": 0.008243654854595661, "64": 0.005507970694452524, "256": 0.005095817614346743, "1024": 0.005085721146315336}, "model.layers.15.self_attn.q_proj.weight": {"1": 0.07454059273004532, "4": 0.008071939460933208, "16": 0.009640836156904697, "64": 0.003636155743151903, "256": 0.002760533709079027, "1024": 0.0029193779919296503}, "model.layers.15.self_attn.k_proj.weight": {"1": 0.1196090430021286, "4": 0.010736612603068352, "16": 0.01050722785294056, "64": 0.003868374042212963, "256": 0.0035377840977162123, "1024": 0.0035103512927889824}, "model.layers.15.self_attn.v_proj.weight": {"1": 0.18198883533477783, "4": 0.04592472314834595, "16": 0.013138631358742714, "64": 0.005044234450906515, "256": 0.0032281731255352497, "1024": 0.0028625261038541794}, "model.layers.15.self_attn.o_proj.weight": {"1": 0.05107273533940315, "4": 0.013475618325173855, "16": 0.004249007906764746, "64": 0.002372730290517211, "256": 0.0020905991550534964, "1024": 0.0021101683378219604}, "model.layers.15.mlp.gate_proj.weight": {"1": 0.03125530853867531, "4": 0.007879301905632019, "16": 0.002467326121404767, "64": 0.0010609269374981523, "256": 0.000699855387210846, "1024": 0.0006000357680022717}, "model.layers.15.mlp.up_proj.weight": {"1": 0.03189712390303612, "4": 0.008049946278333664, "16": 0.002529238583520055, "64": 0.0010462714126333594, "256": 0.0007089169812388718, "1024": 0.0006134964060038328}, "model.layers.15.mlp.down_proj.weight": {"1": 0.019089657813310623, "4": 0.005058234557509422, "16": 0.0012172320857644081, "64": 0.00036545470356941223, "256": 0.00015969571541063488, "1024": 0.00010435959848109633}, "model.layers.15.input_layernorm.weight": {"1": 0.08338350057601929, "4": 0.026649199426174164, "16": 0.007004828192293644, "64": 0.0024911181535571814, "256": 0.002751175547018647, "1024": 0.002250462770462036}, "model.layers.15.post_attention_layernorm.weight": {"1": 0.03922557830810547, "4": 0.011513839475810528, "16": 0.00417950889095664, "64": 0.0028567337431013584, "256": 0.0026056256610900164, "1024": 0.0025973254814743996}, "model.norm.weight": {"1": 0.0, "4": 0.0, "16": 1.3479660299748307e-14, "64": 2.2084845887823668e-13, "256": 3.477050895470124e-12, "1024": 5.953768728028663e-11}}