{"model.embed_tokens.weight": {"1": 0.1662873774766922, "4": 0.045718155801296234, "16": 0.011893970891833305, "64": 0.002674684626981616, "256": 0.0012330262688919902, "1024": 0.00036402203841134906}, "model.layers.0.self_attn.q_proj.weight": {"1": 0.42607179284095764, "4": 0.19825685024261475, "16": 0.0509411059319973, "64": 0.008357065729796886, "256": 0.005201013293117285, "1024": 0.0012139794416725636}, "model.layers.0.self_attn.k_proj.weight": {"1": 0.5388311743736267, "4": 0.17309784889221191, "16": 0.09788915514945984, "64": 0.033222496509552, "256": 0.0065336572006344795, "1024": 0.001520628109574318}, "model.layers.0.self_attn.v_proj.weight": {"1": 0.7252984046936035, "4": 0.2040412276983261, "16": 0.05536619946360588, "64": 0.013696557842195034, "256": 0.004959633573889732, "1024": 0.001778111793100834}, "model.layers.0.self_attn.o_proj.weight": {"1": 0.47041288018226624, "4": 0.1340707242488861, "16": 0.036717917770147324, "64": 0.0075408704578876495, "256": 0.0034277134109288454, "1024": 0.0011657580034807324}, "model.layers.0.mlp.gate_proj.weight": {"1": 0.3823353052139282, "4": 0.11322600394487381, "16": 0.02732313796877861, "64": 0.0062608434818685055, "256": 0.0030179184395819902, "1024": 0.0009944441262632608}, "model.layers.0.mlp.up_proj.weight": {"1": 0.48739808797836304, "4": 0.1433139592409134, "16": 0.03801023215055466, "64": 0.007836686447262764, "256": 0.003566646482795477, "1024": 0.0011427259305492043}, "model.layers.0.mlp.down_proj.weight": {"1": 0.4846201539039612, "4": 0.13999219238758087, "16": 0.03872250020503998, "64": 0.007352297659963369, "256": 0.0035476796329021454, "1024": 0.0013620463432744145}, "model.layers.0.input_layernorm.weight": {"1": 0.2265327125787735, "4": 0.0693894699215889, "16": 0.02904864028096199, "64": 0.0034719021059572697, "256": 0.0013373735127970576, "1024": 0.0005895171780139208}, "model.layers.0.post_attention_layernorm.weight": {"1": 0.4421984851360321, "4": 0.11035975813865662, "16": 0.028170980513095856, "64": 0.0065805078484117985, "256": 0.003270824672654271, "1024": 0.001115416525863111}, "model.layers.1.self_attn.q_proj.weight": {"1": 0.6193590760231018, "4": 0.15325601398944855, "16": 0.06214084476232529, "64": 0.010469034314155579, "256": 0.005409024190157652, "1024": 0.0016572738531976938}, "model.layers.1.self_attn.k_proj.weight": {"1": 0.43924978375434875, "4": 0.1597011685371399, "16": 0.09637361764907837, "64": 0.014779838733375072, "256": 0.0048333508893847466, "1024": 0.0016337822889909148}, "model.layers.1.self_attn.v_proj.weight": {"1": 0.7421355843544006, "4": 0.25372809171676636, "16": 0.06688442826271057, "64": 0.01762406900525093, "256": 0.011182648129761219, "1024": 0.0062920451164245605}, "model.layers.1.self_attn.o_proj.weight": {"1": 0.4570844769477844, "4": 0.13712316751480103, "16": 0.036723919212818146, "64": 0.006850472651422024, "256": 0.003339622402563691, "1024": 0.0010498956544324756}, "model.layers.1.mlp.gate_proj.weight": {"1": 0.503679096698761, "4": 0.1458376795053482, "16": 0.03542293980717659, "64": 0.0074887326918542385, "256": 0.00369048397988081, "1024": 0.0010736434487625957}, "model.layers.1.mlp.up_proj.weight": {"1": 0.5128355026245117, "4": 0.1551702469587326, "16": 0.03817494586110115, "64": 0.007635137531906366, "256": 0.0035562028642743826, "1024": 0.0011268004309386015}, "model.layers.1.mlp.down_proj.weight": {"1": 0.2549022436141968, "4": 0.07159683108329773, "16": 0.0185000691562891, "64": 0.0058629438281059265, "256": 0.0021577354054898024, "1024": 0.0014408157439902425}, "model.layers.1.input_layernorm.weight": {"1": 0.13954989612102509, "4": 0.434893399477005, "16": 0.10264363884925842, "64": 0.014035822823643684, "256": 0.015093638561666012, "1024": 0.0007738457643426955}, "model.layers.1.post_attention_layernorm.weight": {"1": 1.23784601688385, "4": 0.13471141457557678, "16": 0.05200871080160141, "64": 0.014059066772460938, "256": 0.003552296431735158, "1024": 0.0017079883255064487}, "model.layers.2.self_attn.q_proj.weight": {"1": 0.1580236703157425, "4": 0.07827680557966232, "16": 0.02135450951755047, "64": 0.002871167380362749, "256": 0.001657683402299881, "1024": 0.0007637475500814617}, "model.layers.2.self_attn.k_proj.weight": {"1": 0.21573346853256226, "4": 0.16199368238449097, "16": 0.039703648537397385, "64": 0.005020092241466045, "256": 0.0038824640214443207, "1024": 0.0011474412167444825}, "model.layers.2.self_attn.v_proj.weight": {"1": 1.1127421855926514, "4": 0.32654455304145813, "16": 0.09794411808252335, "64": 0.035138748586177826, "256": 0.022623926401138306, "1024": 0.017946559935808182}, "model.layers.2.self_attn.o_proj.weight": {"1": 0.41988807916641235, "4": 0.1320275366306305, "16": 0.0383652038872242, "64": 0.007209961302578449, "256": 0.003345170058310032, "1024": 0.001197674311697483}, "model.layers.2.mlp.gate_proj.weight": {"1": 0.46683135628700256, "4": 0.14006361365318298, "16": 0.03913576155900955, "64": 0.006808266043663025, "256": 0.0030536241829395294, "1024": 0.0010431346017867327}, "model.layers.2.mlp.up_proj.weight": {"1": 0.5075640082359314, "4": 0.16254109144210815, "16": 0.04498998820781708, "64": 0.007491135038435459, "256": 0.004014185164123774, "1024": 0.0010885620722547174}, "model.layers.2.mlp.down_proj.weight": {"1": 0.41147691011428833, "4": 0.11690961569547653, "16": 0.03195323050022125, "64": 0.006048095878213644, "256": 0.002679460449144244, "1024": 0.0010112865129485726}, "model.layers.2.input_layernorm.weight": {"1": 1.907247543334961, "4": 0.38881346583366394, "16": 0.039374321699142456, "64": 0.0007936132024042308, "256": 0.01050284318625927, "1024": 0.0013556674821302295}, "model.layers.2.post_attention_layernorm.weight": {"1": 0.4664061963558197, "4": 0.14915186166763306, "16": 0.04583889991044998, "64": 0.006288974080234766, "256": 0.004087675828486681, "1024": 0.0009143084171228111}, "model.layers.3.self_attn.q_proj.weight": {"1": 0.6986651420593262, "4": 0.1594415307044983, "16": 0.09252695739269257, "64": 0.00480904383584857, "256": 0.004391852766275406, "1024": 0.0014981328276917338}, "model.layers.3.self_attn.k_proj.weight": {"1": 0.6972332000732422, "4": 0.15607237815856934, "16": 0.09875063598155975, "64": 0.0037654596380889416, "256": 0.004283067770302296, "1024": 0.0012606392847374082}, "model.layers.3.self_attn.v_proj.weight": {"1": 0.9749365448951721, "4": 0.27230697870254517, "16": 0.0824936181306839, "64": 0.02687101811170578, "256": 0.01680309884250164, "1024": 0.014656937681138515}, "model.layers.3.self_attn.o_proj.weight": {"1": 0.3841339945793152, "4": 0.10982290655374527, "16": 0.02810659632086754, "64": 0.006444646045565605, "256": 0.002782456809654832, "1024": 0.0010225980076938868}, "model.layers.3.mlp.gate_proj.weight": {"1": 0.5105745196342468, "4": 0.13597923517227173, "16": 0.03726481646299362, "64": 0.008085747249424458, "256": 0.003425964852795005, "1024": 0.0011307800887152553}, "model.layers.3.mlp.up_proj.weight": {"1": 0.41940632462501526, "4": 0.13852091133594513, "16": 0.03758535906672478, "64": 0.006916666869074106, "256": 0.003260465105995536, "1024": 0.0009802101412788033}, "model.layers.3.mlp.down_proj.weight": {"1": 0.381377249956131, "4": 0.10847415030002594, "16": 0.024589749053120613, "64": 0.006116337608546019, "256": 0.002685812534764409, "1024": 0.0009440801222808659}, "model.layers.3.input_layernorm.weight": {"1": 3.904934883117676, "4": 0.9418230056762695, "16": 0.01951649785041809, "64": 0.00580079760402441, "256": 0.009529639966785908, "1024": 0.0024307300336658955}, "model.layers.3.post_attention_layernorm.weight": {"1": 0.508978545665741, "4": 0.1604815423488617, "16": 0.042676351964473724, "64": 0.007794589269906282, "256": 0.0036579982843250036, "1024": 0.000997969531454146}, "model.layers.4.self_attn.q_proj.weight": {"1": 0.34962108731269836, "4": 0.12260592728853226, "16": 0.04352620989084244, "64": 0.016142264008522034, "256": 0.00591144198551774, "1024": 0.0015074096154421568}, "model.layers.4.self_attn.k_proj.weight": {"1": 0.36859747767448425, "4": 0.09712584316730499, "16": 0.029785413295030594, "64": 0.008137046359479427, "256": 0.002443283563479781, "1024": 0.0008570684003643692}, "model.layers.4.self_attn.v_proj.weight": {"1": 0.6925183534622192, "4": 0.2242475003004074, "16": 0.058768849819898605, "64": 0.03016970120370388, "256": 0.022243740037083626, "1024": 0.017914611846208572}, "model.layers.4.self_attn.o_proj.weight": {"1": 0.33379313349723816, "4": 0.0985506996512413, "16": 0.021738072857260704, "64": 0.005898846313357353, "256": 0.0024851500056684017, "1024": 0.0010025716619566083}, "model.layers.4.mlp.gate_proj.weight": {"1": 0.3993643820285797, "4": 0.12550224363803864, "16": 0.025817273184657097, "64": 0.007653458509594202, "256": 0.0025144924875348806, "1024": 0.0010168469743803144}, "model.layers.4.mlp.up_proj.weight": {"1": 0.40788471698760986, "4": 0.12424225360155106, "16": 0.026016630232334137, "64": 0.00632448261603713, "256": 0.0024434986989945173, "1024": 0.0008741842466406524}, "model.layers.4.mlp.down_proj.weight": {"1": 0.3287700116634369, "4": 0.09752234816551208, "16": 0.01973496936261654, "64": 0.0054476275108754635, "256": 0.0022282993886619806, "1024": 0.0009317260119132698}, "model.layers.4.input_layernorm.weight": {"1": 0.3709874153137207, "4": 0.1612970381975174, "16": 0.05053231865167618, "64": 0.006733202841132879, "256": 0.001595127978362143, "1024": 0.0019504833035171032}, "model.layers.4.post_attention_layernorm.weight": {"1": 0.3922522962093353, "4": 0.11419041454792023, "16": 0.023082898929715157, "64": 0.005547831766307354, "256": 0.002609517192468047, "1024": 0.0006911249947734177}, "model.layers.5.self_attn.q_proj.weight": {"1": 0.2646075487136841, "4": 0.13927510380744934, "16": 0.015711229294538498, "64": 0.005196549464017153, "256": 0.001777258818037808, "1024": 0.0007299176650121808}, "model.layers.5.self_attn.k_proj.weight": {"1": 0.398280531167984, "4": 0.12454944849014282, "16": 0.01505084428936243, "64": 0.004796462599188089, "256": 0.0029775863513350487, "1024": 0.0012726413551717997}, "model.layers.5.self_attn.v_proj.weight": {"1": 0.8391510844230652, "4": 0.27057018876075745, "16": 0.05582078546285629, "64": 0.02839973010122776, "256": 0.017587438225746155, "1024": 0.015059484168887138}, "model.layers.5.self_attn.o_proj.weight": {"1": 0.2884954512119293, "4": 0.08715876936912537, "16": 0.01755472831428051, "64": 0.004752772860229015, "256": 0.001872942317277193, "1024": 0.0007735039107501507}, "model.layers.5.mlp.gate_proj.weight": {"1": 0.2610005736351013, "4": 0.0652543157339096, "16": 0.014120595529675484, "64": 0.006102410610765219, "256": 0.0035857486072927713, "1024": 0.0006264583207666874}, "model.layers.5.mlp.up_proj.weight": {"1": 0.3401379883289337, "4": 0.09830115735530853, "16": 0.019357725977897644, "64": 0.005301452241837978, "256": 0.0030845250003039837, "1024": 0.0007683272124268115}, "model.layers.5.mlp.down_proj.weight": {"1": 0.27693405747413635, "4": 0.08495865017175674, "16": 0.015944216400384903, "64": 0.004782714415341616, "256": 0.002312040887773037, "1024": 0.0007790135568939149}, "model.layers.5.input_layernorm.weight": {"1": 0.09045163542032242, "4": 0.13516557216644287, "16": 0.0009846801403909922, "64": 0.010140769183635712, "256": 0.0033069124910980463, "1024": 0.001200379221700132}, "model.layers.5.post_attention_layernorm.weight": {"1": 0.27249497175216675, "4": 0.08264289051294327, "16": 0.016137436032295227, "64": 0.006195696070790291, "256": 0.0029258145950734615, "1024": 0.0004944719839841127}, "model.layers.6.self_attn.q_proj.weight": {"1": 0.4086463451385498, "4": 0.19369864463806152, "16": 0.025927895680069923, "64": 0.008548246696591377, "256": 0.002348862122744322, "1024": 0.0007287526968866587}, "model.layers.6.self_attn.k_proj.weight": {"1": 0.21802371740341187, "4": 0.08387826383113861, "16": 0.025052471086382866, "64": 0.006291004829108715, "256": 0.003038818947970867, "1024": 0.0006325299036689103}, "model.layers.6.self_attn.v_proj.weight": {"1": 0.6751649975776672, "4": 0.1891307532787323, "16": 0.04363574460148811, "64": 0.01937497965991497, "256": 0.01366827916353941, "1024": 0.010736477561295033}, "model.layers.6.self_attn.o_proj.weight": {"1": 0.275519460439682, "4": 0.08065756410360336, "16": 0.015034779906272888, "64": 0.004343423526734114, "256": 0.0018950988305732608, "1024": 0.0008127745240926743}, "model.layers.6.mlp.gate_proj.weight": {"1": 0.32512474060058594, "4": 0.09686412662267685, "16": 0.02105637639760971, "64": 0.004613188561052084, "256": 0.002306785900145769, "1024": 0.0009569945395924151}, "model.layers.6.mlp.up_proj.weight": {"1": 0.3365936577320099, "4": 0.10081502795219421, "16": 0.021445022895932198, "64": 0.005318553652614355, "256": 0.0023611050564795732, "1024": 0.0010060789063572884}, "model.layers.6.mlp.down_proj.weight": {"1": 0.2915332019329071, "4": 0.08379005640745163, "16": 0.0171526987105608, "64": 0.0047251502983272076, "256": 0.0020621810108423233, "1024": 0.0009534288547001779}, "model.layers.6.input_layernorm.weight": {"1": 0.5145533084869385, "4": 0.07078666239976883, "16": 0.013800072483718395, "64": 0.03184616193175316, "256": 0.006337800528854132, "1024": 0.0024254072923213243}, "model.layers.6.post_attention_layernorm.weight": {"1": 0.2911042273044586, "4": 0.09078684449195862, "16": 0.02310354635119438, "64": 0.0050057009793818, "256": 0.0021126398351043463, "1024": 0.0014998487895354629}, "model.layers.7.self_attn.q_proj.weight": {"1": 0.2669698894023895, "4": 0.10000713169574738, "16": 0.021537890657782555, "64": 0.004737373441457748, "256": 0.002211178420111537, "1024": 0.0012178746983408928}, "model.layers.7.self_attn.k_proj.weight": {"1": 0.3890511393547058, "4": 0.11016247421503067, "16": 0.01963016949594021, "64": 0.005123365670442581, "256": 0.002177521586418152, "1024": 0.002005359623581171}, "model.layers.7.self_attn.v_proj.weight": {"1": 0.689462423324585, "4": 0.20688946545124054, "16": 0.0508396290242672, "64": 0.030794495716691017, "256": 0.02303350530564785, "1024": 0.020105060189962387}, "model.layers.7.self_attn.o_proj.weight": {"1": 0.25734591484069824, "4": 0.0750805139541626, "16": 0.014093868434429169, "64": 0.004416816867887974, "256": 0.0018576477887108922, "1024": 0.0010203017154708505}, "model.layers.7.mlp.gate_proj.weight": {"1": 0.35892796516418457, "4": 0.09542061388492584, "16": 0.01903372071683407, "64": 0.005848420783877373, "256": 0.002134802984073758, "1024": 0.001247424865141511}, "model.layers.7.mlp.up_proj.weight": {"1": 0.3390851318836212, "4": 0.08474594354629517, "16": 0.01847345381975174, "64": 0.005235810298472643, "256": 0.002212254563346505, "1024": 0.0010180076351389289}, "model.layers.7.mlp.down_proj.weight": {"1": 0.26874619722366333, "4": 0.0745837539434433, "16": 0.015349679626524448, "64": 0.005028305575251579, "256": 0.0021148205269128084, "1024": 0.0012134126154705882}, "model.layers.7.input_layernorm.weight": {"1": 0.24587246775627136, "4": 0.009899862110614777, "16": 0.009904704056680202, "64": 0.00044376906589604914, "256": 0.00015841939602978528, "1024": 0.0027352424804121256}, "model.layers.7.post_attention_layernorm.weight": {"1": 1.1578420400619507, "4": 0.08005845546722412, "16": 0.019538236781954765, "64": 0.01156172901391983, "256": 0.003079913556575775, "1024": 0.0007526223780587316}, "model.layers.8.self_attn.q_proj.weight": {"1": 0.36390048265457153, "4": 0.05387623608112335, "16": 0.014360738918185234, "64": 0.006426752544939518, "256": 0.0019081318750977516, "1024": 0.0007149308803491294}, "model.layers.8.self_attn.k_proj.weight": {"1": 0.34725281596183777, "4": 0.06634420156478882, "16": 0.016802752390503883, "64": 0.010023250244557858, "256": 0.002083435421809554, "1024": 0.0007809012313373387}, "model.layers.8.self_attn.v_proj.weight": {"1": 0.4752519726753235, "4": 0.14506174623966217, "16": 0.031100580468773842, "64": 0.012114458717405796, "256": 0.006798610556870699, "1024": 0.005303786136209965}, "model.layers.8.self_attn.o_proj.weight": {"1": 0.24843627214431763, "4": 0.0724201425909996, "16": 0.014746398665010929, "64": 0.005174534395337105, "256": 0.0023914994671940804, "1024": 0.001514163799583912}, "model.layers.8.mlp.gate_proj.weight": {"1": 0.21784614026546478, "4": 0.07149703055620193, "16": 0.016857802867889404, "64": 0.004835856147110462, "256": 0.0022149330470710993, "1024": 0.0013380419695749879}, "model.layers.8.mlp.up_proj.weight": {"1": 0.2341604083776474, "4": 0.07603511214256287, "16": 0.016063209623098373, "64": 0.0052156816236674786, "256": 0.00221311510540545, "1024": 0.0012597490567713976}, "model.layers.8.mlp.down_proj.weight": {"1": 0.20576857030391693, "4": 0.06772869825363159, "16": 0.013839486986398697, "64": 0.004736751783639193, "256": 0.002145542996004224, "1024": 0.001335174310952425}, "model.layers.8.input_layernorm.weight": {"1": 0.351271390914917, "4": 0.08426307886838913, "16": 0.0845814123749733, "64": 0.028109606355428696, "256": 0.0028092488646507263, "1024": 0.004007585346698761}, "model.layers.8.post_attention_layernorm.weight": {"1": 0.09147413074970245, "4": 0.034371644258499146, "16": 0.006162005476653576, "64": 0.0018364039715379477, "256": 0.0005036669899709523, "1024": 0.000387501873774454}, "model.layers.9.self_attn.q_proj.weight": {"1": 0.169815331697464, "4": 0.0610874705016613, "16": 0.02864677645266056, "64": 0.0038348566740751266, "256": 0.0017402989324182272, "1024": 0.000928544148337096}, "model.layers.9.self_attn.k_proj.weight": {"1": 0.31627461314201355, "4": 0.08207366615533829, "16": 0.02066132426261902, "64": 0.0035862065851688385, "256": 0.0025910481344908476, "1024": 0.0006185660604387522}, "model.layers.9.self_attn.v_proj.weight": {"1": 0.3233685791492462, "4": 0.1142345741391182, "16": 0.035575639456510544, "64": 0.024777280166745186, "256": 0.02296139858663082, "1024": 0.021387992426753044}, "model.layers.9.self_attn.o_proj.weight": {"1": 0.18798132240772247, "4": 0.06490933895111084, "16": 0.013764677569270134, "64": 0.004307750146836042, "256": 0.002178607974201441, "1024": 0.0015870481729507446}, "model.layers.9.mlp.gate_proj.weight": {"1": 0.17998546361923218, "4": 0.05043783038854599, "16": 0.013250300660729408, "64": 0.003930550068616867, "256": 0.0019382216269150376, "1024": 0.0010669142939150333}, "model.layers.9.mlp.up_proj.weight": {"1": 0.1497872769832611, "4": 0.0564647912979126, "16": 0.011433972977101803, "64": 0.003912045620381832, "256": 0.0016092251753434539, "1024": 0.0012213070876896381}, "model.layers.9.mlp.down_proj.weight": {"1": 0.15218700468540192, "4": 0.04605809226632118, "16": 0.010233908891677856, "64": 0.0032098498195409775, "256": 0.0013383087934926152, "1024": 0.0008434977498836815}, "model.layers.9.input_layernorm.weight": {"1": 0.1397417038679123, "4": 0.1326877772808075, "16": 0.010792672634124756, "64": 0.0030551119707524776, "256": 0.0022452573757618666, "1024": 0.0007804862689226866}, "model.layers.9.post_attention_layernorm.weight": {"1": 0.22704213857650757, "4": 0.05805134028196335, "16": 0.009896067902445793, "64": 0.0027564861811697483, "256": 0.001050483901053667, "1024": 0.0006962967454455793}, "model.layers.10.self_attn.q_proj.weight": {"1": 0.07781293988227844, "4": 0.02764432691037655, "16": 0.011594129726290703, "64": 0.0049619730561971664, "256": 0.0025571249425411224, "1024": 0.0022588735446333885}, "model.layers.10.self_attn.k_proj.weight": {"1": 0.4429526627063751, "4": 0.045609019696712494, "16": 0.028986122459173203, "64": 0.008260517381131649, "256": 0.004056296776980162, "1024": 0.0019697437528520823}, "model.layers.10.self_attn.v_proj.weight": {"1": 0.5090054273605347, "4": 0.1363607496023178, "16": 0.04597969725728035, "64": 0.026277819648385048, "256": 0.02106972597539425, "1024": 0.01963846944272518}, "model.layers.10.self_attn.o_proj.weight": {"1": 0.17702049016952515, "4": 0.046355508267879486, "16": 0.011732966639101505, "64": 0.004166295286267996, "256": 0.0021149562671780586, "1024": 0.0014820394571870565}, "model.layers.10.mlp.gate_proj.weight": {"1": 0.16264449059963226, "4": 0.03964485973119736, "16": 0.010304849594831467, "64": 0.0030569685623049736, "256": 0.0014818230411037803, "1024": 0.0008820913499221206}, "model.layers.10.mlp.up_proj.weight": {"1": 0.12855659425258636, "4": 0.037697210907936096, "16": 0.00955791212618351, "64": 0.004303991328924894, "256": 0.0024543001782149076, "1024": 0.0018426739843562245}, "model.layers.10.mlp.down_proj.weight": {"1": 0.12729912996292114, "4": 0.03577224537730217, "16": 0.008576486259698868, "64": 0.0028226450085639954, "256": 0.0013423203490674496, "1024": 0.0009316232171840966}, "model.layers.10.input_layernorm.weight": {"1": 0.39997345209121704, "4": 0.056603871285915375, "16": 0.04923196882009506, "64": 0.003587964456528425, "256": 0.0007019854965619743, "1024": 0.0011686317157000303}, "model.layers.10.post_attention_layernorm.weight": {"1": 0.12297744303941727, "4": 0.039624929428100586, "16": 0.008783995173871517, "64": 0.0026164024602621794, "256": 0.0008886184077709913, "1024": 0.00036742963129654527}, "model.layers.11.self_attn.q_proj.weight": {"1": 0.09801756590604782, "4": 0.018465092405676842, "16": 0.008037138730287552, "64": 0.0018169870600104332, "256": 0.0019312207587063313, "1024": 0.0009597809403203428}, "model.layers.11.self_attn.k_proj.weight": {"1": 0.28864333033561707, "4": 0.05978851765394211, "16": 0.0170341394841671, "64": 0.005973420105874538, "256": 0.00587261188775301, "1024": 0.003613634267821908}, "model.layers.11.self_attn.v_proj.weight": {"1": 0.38385114073753357, "4": 0.10827361792325974, "16": 0.0347425676882267, "64": 0.016371119767427444, "256": 0.01333666406571865, "1024": 0.012138969264924526}, "model.layers.11.self_attn.o_proj.weight": {"1": 0.12944339215755463, "4": 0.037799373269081116, "16": 0.00973021611571312, "64": 0.003810328198596835, "256": 0.002347614848986268, "1024": 0.0019199176458641887}, "model.layers.11.mlp.gate_proj.weight": {"1": 0.12841331958770752, "4": 0.030752671882510185, "16": 0.007543806452304125, "64": 0.002764214063063264, "256": 0.0012695849873125553, "1024": 0.0008887212607078254}, "model.layers.11.mlp.up_proj.weight": {"1": 0.1362648755311966, "4": 0.03281956911087036, "16": 0.008751250803470612, "64": 0.0033357541542500257, "256": 0.0016938460757955909, "1024": 0.0013100060168653727}, "model.layers.11.mlp.down_proj.weight": {"1": 0.10666992515325546, "4": 0.028056593611836433, "16": 0.007270817179232836, "64": 0.0030812593176960945, "256": 0.0017390206921845675, "1024": 0.001420038752257824}, "model.layers.11.input_layernorm.weight": {"1": 0.014012853614985943, "4": 0.02363351359963417, "16": 0.00667664036154747, "64": 0.00011868069123011082, "256": 0.00020996356033720076, "1024": 0.00023345966474153101}, "model.layers.11.post_attention_layernorm.weight": {"1": 0.11933741718530655, "4": 0.0295510645955801, "16": 0.007048982661217451, "64": 0.002174264984205365, "256": 0.0006105404463596642, "1024": 0.0002288793184561655}, "model.layers.12.self_attn.q_proj.weight": {"1": 0.3772880733013153, "4": 0.03387308120727539, "16": 0.016588671132922173, "64": 0.00291286944411695, "256": 0.0032178175169974566, "1024": 0.0020182249136269093}, "model.layers.12.self_attn.k_proj.weight": {"1": 0.2836039364337921, "4": 0.03811990097165108, "16": 0.024904241785407066, "64": 0.004628714639693499, "256": 0.00587422912940383, "1024": 0.002995566464960575}, "model.layers.12.self_attn.v_proj.weight": {"1": 0.40277329087257385, "4": 0.13015033304691315, "16": 0.04914284124970436, "64": 0.031079141423106194, "256": 0.028515005484223366, "1024": 0.027313662692904472}, "model.layers.12.self_attn.o_proj.weight": {"1": 0.11927080154418945, "4": 0.03194175288081169, "16": 0.009633878245949745, "64": 0.00465694535523653, "256": 0.0030755342449992895, "1024": 0.0027720469515770674}, "model.layers.12.mlp.gate_proj.weight": {"1": 0.10520981252193451, "4": 0.027036534622311592, "16": 0.006799196358770132, "64": 0.0021695990581065416, "256": 0.0009688434074632823, "1024": 0.0006594223668798804}, "model.layers.12.mlp.up_proj.weight": {"1": 0.09997738897800446, "4": 0.025987587869167328, "16": 0.006755470298230648, "64": 0.0021962847094982862, "256": 0.0011405239347368479, "1024": 0.0007886377861723304}, "model.layers.12.mlp.down_proj.weight": {"1": 0.08812558650970459, "4": 0.020966628566384315, "16": 0.006147011648863554, "64": 0.002251011785119772, "256": 0.0011377697810530663, "1024": 0.0009698939975351095}, "model.layers.12.input_layernorm.weight": {"1": 0.029852619394659996, "4": 0.01592455804347992, "16": 0.004469357896596193, "64": 0.0003654824977274984, "256": 0.0005025459686294198, "1024": 0.00028262854903005064}, "model.layers.12.post_attention_layernorm.weight": {"1": 0.11173076182603836, "4": 0.031562644988298416, "16": 0.007886786945164204, "64": 0.0016423448687419295, "256": 0.0005199193838052452, "1024": 0.00020100963592994958}, "model.layers.13.self_attn.q_proj.weight": {"1": 0.08735853433609009, "4": 0.013145750388503075, "16": 0.004849009681493044, "64": 0.0024022716097533703, "256": 0.001950549311004579, "1024": 0.0014775266172364354}, "model.layers.13.self_attn.k_proj.weight": {"1": 0.045802634209394455, "4": 0.021736102178692818, "16": 0.00462030665948987, "64": 0.0014001744566485286, "256": 0.0007619211683049798, "1024": 0.0005616599810309708}, "model.layers.13.self_attn.v_proj.weight": {"1": 0.3546817898750305, "4": 0.10852169990539551, "16": 0.03562162443995476, "64": 0.019577160477638245, "256": 0.016796747222542763, "1024": 0.016061238944530487}, "model.layers.13.self_attn.o_proj.weight": {"1": 0.13141052424907684, "4": 0.040642350912094116, "16": 0.01186878327280283, "64": 0.006172659806907177, "256": 0.004682993981987238, "1024": 0.004415563773363829}, "model.layers.13.mlp.gate_proj.weight": {"1": 0.06906864047050476, "4": 0.017350291833281517, "16": 0.004589544143527746, "64": 0.0014058336382731795, "256": 0.0006347981980070472, "1024": 0.00044654886005446315}, "model.layers.13.mlp.up_proj.weight": {"1": 0.07626180350780487, "4": 0.01843245141208172, "16": 0.004541361704468727, "64": 0.0016839754534885287, "256": 0.0008124505984596908, "1024": 0.000566528644412756}, "model.layers.13.mlp.down_proj.weight": {"1": 0.06424066424369812, "4": 0.015829594805836678, "16": 0.004301103763282299, "64": 0.0016163672553375363, "256": 0.0010083109373226762, "1024": 0.0008314388687722385}, "model.layers.13.input_layernorm.weight": {"1": 0.3376174569129944, "4": 0.09076862037181854, "16": 0.007500649429857731, "64": 0.0027068087365478277, "256": 0.002266694325953722, "1024": 0.0030233096331357956}, "model.layers.13.post_attention_layernorm.weight": {"1": 0.08141934126615524, "4": 0.021248897537589073, "16": 0.004630480892956257, "64": 0.0014464912237599492, "256": 0.00046766831655986607, "1024": 0.00019997036724817008}, "model.layers.14.self_attn.q_proj.weight": {"1": 0.13635554909706116, "4": 0.012130334973335266, "16": 0.0031302114948630333, "64": 0.001714922720566392, "256": 0.0007482729270122945, "1024": 0.0006206167163327336}, "model.layers.14.self_attn.k_proj.weight": {"1": 0.06122985854744911, "4": 0.011011054739356041, "16": 0.0029401592910289764, "64": 0.0013228522147983313, "256": 0.0008206309285014868, "1024": 0.0007697806577198207}, "model.layers.14.self_attn.v_proj.weight": {"1": 0.3324207067489624, "4": 0.09347452968358994, "16": 0.03402532637119293, "64": 0.017225399613380432, "256": 0.013261011801660061, "1024": 0.012520316056907177}, "model.layers.14.self_attn.o_proj.weight": {"1": 0.07021316140890121, "4": 0.017946181818842888, "16": 0.005270489491522312, "64": 0.002329214010387659, "256": 0.001543557271361351, "1024": 0.0013481895439326763}, "model.layers.14.mlp.gate_proj.weight": {"1": 0.04856593534350395, "4": 0.012495206668972969, "16": 0.003182477317750454, "64": 0.0010743390303105116, "256": 0.0005147174233570695, "1024": 0.000380088051315397}, "model.layers.14.mlp.up_proj.weight": {"1": 0.03787713497877121, "4": 0.009633694775402546, "16": 0.0025656702928245068, "64": 0.0007957855123095214, "256": 0.00039315945468842983, "1024": 0.0002821754023898393}, "model.layers.14.mlp.down_proj.weight": {"1": 0.08221694082021713, "4": 0.016661548987030983, "16": 0.006678994745016098, "64": 0.0034056250005960464, "256": 0.0028566664550453424, "1024": 0.002701902063563466}, "model.layers.14.input_layernorm.weight": {"1": 0.06683078408241272, "4": 0.007546831853687763, "16": 0.0021388952154666185, "64": 0.0013402336044237018, "256": 4.259479828760959e-05, "1024": 6.894388207001612e-05}, "model.layers.14.post_attention_layernorm.weight": {"1": 0.05788648873567581, "4": 0.013887944631278515, "16": 0.003752392716705799, "64": 0.0009347624145448208, "256": 0.00029758678283542395, "1024": 9.088488150155172e-05}, "model.layers.15.self_attn.q_proj.weight": {"1": 0.04589356482028961, "4": 0.009230249561369419, "16": 0.0024900336284190416, "64": 0.0006495830602943897, "256": 0.00023234756372403353, "1024": 7.699673005845398e-05}, "model.layers.15.self_attn.k_proj.weight": {"1": 0.09950850903987885, "4": 0.016301246359944344, "16": 0.0031503462232649326, "64": 0.001852723304182291, "256": 0.0009152679704129696, "1024": 0.0005707992822863162}, "model.layers.15.self_attn.v_proj.weight": {"1": 0.1941818743944168, "4": 0.05691016465425491, "16": 0.02281159721314907, "64": 0.016151702031493187, "256": 0.0132099948823452, "1024": 0.01278696022927761}, "model.layers.15.self_attn.o_proj.weight": {"1": 0.03535659238696098, "4": 0.009722228161990643, "16": 0.002389343921095133, "64": 0.0005460879765450954, "256": 0.00018837061361409724, "1024": 4.955753684043884e-05}, "model.layers.15.mlp.gate_proj.weight": {"1": 0.027235472574830055, "4": 0.0062119378708302975, "16": 0.0015381491975858808, "64": 0.00040256595821119845, "256": 0.00011824911052826792, "1024": 3.357783134561032e-05}, "model.layers.15.mlp.up_proj.weight": {"1": 0.02972959354519844, "4": 0.006424559745937586, "16": 0.0016365241026505828, "64": 0.00041595890070311725, "256": 0.00011575440294109285, "1024": 3.367444878676906e-05}, "model.layers.15.mlp.down_proj.weight": {"1": 0.01183491013944149, "4": 0.003264056984335184, "16": 0.0012040154542773962, "64": 0.0005461627733893692, "256": 0.0004469964769668877, "1024": 0.0004128431901335716}, "model.layers.15.input_layernorm.weight": {"1": 0.08715055137872696, "4": 0.020411139354109764, "16": 0.00417232234030962, "64": 0.0012878638226538897, "256": 0.0004990540910512209, "1024": 0.00016162804968189448}, "model.layers.15.post_attention_layernorm.weight": {"1": 0.041520487517118454, "4": 0.010188809596002102, "16": 0.002335408702492714, "64": 0.0006547215161845088, "256": 0.00018544822523836046, "1024": 5.1622570026665926e-05}, "model.norm.weight": {"1": 0.0, "4": 0.0, "16": 1.3479660299748307e-14, "64": 2.2084845887823668e-13, "256": 3.477050895470124e-12, "1024": 5.953768728028663e-11}}