{"model.embed_tokens.weight": {"1": 0.8541749715805054, "4": 0.16346989572048187, "16": 0.03717068210244179, "64": 0.011007220484316349, "256": 0.0027789107989519835, "1024": 0.0006875938270241022}, "model.layers.0.self_attn.q_proj.weight": {"1": 3.948641777038574, "4": 0.6094955801963806, "16": 0.13202990591526031, "64": 0.03367966413497925, "256": 0.012590531259775162, "1024": 0.0018821839476004243}, "model.layers.0.self_attn.k_proj.weight": {"1": 4.929811477661133, "4": 0.9377101063728333, "16": 0.3612509071826935, "64": 0.07702039182186127, "256": 0.015205702744424343, "1024": 0.004274934995919466}, "model.layers.0.self_attn.v_proj.weight": {"1": 4.366466522216797, "4": 0.7552000284194946, "16": 0.16058066487312317, "64": 0.06102981045842171, "256": 0.01370383519679308, "1024": 0.0027515992987900972}, "model.layers.0.self_attn.o_proj.weight": {"1": 2.496277093887329, "4": 0.44690805673599243, "16": 0.10302069038152695, "64": 0.029501650482416153, "256": 0.008136714808642864, "1024": 0.001798340235836804}, "model.layers.0.mlp.gate_proj.weight": {"1": 1.9929548501968384, "4": 0.33427250385284424, "16": 0.08407502621412277, "64": 0.023872381076216698, "256": 0.006233739200979471, "1024": 0.001477614277973771}, "model.layers.0.mlp.up_proj.weight": {"1": 2.6493706703186035, "4": 0.4557426869869232, "16": 0.11095564812421799, "64": 0.03112383931875229, "256": 0.008059301413595676, "1024": 0.0019868346862494946}, "model.layers.0.mlp.down_proj.weight": {"1": 2.682631492614746, "4": 0.44508156180381775, "16": 0.10433144122362137, "64": 0.029663454741239548, "256": 0.008037807419896126, "1024": 0.0019519675988703966}, "model.layers.0.input_layernorm.weight": {"1": 1.9860433340072632, "4": 0.42392829060554504, "16": 0.03622167930006981, "64": 0.012599704787135124, "256": 0.0038174691144376993, "1024": 0.0012270153965801}, "model.layers.0.post_attention_layernorm.weight": {"1": 1.9669381380081177, "4": 0.39071357250213623, "16": 0.08581631630659103, "64": 0.02497672103345394, "256": 0.006590405944734812, "1024": 0.0014418448554351926}, "model.layers.1.self_attn.q_proj.weight": {"1": 3.5605499744415283, "4": 0.6330692172050476, "16": 0.16683708131313324, "64": 0.06693015247583389, "256": 0.009443913586437702, "1024": 0.003172147087752819}, "model.layers.1.self_attn.k_proj.weight": {"1": 3.829929828643799, "4": 0.734792172908783, "16": 0.19097797572612762, "64": 0.06230471655726433, "256": 0.014033868908882141, "1024": 0.0026459801010787487}, "model.layers.1.self_attn.v_proj.weight": {"1": 4.932857036590576, "4": 0.7781570553779602, "16": 0.18938963115215302, "64": 0.05033911392092705, "256": 0.01286590751260519, "1024": 0.0033917382825165987}, "model.layers.1.self_attn.o_proj.weight": {"1": 2.358189582824707, "4": 0.4042700231075287, "16": 0.10402626544237137, "64": 0.02931063063442707, "256": 0.007253697142004967, "1024": 0.0018225585808977485}, "model.layers.1.mlp.gate_proj.weight": {"1": 2.453127384185791, "4": 0.4295739233493805, "16": 0.1028166115283966, "64": 0.03110433928668499, "256": 0.00825112871825695, "1024": 0.0019688147585839033}, "model.layers.1.mlp.up_proj.weight": {"1": 2.6068241596221924, "4": 0.4524388611316681, "16": 0.1124194785952568, "64": 0.033733926713466644, "256": 0.008572862483561039, "1024": 0.002065258799120784}, "model.layers.1.mlp.down_proj.weight": {"1": 0.9460200667381287, "4": 0.19182205200195312, "16": 0.045289285480976105, "64": 0.013085061684250832, "256": 0.003526914631947875, "1024": 0.0008076321100816131}, "model.layers.1.input_layernorm.weight": {"1": 2.9967992305755615, "4": 0.16697455942630768, "16": 0.3488468825817108, "64": 0.04685387760400772, "256": 0.002210760023444891, "1024": 0.0007907583494670689}, "model.layers.1.post_attention_layernorm.weight": {"1": 5.145291805267334, "4": 1.0083231925964355, "16": 0.09887021034955978, "64": 0.02960716187953949, "256": 0.016878141090273857, "1024": 0.002127374056726694}, "model.layers.2.self_attn.q_proj.weight": {"1": 1.4007046222686768, "4": 0.3174009919166565, "16": 0.0522211454808712, "64": 0.023360827937722206, "256": 0.003642704337835312, "1024": 0.0009089973755180836}, "model.layers.2.self_attn.k_proj.weight": {"1": 1.8263561725616455, "4": 0.44112685322761536, "16": 0.05211809650063515, "64": 0.026231952011585236, "256": 0.004930559545755386, "1024": 0.0014990981435403228}, "model.layers.2.self_attn.v_proj.weight": {"1": 6.635183334350586, "4": 1.299855351448059, "16": 0.2817990779876709, "64": 0.07565879821777344, "256": 0.018655745312571526, "1024": 0.004538857843726873}, "model.layers.2.self_attn.o_proj.weight": {"1": 2.3168692588806152, "4": 0.3996874988079071, "16": 0.0984790176153183, "64": 0.027279868721961975, "256": 0.00790097750723362, "1024": 0.0015872722724452615}, "model.layers.2.mlp.gate_proj.weight": {"1": 2.1635243892669678, "4": 0.4374319612979889, "16": 0.0876903235912323, "64": 0.027553508058190346, "256": 0.007755144964903593, "1024": 0.0015527313807979226}, "model.layers.2.mlp.up_proj.weight": {"1": 2.418009042739868, "4": 0.48839277029037476, "16": 0.11692380160093307, "64": 0.03608955070376396, "256": 0.009329923428595066, "1024": 0.002087945118546486}, "model.layers.2.mlp.down_proj.weight": {"1": 1.7474807500839233, "4": 0.3311675786972046, "16": 0.07871958613395691, "64": 0.02204819582402706, "256": 0.006322507746517658, "1024": 0.0012484622420743108}, "model.layers.2.input_layernorm.weight": {"1": 0.4497048258781433, "4": 5.419711589813232, "16": 0.029408464208245277, "64": 0.13418728113174438, "256": 0.004467477090656757, "1024": 0.010519368574023247}, "model.layers.2.post_attention_layernorm.weight": {"1": 2.392692804336548, "4": 0.4711170196533203, "16": 0.10575498640537262, "64": 0.02890293300151825, "256": 0.0076261721551418304, "1024": 0.0018182153580710292}, "model.layers.3.self_attn.q_proj.weight": {"1": 2.710239887237549, "4": 0.543728232383728, "16": 0.10704038292169571, "64": 0.029698902741074562, "256": 0.006096444558352232, "1024": 0.0013042747741565108}, "model.layers.3.self_attn.k_proj.weight": {"1": 2.047186851501465, "4": 1.1640312671661377, "16": 0.1186576560139656, "64": 0.03158225864171982, "256": 0.004448384512215853, "1024": 0.0008251387043856084}, "model.layers.3.self_attn.v_proj.weight": {"1": 4.375589847564697, "4": 0.704134464263916, "16": 0.2077392339706421, "64": 0.05283394083380699, "256": 0.01427320297807455, "1024": 0.0031564650125801563}, "model.layers.3.self_attn.o_proj.weight": {"1": 1.7329468727111816, "4": 0.26659297943115234, "16": 0.07637795805931091, "64": 0.020810885354876518, "256": 0.006553724408149719, "1024": 0.001187508343718946}, "model.layers.3.mlp.gate_proj.weight": {"1": 2.2223057746887207, "4": 0.33431440591812134, "16": 0.09790634363889694, "64": 0.026748551055788994, "256": 0.008397940546274185, "1024": 0.0016186516731977463}, "model.layers.3.mlp.up_proj.weight": {"1": 1.9789435863494873, "4": 0.3084290325641632, "16": 0.08343573659658432, "64": 0.026759251952171326, "256": 0.007799153681844473, "1024": 0.0014723079511895776}, "model.layers.3.mlp.down_proj.weight": {"1": 1.5658620595932007, "4": 0.25993335247039795, "16": 0.0708567425608635, "64": 0.01917361281812191, "256": 0.006171231158077717, "1024": 0.0011422926327213645}, "model.layers.3.input_layernorm.weight": {"1": 1.6956617832183838, "4": 10.931844711303711, "16": 0.027619510889053345, "64": 0.16559471189975739, "256": 0.023747917264699936, "1024": 0.0006402895087376237}, "model.layers.3.post_attention_layernorm.weight": {"1": 2.353757619857788, "4": 0.3060374855995178, "16": 0.09193609654903412, "64": 0.02905944362282753, "256": 0.009061808697879314, "1024": 0.0016228357562795281}, "model.layers.4.self_attn.q_proj.weight": {"1": 2.023283004760742, "4": 0.2426149994134903, "16": 0.07969393581151962, "64": 0.018627801910042763, "256": 0.008542848750948906, "1024": 0.00116342690307647}, "model.layers.4.self_attn.k_proj.weight": {"1": 2.7683067321777344, "4": 0.4276241064071655, "16": 0.05766802281141281, "64": 0.014339249581098557, "256": 0.005688432138413191, "1024": 0.001102884067222476}, "model.layers.4.self_attn.v_proj.weight": {"1": 2.5637569427490234, "4": 0.5084059238433838, "16": 0.13712267577648163, "64": 0.03960571065545082, "256": 0.01178981363773346, "1024": 0.002352016046643257}, "model.layers.4.self_attn.o_proj.weight": {"1": 1.2645220756530762, "4": 0.22354558110237122, "16": 0.06407517194747925, "64": 0.01694595254957676, "256": 0.005660671275109053, "1024": 0.0010698999976739287}, "model.layers.4.mlp.gate_proj.weight": {"1": 1.3626679182052612, "4": 0.25767460465431213, "16": 0.07657414674758911, "64": 0.017861120402812958, "256": 0.007169779855757952, "1024": 0.0013306497130542994}, "model.layers.4.mlp.up_proj.weight": {"1": 1.612501859664917, "4": 0.28006836771965027, "16": 0.07874801009893417, "64": 0.020900199189782143, "256": 0.007097357884049416, "1024": 0.0013598762452602386}, "model.layers.4.mlp.down_proj.weight": {"1": 1.1735347509384155, "4": 0.22229847311973572, "16": 0.06120377033948898, "64": 0.015027436427772045, "256": 0.005518954247236252, "1024": 0.0009987328667193651}, "model.layers.4.input_layernorm.weight": {"1": 0.2981126606464386, "4": 0.1023920327425003, "16": 0.02184353955090046, "64": 0.0034451198298484087, "256": 0.005936280358582735, "1024": 0.0001713944657240063}, "model.layers.4.post_attention_layernorm.weight": {"1": 1.1786961555480957, "4": 0.2500987946987152, "16": 0.06870957463979721, "64": 0.0191680658608675, "256": 0.0061304401606321335, "1024": 0.0012577342567965388}, "model.layers.5.self_attn.q_proj.weight": {"1": 1.5928171873092651, "4": 0.21665871143341064, "16": 0.07849585264921188, "64": 0.014806159771978855, "256": 0.007473488803952932, "1024": 0.0011635262053459883}, "model.layers.5.self_attn.k_proj.weight": {"1": 0.6708881258964539, "4": 0.16076382994651794, "16": 0.06178678572177887, "64": 0.012659970670938492, "256": 0.008888413198292255, "1024": 0.0010606577852740884}, "model.layers.5.self_attn.v_proj.weight": {"1": 2.851614475250244, "4": 0.5506244897842407, "16": 0.14050565659999847, "64": 0.036631323397159576, "256": 0.012327245436608791, "1024": 0.002399126999080181}, "model.layers.5.self_attn.o_proj.weight": {"1": 1.0337759256362915, "4": 0.19896487891674042, "16": 0.053472355008125305, "64": 0.01271843258291483, "256": 0.004790295846760273, "1024": 0.0008837440982460976}, "model.layers.5.mlp.gate_proj.weight": {"1": 0.8946852087974548, "4": 0.212892547249794, "16": 0.05452564358711243, "64": 0.01336673554033041, "256": 0.004595024511218071, "1024": 0.0010022082133218646}, "model.layers.5.mlp.up_proj.weight": {"1": 1.3537111282348633, "4": 0.2624357342720032, "16": 0.06720340251922607, "64": 0.015681827440857887, "256": 0.006169603671878576, "1024": 0.0011390881845727563}, "model.layers.5.mlp.down_proj.weight": {"1": 0.9858900904655457, "4": 0.1939639300107956, "16": 0.05391833558678627, "64": 0.01274101808667183, "256": 0.004534803330898285, "1024": 0.0008795633330009878}, "model.layers.5.input_layernorm.weight": {"1": 1.728295922279358, "4": 0.017735162749886513, "16": 0.075713150203228, "64": 0.0196843221783638, "256": 0.013880632817745209, "1024": 0.0002667567750904709}, "model.layers.5.post_attention_layernorm.weight": {"1": 1.0807796716690063, "4": 0.21763722598552704, "16": 0.06006719917058945, "64": 0.015517769381403923, "256": 0.0053028203547000885, "1024": 0.0010292018996551633}, "model.layers.6.self_attn.q_proj.weight": {"1": 1.5581828355789185, "4": 0.2258354127407074, "16": 0.0699094608426094, "64": 0.02672267146408558, "256": 0.007959072478115559, "1024": 0.0020870829466730356}, "model.layers.6.self_attn.k_proj.weight": {"1": 2.975287437438965, "4": 0.21655014157295227, "16": 0.04834255203604698, "64": 0.014341948553919792, "256": 0.004896777682006359, "1024": 0.0010413986165076494}, "model.layers.6.self_attn.v_proj.weight": {"1": 2.2772505283355713, "4": 0.4009881317615509, "16": 0.11109641194343567, "64": 0.027462821453809738, "256": 0.009207088500261307, "1024": 0.0018710250733420253}, "model.layers.6.self_attn.o_proj.weight": {"1": 0.8515419363975525, "4": 0.1685890257358551, "16": 0.04571555554866791, "64": 0.010971917770802975, "256": 0.004365229047834873, "1024": 0.0007650287006981671}, "model.layers.6.mlp.gate_proj.weight": {"1": 1.0931886434555054, "4": 0.2176346778869629, "16": 0.058254264295101166, "64": 0.013247445225715637, "256": 0.005472829099744558, "1024": 0.0010608748998492956}, "model.layers.6.mlp.up_proj.weight": {"1": 1.1695055961608887, "4": 0.22877813875675201, "16": 0.06215905770659447, "64": 0.01568407006561756, "256": 0.005842156708240509, "1024": 0.0011175702093169093}, "model.layers.6.mlp.down_proj.weight": {"1": 0.9297530651092529, "4": 0.18868041038513184, "16": 0.05085102841258049, "64": 0.012358618900179863, "256": 0.004442888777703047, "1024": 0.000853454926982522}, "model.layers.6.input_layernorm.weight": {"1": 4.977909564971924, "4": 0.6232596635818481, "16": 0.07028809189796448, "64": 0.0431973971426487, "256": 0.005982184316962957, "1024": 0.003204214619472623}, "model.layers.6.post_attention_layernorm.weight": {"1": 1.1323038339614868, "4": 0.34259095788002014, "16": 0.10448625683784485, "64": 0.0160524919629097, "256": 0.00486218323931098, "1024": 0.0016317295376211405}, "model.layers.7.self_attn.q_proj.weight": {"1": 1.0753698348999023, "4": 0.3165013790130615, "16": 0.05585600063204765, "64": 0.0187237411737442, "256": 0.010473782196640968, "1024": 0.0011541134444996715}, "model.layers.7.self_attn.k_proj.weight": {"1": 1.3101561069488525, "4": 0.38293150067329407, "16": 0.08366808295249939, "64": 0.02632497437298298, "256": 0.00796375423669815, "1024": 0.0015025080647319555}, "model.layers.7.self_attn.v_proj.weight": {"1": 1.7410786151885986, "4": 0.34220796823501587, "16": 0.08499755710363388, "64": 0.02307834103703499, "256": 0.007497189100831747, "1024": 0.0014477582881227136}, "model.layers.7.self_attn.o_proj.weight": {"1": 0.7776662111282349, "4": 0.15412823855876923, "16": 0.04165269434452057, "64": 0.009998836554586887, "256": 0.0034508456010371447, "1024": 0.0007141597452573478}, "model.layers.7.mlp.gate_proj.weight": {"1": 1.1699978113174438, "4": 0.21571309864521027, "16": 0.05324503034353256, "64": 0.014052762649953365, "256": 0.006138848606497049, "1024": 0.000984133337624371}, "model.layers.7.mlp.up_proj.weight": {"1": 1.0462379455566406, "4": 0.218255415558815, "16": 0.05686560645699501, "64": 0.014178547076880932, "256": 0.004535503685474396, "1024": 0.0009132006671279669}, "model.layers.7.mlp.down_proj.weight": {"1": 0.8437680006027222, "4": 0.1789652705192566, "16": 0.043809615075588226, "64": 0.011266440153121948, "256": 0.0035979021340608597, "1024": 0.000739881070330739}, "model.layers.7.input_layernorm.weight": {"1": 0.29752761125564575, "4": 0.2010776698589325, "16": 0.027861542999744415, "64": 0.022586852312088013, "256": 0.0015944020124152303, "1024": 0.0018928820500150323}, "model.layers.7.post_attention_layernorm.weight": {"1": 1.688008189201355, "4": 0.30037975311279297, "16": 0.06118270009756088, "64": 0.031689323484897614, "256": 0.004736943170428276, "1024": 0.0007506537367589772}, "model.layers.8.self_attn.q_proj.weight": {"1": 0.8687385320663452, "4": 0.14781728386878967, "16": 0.03667822480201721, "64": 0.015973730012774467, "256": 0.006431110668927431, "1024": 0.0012509250082075596}, "model.layers.8.self_attn.k_proj.weight": {"1": 1.0427908897399902, "4": 0.3628866672515869, "16": 0.061526767909526825, "64": 0.019302671775221825, "256": 0.004227388650178909, "1024": 0.001736756064929068}, "model.layers.8.self_attn.v_proj.weight": {"1": 1.4654438495635986, "4": 0.3233509361743927, "16": 0.07133423537015915, "64": 0.0206199511885643, "256": 0.006028821226209402, "1024": 0.001395871746353805}, "model.layers.8.self_attn.o_proj.weight": {"1": 0.7655295729637146, "4": 0.15611548721790314, "16": 0.038704268634319305, "64": 0.010030531324446201, "256": 0.003307739505544305, "1024": 0.000683366262819618}, "model.layers.8.mlp.gate_proj.weight": {"1": 0.7386465072631836, "4": 0.1751878410577774, "16": 0.0565592423081398, "64": 0.011836360208690166, "256": 0.005050711799412966, "1024": 0.0008964954758994281}, "model.layers.8.mlp.up_proj.weight": {"1": 0.7593807578086853, "4": 0.18197806179523468, "16": 0.04882890731096268, "64": 0.011459187604486942, "256": 0.003930688835680485, "1024": 0.0008091846248134971}, "model.layers.8.mlp.down_proj.weight": {"1": 0.6394131779670715, "4": 0.1544441431760788, "16": 0.036975305527448654, "64": 0.009227699600160122, "256": 0.0031381009612232447, "1024": 0.0006458473508246243}, "model.layers.8.input_layernorm.weight": {"1": 6.610959529876709, "4": 0.2385261505842209, "16": 0.0511539950966835, "64": 0.05590914934873581, "256": 0.010652804747223854, "1024": 0.005755394231528044}, "model.layers.8.post_attention_layernorm.weight": {"1": 0.33214521408081055, "4": 0.2010870724916458, "16": 0.01731790415942669, "64": 0.0037946526426821947, "256": 0.0013781144516542554, "1024": 0.000334033218678087}, "model.layers.9.self_attn.q_proj.weight": {"1": 0.33588242530822754, "4": 0.13610737025737762, "16": 0.03142828121781349, "64": 0.006565204821527004, "256": 0.0031789455097168684, "1024": 0.001314727240242064}, "model.layers.9.self_attn.k_proj.weight": {"1": 0.38277024030685425, "4": 0.13349555432796478, "16": 0.04148559644818306, "64": 0.01003562193363905, "256": 0.003654367057606578, "1024": 0.0014196295524016023}, "model.layers.9.self_attn.v_proj.weight": {"1": 0.9321321249008179, "4": 0.22191347181797028, "16": 0.054252590984106064, "64": 0.013724854215979576, "256": 0.004507849924266338, "1024": 0.0009420391288585961}, "model.layers.9.self_attn.o_proj.weight": {"1": 0.6612375974655151, "4": 0.1463351845741272, "16": 0.03638540208339691, "64": 0.00875059887766838, "256": 0.0029845957178622484, "1024": 0.000583753630053252}, "model.layers.9.mlp.gate_proj.weight": {"1": 0.6178025603294373, "4": 0.16281965374946594, "16": 0.03212367370724678, "64": 0.007986398413777351, "256": 0.0028044763021171093, "1024": 0.0004751347005367279}, "model.layers.9.mlp.up_proj.weight": {"1": 0.5231583118438721, "4": 0.12255124747753143, "16": 0.035003289580345154, "64": 0.007334091234952211, "256": 0.0028857854194939137, "1024": 0.0005212771357037127}, "model.layers.9.mlp.down_proj.weight": {"1": 0.4349507987499237, "4": 0.11714030802249908, "16": 0.02863152325153351, "64": 0.007284125313162804, "256": 0.0019367359345778823, "1024": 0.0004847522941417992}, "model.layers.9.input_layernorm.weight": {"1": 1.1896878480911255, "4": 0.11640933901071548, "16": 0.050491880625486374, "64": 0.00602897722274065, "256": 0.003759301034733653, "1024": 0.0007169171585701406}, "model.layers.9.post_attention_layernorm.weight": {"1": 0.459267795085907, "4": 0.10130277276039124, "16": 0.036992453038692474, "64": 0.006658107507973909, "256": 0.002838023705407977, "1024": 0.00040918172453530133}, "model.layers.10.self_attn.q_proj.weight": {"1": 0.37275242805480957, "4": 0.1401948630809784, "16": 0.0315982848405838, "64": 0.002300274558365345, "256": 0.0023588514886796474, "1024": 0.00028268288588151336}, "model.layers.10.self_attn.k_proj.weight": {"1": 1.583148717880249, "4": 0.1324789822101593, "16": 0.13841167092323303, "64": 0.009839150123298168, "256": 0.0074300700798630714, "1024": 0.0008239013259299099}, "model.layers.10.self_attn.v_proj.weight": {"1": 1.8126035928726196, "4": 0.3969913423061371, "16": 0.09666804224252701, "64": 0.02500953897833824, "256": 0.006053789518773556, "1024": 0.0015945506747812033}, "model.layers.10.self_attn.o_proj.weight": {"1": 0.5538536906242371, "4": 0.13120917975902557, "16": 0.0340874120593071, "64": 0.008712024427950382, "256": 0.002200994174927473, "1024": 0.0005615031695924699}, "model.layers.10.mlp.gate_proj.weight": {"1": 0.43294253945350647, "4": 0.11468386650085449, "16": 0.029028207063674927, "64": 0.007452452555298805, "256": 0.0018516931449994445, "1024": 0.00045530288480222225}, "model.layers.10.mlp.up_proj.weight": {"1": 0.41288188099861145, "4": 0.0941234827041626, "16": 0.024889076128602028, "64": 0.006546325981616974, "256": 0.001572177978232503, "1024": 0.00044401094783097506}, "model.layers.10.mlp.down_proj.weight": {"1": 0.3774823248386383, "4": 0.08882054686546326, "16": 0.022017424926161766, "64": 0.005845348350703716, "256": 0.0013747538905590773, "1024": 0.00036872419877909124}, "model.layers.10.input_layernorm.weight": {"1": 1.5294817686080933, "4": 0.13236327469348907, "16": 0.0753508135676384, "64": 0.006830789614468813, "256": 0.004137754440307617, "1024": 0.0012226133840158582}, "model.layers.10.post_attention_layernorm.weight": {"1": 0.4389062821865082, "4": 0.09961410611867905, "16": 0.025998419150710106, "64": 0.00627156114205718, "256": 0.0018111870158463717, "1024": 0.00040350123890675604}, "model.layers.11.self_attn.q_proj.weight": {"1": 0.1601051539182663, "4": 0.04867178201675415, "16": 0.01754160411655903, "64": 0.00403435667976737, "256": 0.0011466610012575984, "1024": 0.0003988063253927976}, "model.layers.11.self_attn.k_proj.weight": {"1": 0.24636025726795197, "4": 0.05050117149949074, "16": 0.02844296395778656, "64": 0.006221492774784565, "256": 0.0019074478186666965, "1024": 0.0009118531597778201}, "model.layers.11.self_attn.v_proj.weight": {"1": 1.3088384866714478, "4": 0.28863468766212463, "16": 0.08003481477499008, "64": 0.01949077844619751, "256": 0.004873070865869522, "1024": 0.001256645773537457}, "model.layers.11.self_attn.o_proj.weight": {"1": 0.4220152795314789, "4": 0.09816019237041473, "16": 0.024004798382520676, "64": 0.006450263783335686, "256": 0.0015760697424411774, "1024": 0.00041461753426119685}, "model.layers.11.mlp.gate_proj.weight": {"1": 0.36482757329940796, "4": 0.08958953619003296, "16": 0.019767874851822853, "64": 0.005527804605662823, "256": 0.001257902360521257, "1024": 0.000372054724721238}, "model.layers.11.mlp.up_proj.weight": {"1": 0.37510302662849426, "4": 0.09291303157806396, "16": 0.02323407679796219, "64": 0.005997190251946449, "256": 0.0013572701718658209, "1024": 0.0003804511798080057}, "model.layers.11.mlp.down_proj.weight": {"1": 0.3276909291744232, "4": 0.07606881856918335, "16": 0.018418174237012863, "64": 0.004846871364861727, "256": 0.001055880798958242, "1024": 0.000315926707116887}, "model.layers.11.input_layernorm.weight": {"1": 0.029330793768167496, "4": 0.005255275405943394, "16": 0.03629874438047409, "64": 0.007230471353977919, "256": 0.0003210922877769917, "1024": 0.0004014449077658355}, "model.layers.11.post_attention_layernorm.weight": {"1": 0.3110881745815277, "4": 0.09330429881811142, "16": 0.021493643522262573, "64": 0.006154298782348633, "256": 0.0015593457501381636, "1024": 0.0003415570536162704}, "model.layers.12.self_attn.q_proj.weight": {"1": 0.6253459453582764, "4": 0.22225308418273926, "16": 0.04657192528247833, "64": 0.010257809422910213, "256": 0.0028203807305544615, "1024": 0.00129918463062495}, "model.layers.12.self_attn.k_proj.weight": {"1": 0.4248933792114258, "4": 0.211192786693573, "16": 0.03202096372842789, "64": 0.007318535819649696, "256": 0.0020114846993237734, "1024": 0.0016307249898090959}, "model.layers.12.self_attn.v_proj.weight": {"1": 1.2953709363937378, "4": 0.31640395522117615, "16": 0.08248002082109451, "64": 0.020238958299160004, "256": 0.004613342694938183, "1024": 0.0012114396085962653}, "model.layers.12.self_attn.o_proj.weight": {"1": 0.3930041491985321, "4": 0.08968939632177353, "16": 0.02311738207936287, "64": 0.0058298069052398205, "256": 0.0013144869590178132, "1024": 0.0003566614759620279}, "model.layers.12.mlp.gate_proj.weight": {"1": 0.30849525332450867, "4": 0.07109980285167694, "16": 0.018928345292806625, "64": 0.004683374427258968, "256": 0.0010999065125361085, "1024": 0.00029316250584088266}, "model.layers.12.mlp.up_proj.weight": {"1": 0.30287787318229675, "4": 0.07357579469680786, "16": 0.01750010997056961, "64": 0.0044840602204203606, "256": 0.0011338916374370456, "1024": 0.000285208981949836}, "model.layers.12.mlp.down_proj.weight": {"1": 0.2206725925207138, "4": 0.05438670143485069, "16": 0.014824330806732178, "64": 0.003953972831368446, "256": 0.0009378804825246334, "1024": 0.0002523735456634313}, "model.layers.12.input_layernorm.weight": {"1": 0.1150616705417633, "4": 0.040003810077905655, "16": 0.019060419872403145, "64": 0.014389872550964355, "256": 0.00039650191320106387, "1024": 0.00017950449546333402}, "model.layers.12.post_attention_layernorm.weight": {"1": 0.30974793434143066, "4": 0.08540187776088715, "16": 0.020196320489048958, "64": 0.005040406249463558, "256": 0.0011589800706133246, "1024": 0.0003011560474988073}, "model.layers.13.self_attn.q_proj.weight": {"1": 0.13505282998085022, "4": 0.04639281705021858, "16": 0.007084982935339212, "64": 0.002106746193021536, "256": 0.0010236237430945039, "1024": 0.00024658063193783164}, "model.layers.13.self_attn.k_proj.weight": {"1": 0.21288615465164185, "4": 0.03750205039978027, "16": 0.008166964165866375, "64": 0.0028937985189259052, "256": 0.0011525362497195601, "1024": 0.0002319543855264783}, "model.layers.13.self_attn.v_proj.weight": {"1": 1.2509115934371948, "4": 0.2559223473072052, "16": 0.06988879293203354, "64": 0.018279146403074265, "256": 0.004463576711714268, "1024": 0.0010973497992381454}, "model.layers.13.self_attn.o_proj.weight": {"1": 0.4644298255443573, "4": 0.12555865943431854, "16": 0.03062235563993454, "64": 0.008738432079553604, "256": 0.0020278615411370993, "1024": 0.000506542157381773}, "model.layers.13.mlp.gate_proj.weight": {"1": 0.1832522749900818, "4": 0.047896482050418854, "16": 0.012330570258200169, "64": 0.003100608941167593, "256": 0.0007446952513419092, "1024": 0.0001901724754134193}, "model.layers.13.mlp.up_proj.weight": {"1": 0.2106896936893463, "4": 0.053558703511953354, "16": 0.012952069751918316, "64": 0.0033757397904992104, "256": 0.0007751787197776139, "1024": 0.00019878358580172062}, "model.layers.13.mlp.down_proj.weight": {"1": 0.1705469787120819, "4": 0.04356831684708595, "16": 0.010181306861341, "64": 0.002610706025734544, "256": 0.0006590320845134556, "1024": 0.00016725210298318416}, "model.layers.13.input_layernorm.weight": {"1": 0.26692694425582886, "4": 0.08601660281419754, "16": 0.027240019291639328, "64": 0.010479399003088474, "256": 0.0009289030567742884, "1024": 0.0004544403054751456}, "model.layers.13.post_attention_layernorm.weight": {"1": 0.19622668623924255, "4": 0.05150051787495613, "16": 0.01475802157074213, "64": 0.0033411462791264057, "256": 0.0007224787841551006, "1024": 0.00019163163960911334}, "model.layers.14.self_attn.q_proj.weight": {"1": 0.2721725404262543, "4": 0.054398391395807266, "16": 0.01808430813252926, "64": 0.0027989749796688557, "256": 0.000930359645280987, "1024": 0.00015964901831466705}, "model.layers.14.self_attn.k_proj.weight": {"1": 0.2488918900489807, "4": 0.045210886746644974, "16": 0.010522560216486454, "64": 0.0028054213616997004, "256": 0.0009603661601431668, "1024": 0.00014560618728864938}, "model.layers.14.self_attn.v_proj.weight": {"1": 1.2062115669250488, "4": 0.25375130772590637, "16": 0.06610160320997238, "64": 0.016296830028295517, "256": 0.003936461638659239, "1024": 0.000993636203929782}, "model.layers.14.self_attn.o_proj.weight": {"1": 0.20831413567066193, "4": 0.050808828324079514, "16": 0.012625128030776978, "64": 0.0032459262292832136, "256": 0.0008096820092760026, "1024": 0.00020892801694571972}, "model.layers.14.mlp.gate_proj.weight": {"1": 0.14306212961673737, "4": 0.033657222986221313, "16": 0.00820230320096016, "64": 0.002288920572027564, "256": 0.0005321442731656134, "1024": 0.00014005442790221423}, "model.layers.14.mlp.up_proj.weight": {"1": 0.11098659038543701, "4": 0.02718285471200943, "16": 0.006735761184245348, "64": 0.001802195911295712, "256": 0.00043410752550698817, "1024": 0.0001085751864593476}, "model.layers.14.mlp.down_proj.weight": {"1": 0.16176047921180725, "4": 0.04163924604654312, "16": 0.009707184508442879, "64": 0.003006214275956154, "256": 0.0010052345460280776, "1024": 0.0001577434886712581}, "model.layers.14.input_layernorm.weight": {"1": 0.5648335218429565, "4": 0.01208566129207611, "16": 0.006238847505301237, "64": 0.0015272221062332392, "256": 0.0003397305845282972, "1024": 3.855537579511292e-05}, "model.layers.14.post_attention_layernorm.weight": {"1": 0.14450408518314362, "4": 0.03503616899251938, "16": 0.008773877285420895, "64": 0.002291790209710598, "256": 0.0005150219076313078, "1024": 0.0001530265435576439}, "model.layers.15.self_attn.q_proj.weight": {"1": 0.16440752148628235, "4": 0.04611027240753174, "16": 0.010463299229741096, "64": 0.002279818058013916, "256": 0.0004745404003188014, "1024": 0.00020008689898531884}, "model.layers.15.self_attn.k_proj.weight": {"1": 0.2792946398258209, "4": 0.06765291839838028, "16": 0.018933622166514397, "64": 0.0037120990455150604, "256": 0.0010177354561164975, "1024": 0.0003479385923128575}, "model.layers.15.self_attn.v_proj.weight": {"1": 0.5004602074623108, "4": 0.13205482065677643, "16": 0.03322475031018257, "64": 0.008129148744046688, "256": 0.0018504320178180933, "1024": 0.0005155835533514619}, "model.layers.15.self_attn.o_proj.weight": {"1": 0.1253061592578888, "4": 0.02706211246550083, "16": 0.007189381401985884, "64": 0.0019271251512691379, "256": 0.0005948095349594951, "1024": 0.00011031870963051915}, "model.layers.15.mlp.gate_proj.weight": {"1": 0.08288994431495667, "4": 0.018486086279153824, "16": 0.0049590845592319965, "64": 0.0012020011199638247, "256": 0.0003097920271102339, "1024": 7.924147939775139e-05}, "model.layers.15.mlp.up_proj.weight": {"1": 0.08019460737705231, "4": 0.020836910232901573, "16": 0.0049894568510353565, "64": 0.0012909200740978122, "256": 0.0003083405608776957, "1024": 8.344910020241514e-05}, "model.layers.15.mlp.down_proj.weight": {"1": 0.049840234220027924, "4": 0.011365081183612347, "16": 0.0029863007366657257, "64": 0.0007424425566568971, "256": 0.00018122918845620006, "1024": 4.936724144499749e-05}, "model.layers.15.input_layernorm.weight": {"1": 0.27181050181388855, "4": 0.07203174382448196, "16": 0.033910881727933884, "64": 0.0038465827237814665, "256": 0.0006781500997021794, "1024": 0.0002651667455211282}, "model.layers.15.post_attention_layernorm.weight": {"1": 0.09556698054075241, "4": 0.02577953413128853, "16": 0.006462933961302042, "64": 0.0016804053448140621, "256": 0.00043216600897721946, "1024": 9.790217882255092e-05}, "model.norm.weight": {"1": 0.0, "4": 0.0, "16": 1.3479660299748307e-14, "64": 2.2084845887823668e-13, "256": 3.477050895470124e-12, "1024": 5.953768728028663e-11}}