[{"learning_rate": 0.0011948335721160095, "beta1": 0.9360043452616368, "beta2": 0.9989497406214962, "epsilon": 5.875814422073298e-06, "use_nesterov": false, "adamw_weight_decay": 0.010141964334059882, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.747304046223346}, {"learning_rate": 0.4060109803507517, "beta1": 0.9972408031165986, "beta2": 0.9868027286692506, "epsilon": 107.85861559302559, "use_nesterov": true, "adamw_weight_decay": 0.015620239959742821, "l2_weight_decay": 0.0, "warmup_fraction": 2.289161370180122e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.3241485833861578}, {"learning_rate": 0.0002118527403995637, "beta1": 0.6229650835415205, "beta2": 0.9727800493920264, "epsilon": 1.5402357939162808e-07, "use_nesterov": false, "adamw_weight_decay": 0.05360756231092083, "l2_weight_decay": 0.0, "warmup_fraction": 1.139506043021826e-05, "min_learning_rate_mult": 0.0013864545078620433, "constant_fraction": 0.2099310299628817}, {"learning_rate": 0.007531482507067026, "beta1": 0.6919155876981923, "beta2": 0.984342979679972, "epsilon": 3.592713026359696e-08, "use_nesterov": false, "adamw_weight_decay": 0.0003059674479201108, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0009554387155165385, "constant_fraction": 0.4224892293642567}, {"learning_rate": 0.05569700266024712, "beta1": 0.9742164724896906, "beta2": 0.999980948972404, "epsilon": 4.2139276965284695, "use_nesterov": false, "adamw_weight_decay": 0.00022331133037191596, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5209910283942752}, {"learning_rate": 0.006954992428540949, "beta1": 0.9941177962325759, "beta2": 0.9930455329766189, "epsilon": 4.3517153884397565e-07, "use_nesterov": false, "adamw_weight_decay": 3.142332648519505e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.013619134087588858}, {"learning_rate": 0.020526066283142113, "beta1": 0.3573051949320971, "beta2": 0.8604303237563932, "epsilon": 8.87354819497349e-05, "use_nesterov": true, "adamw_weight_decay": 0.07217167553538734, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 1.566669185534864e-05, "constant_fraction": 0.8851679138723282}, {"learning_rate": 0.0005950867356750683, "beta1": 0.8912956998774763, "beta2": 0.9998316947284045, "epsilon": 1.4834761018841103e-07, "use_nesterov": true, "adamw_weight_decay": 0.04087020908564961, "l2_weight_decay": 0.0, "warmup_fraction": 0.008212683099401206, "min_learning_rate_mult": 0.0, "constant_fraction": 0.37760078274486286}, {"learning_rate": 0.005328687277638261, "beta1": 0.960474459618098, "beta2": 0.9992247804716405, "epsilon": 8.665059017026017e-08, "use_nesterov": true, "adamw_weight_decay": 0.005563237041504353, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.17233141309625333}, {"learning_rate": 0.0012415879131444274, "beta1": 0.9466569269853439, "beta2": 0.9406663837522827, "epsilon": 8.113630827139477e-08, "use_nesterov": false, "adamw_weight_decay": 7.25772958596056e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0010075665692423708, "constant_fraction": 0.47695142196433893}, {"learning_rate": 0.008119003241547558, "beta1": 0.17785142887647176, "beta2": 0.9603342914414136, "epsilon": 0.07971483354346376, "use_nesterov": false, "adamw_weight_decay": 0.014885428421372969, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2066434431423435}, {"learning_rate": 0.7392511884271304, "beta1": 0.9969058762714528, "beta2": 0.8063934885831979, "epsilon": 2899.800988175767, "use_nesterov": false, "adamw_weight_decay": 0.07851195003468928, "l2_weight_decay": 0.0, "warmup_fraction": 0.0007327743964713479, "min_learning_rate_mult": 0.003306718891018076, "constant_fraction": 0.5563410540592247}, {"learning_rate": 0.00016536562796354645, "beta1": 0.9528014372252882, "beta2": 0.045647676154896955, "epsilon": 2.832299169214906e-06, "use_nesterov": true, "adamw_weight_decay": 0.011413102255753298, "l2_weight_decay": 0.0, "warmup_fraction": 0.001899807993750271, "min_learning_rate_mult": 0.26986516357814333, "constant_fraction": 0.4567955168857194}, {"learning_rate": 0.18795824057466287, "beta1": 0.9859737737254709, "beta2": 0.5653089879816942, "epsilon": 3.335463336449822, "use_nesterov": true, "adamw_weight_decay": 0.0038678836056147293, "l2_weight_decay": 1.2650873175731194e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.10792195362976087, "constant_fraction": 0.2050653689291535}, {"learning_rate": 0.3809343383814296, "beta1": 0.8490655073162814, "beta2": 0.9543268957980681, "epsilon": 0.03872341122423678, "use_nesterov": false, "adamw_weight_decay": 0.0003584021290810616, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0002529076538459554, "constant_fraction": 0.8601924538022118}, {"learning_rate": 0.0037546336890331242, "beta1": 0.8775621517947911, "beta2": 0.9612813868549973, "epsilon": 0.0031627447527590507, "use_nesterov": true, "adamw_weight_decay": 0.0026267194106628327, "l2_weight_decay": 7.467763351870469e-05, "warmup_fraction": 0.0004874241782181279, "min_learning_rate_mult": 0.0, "constant_fraction": 0.18384220439903465}, {"learning_rate": 0.00469149153710182, "beta1": 0.9963949268336045, "beta2": 0.9882032933236298, "epsilon": 2.0556253122637692e-05, "use_nesterov": false, "adamw_weight_decay": 0.03551680912823944, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.508648860672349}, {"learning_rate": 0.269689123664345, "beta1": 0.9851939131264303, "beta2": 0.9953555080862891, "epsilon": 46.27149536079999, "use_nesterov": true, "adamw_weight_decay": 0.06945616633643757, "l2_weight_decay": 2.1254769708706067e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.00016822813217496997, "constant_fraction": 0.4891041599832312}, {"learning_rate": 0.2946112786906611, "beta1": 0.9967842403006696, "beta2": 0.9998066384310356, "epsilon": 7.49808525880034, "use_nesterov": false, "adamw_weight_decay": 0.00034633751331971464, "l2_weight_decay": 0.00037920679770884715, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2006529088821566}, {"learning_rate": 0.0009466940029950283, "beta1": 0.43976654692813555, "beta2": 0.09422257990189098, "epsilon": 2.1198936798793774e-07, "use_nesterov": false, "adamw_weight_decay": 0.006901888604529899, "l2_weight_decay": 0.0, "warmup_fraction": 0.007415260343818976, "min_learning_rate_mult": 0.0, "constant_fraction": 0.45198368113422815}, {"learning_rate": 0.006605918239653114, "beta1": 0.2841690021059714, "beta2": 0.9992672992089842, "epsilon": 0.001327132934851488, "use_nesterov": true, "adamw_weight_decay": 0.02392306691874896, "l2_weight_decay": 0.0, "warmup_fraction": 0.02222708793770892, "min_learning_rate_mult": 0.0007371259476300234, "constant_fraction": 0.41353779658723033}, {"learning_rate": 0.03328473522187636, "beta1": 0.695922284020845, "beta2": 0.9999749964250709, "epsilon": 5.510085280687549e-06, "use_nesterov": true, "adamw_weight_decay": 1.3616483749393619e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.36855650509871785}, {"learning_rate": 0.002037871737382014, "beta1": 0.4999480291116216, "beta2": 0.9975488402665105, "epsilon": 5.629735112669782e-08, "use_nesterov": true, "adamw_weight_decay": 0.027959453124392353, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5272573788077217}, {"learning_rate": 0.7254442240822598, "beta1": 0.9980035735550082, "beta2": 0.9978058982852454, "epsilon": 3.608029087158177, "use_nesterov": true, "adamw_weight_decay": 0.03910615041329988, "l2_weight_decay": 1.6564251345632237e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.49496914955618243}, {"learning_rate": 0.00030679958650620343, "beta1": 0.5786296007973373, "beta2": 0.9962473778386212, "epsilon": 9.881212078017348e-06, "use_nesterov": false, "adamw_weight_decay": 0.0552077997390162, "l2_weight_decay": 0.0, "warmup_fraction": 0.006910808955954399, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5178056624855656}, {"learning_rate": 0.004580500335844138, "beta1": 0.42294331145928554, "beta2": 0.9996340230663632, "epsilon": 4.174383801435289e-06, "use_nesterov": true, "adamw_weight_decay": 0.004445569065452187, "l2_weight_decay": 0.0, "warmup_fraction": 6.948092680429794e-05, "min_learning_rate_mult": 0.36568088280188504, "constant_fraction": 0.10712191682637984}, {"learning_rate": 0.9171472159241931, "beta1": 0.4506093382745956, "beta2": 0.9924355626169975, "epsilon": 0.49453367594585734, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0012527326770919818, "warmup_fraction": 0.009744274816923932, "min_learning_rate_mult": 0.0266978863112591, "constant_fraction": 0.8971019661114805}, {"learning_rate": 2.9447163484071296e-05, "beta1": 0.9691606337183314, "beta2": 0.9989585125548099, "epsilon": 7.781883464637546e-07, "use_nesterov": true, "adamw_weight_decay": 0.003416005191691127, "l2_weight_decay": 0.00033636491813117994, "warmup_fraction": 0.0, "min_learning_rate_mult": 8.271681891094787e-05, "constant_fraction": 0.8295182142229286}, {"learning_rate": 0.059056800908244333, "beta1": 0.9979373427592588, "beta2": 0.9938330632030862, "epsilon": 344.725102999615, "use_nesterov": true, "adamw_weight_decay": 0.03934631372010418, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.061508612557718}, {"learning_rate": 0.021407258908693726, "beta1": 0.9874085642878456, "beta2": 0.9933627509436138, "epsilon": 0.00012664317581489618, "use_nesterov": false, "adamw_weight_decay": 0.0005194491916429356, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.12799995165543976}, {"learning_rate": 0.0024973964878672135, "beta1": 0.9812673108414214, "beta2": 0.9998810424899762, "epsilon": 1.799183948024501e-07, "use_nesterov": false, "adamw_weight_decay": 0.01302528594887525, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.009161159921657114}, {"learning_rate": 0.016545614113341964, "beta1": 0.9571680062439369, "beta2": 0.9978921771337571, "epsilon": 30.681605649648162, "use_nesterov": true, "adamw_weight_decay": 0.08920493281728885, "l2_weight_decay": 0.0, "warmup_fraction": 0.003780054638242951, "min_learning_rate_mult": 0.0004917075603144025, "constant_fraction": 0.08176526869534129}, {"learning_rate": 0.0029774515901572988, "beta1": 0.6861201927356766, "beta2": 0.9423184997455455, "epsilon": 0.06613707662242599, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 6.488712335876705e-05, "warmup_fraction": 0.008201847662206328, "min_learning_rate_mult": 0.0, "constant_fraction": 0.04551418264183593}, {"learning_rate": 0.8536726182390881, "beta1": 0.9312868091170935, "beta2": 0.5020022870359607, "epsilon": 0.020513270916481918, "use_nesterov": false, "adamw_weight_decay": 0.02800995000639579, "l2_weight_decay": 0.00020683684367025042, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2291717497216984}, {"learning_rate": 0.006162446106677524, "beta1": 0.9882268232265763, "beta2": 0.9874384399955896, "epsilon": 1.6157047191512658e-06, "use_nesterov": false, "adamw_weight_decay": 0.015440036372840006, "l2_weight_decay": 0.0, "warmup_fraction": 0.01622460127175336, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6231303188982895}, {"learning_rate": 0.0021626690957712476, "beta1": 0.9891863693762482, "beta2": 0.9973390834080226, "epsilon": 0.0010970918128689843, "use_nesterov": false, "adamw_weight_decay": 0.03190585566487564, "l2_weight_decay": 0.0002843579744447266, "warmup_fraction": 0.051061189511100266, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7876152138927769}, {"learning_rate": 0.007379732846587812, "beta1": 0.21455985508360065, "beta2": 0.9975219913102092, "epsilon": 0.028621289093680693, "use_nesterov": false, "adamw_weight_decay": 0.08439062817632467, "l2_weight_decay": 0.0, "warmup_fraction": 6.140523306908913e-05, "min_learning_rate_mult": 0.08777758724702553, "constant_fraction": 0.722042536538768}, {"learning_rate": 0.005580811723727004, "beta1": 0.9755869885515044, "beta2": 0.9998959096429231, "epsilon": 3.237718692732164e-08, "use_nesterov": true, "adamw_weight_decay": 0.0004896292318753444, "l2_weight_decay": 0.0, "warmup_fraction": 0.00010635738171895488, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5379357239029984}, {"learning_rate": 0.006035982984156549, "beta1": 0.9784892288025606, "beta2": 0.9144914391160787, "epsilon": 1.8064519546983546, "use_nesterov": false, "adamw_weight_decay": 0.01762346737323144, "l2_weight_decay": 0.0031829313638007772, "warmup_fraction": 0.00037851167280734136, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6981369081494088}, {"learning_rate": 0.015116800984175812, "beta1": 0.8048793120594091, "beta2": 0.9787783787650743, "epsilon": 2.5375446598127148e-08, "use_nesterov": true, "adamw_weight_decay": 2.2689784053986208e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.00046193769055471356, "min_learning_rate_mult": 0.001991487467627285, "constant_fraction": 0.4311201404562798}, {"learning_rate": 0.0015669132173408192, "beta1": 0.9182034442374868, "beta2": 0.9999101146579716, "epsilon": 4.67522402327135e-05, "use_nesterov": false, "adamw_weight_decay": 4.1117603032602165e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2507866687610616}, {"learning_rate": 6.938971491668313e-05, "beta1": 0.986736469421531, "beta2": 0.42708983905783127, "epsilon": 2.386882839510034e-07, "use_nesterov": false, "adamw_weight_decay": 0.00020706333366600366, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.08499769524439205}, {"learning_rate": 0.000426457830656171, "beta1": 0.4723936509330219, "beta2": 0.999742578556759, "epsilon": 8.221014847347656e-05, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.247988823862065e-05, "warmup_fraction": 0.0014721226070019795, "min_learning_rate_mult": 0.2058664560226014, "constant_fraction": 0.9233353638532978}, {"learning_rate": 0.00885866161646567, "beta1": 0.9896677862448132, "beta2": 0.9971993988060598, "epsilon": 0.014930518787834817, "use_nesterov": true, "adamw_weight_decay": 0.022528644175180114, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.16565994357421981, "constant_fraction": 0.1038807855165701}, {"learning_rate": 0.0046370348328655985, "beta1": 0.6465762714651584, "beta2": 0.5410828979733621, "epsilon": 3.5281502704630626e-08, "use_nesterov": false, "adamw_weight_decay": 2.995571621863111e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 2.2553276928396914e-05, "constant_fraction": 0.4953694055142519}, {"learning_rate": 0.0006658730826373222, "beta1": 0.6596808943414707, "beta2": 0.9999721701515789, "epsilon": 6.848373628426456e-06, "use_nesterov": true, "adamw_weight_decay": 0.0031302081758472614, "l2_weight_decay": 0.0, "warmup_fraction": 5.286407684779102e-05, "min_learning_rate_mult": 2.7892563425365462e-05, "constant_fraction": 0.6315391402821301}, {"learning_rate": 0.0022453447365848238, "beta1": 0.9796730915771823, "beta2": 0.9751818491904727, "epsilon": 1.488203773019268e-07, "use_nesterov": true, "adamw_weight_decay": 0.02179581383497055, "l2_weight_decay": 1.8123820408053374e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7215232551124435}, {"learning_rate": 0.0007844535995441051, "beta1": 0.950648062887881, "beta2": 0.9968542288086903, "epsilon": 0.021410443548851302, "use_nesterov": false, "adamw_weight_decay": 4.0236947369174454e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.016042318363260175, "min_learning_rate_mult": 0.0, "constant_fraction": 0.12373354810025927}, {"learning_rate": 0.002359618127740519, "beta1": 0.985602470144129, "beta2": 0.9999742141510605, "epsilon": 1.0801721128727414e-08, "use_nesterov": true, "adamw_weight_decay": 0.003022991422521959, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.985885048089519}, {"learning_rate": 0.0033135826794434557, "beta1": 0.9044714853556935, "beta2": 0.9996962680336305, "epsilon": 6.618239577070916e-06, "use_nesterov": true, "adamw_weight_decay": 0.021840173870201037, "l2_weight_decay": 0.0, "warmup_fraction": 1.9197629324705276e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.14644338961392522}, {"learning_rate": 0.0003260395096202062, "beta1": 0.7842479490197322, "beta2": 0.9999786000247527, "epsilon": 0.0034679530917765397, "use_nesterov": false, "adamw_weight_decay": 0.047091643979610326, "l2_weight_decay": 0.0, "warmup_fraction": 5.958583345289541e-05, "min_learning_rate_mult": 0.00016123121352611385, "constant_fraction": 0.7375788574052385}, {"learning_rate": 0.004116668671587615, "beta1": 0.9956100552079372, "beta2": 0.753815437831847, "epsilon": 2.389647603484162e-06, "use_nesterov": true, "adamw_weight_decay": 0.03630888125552768, "l2_weight_decay": 0.0, "warmup_fraction": 0.0005689260494374579, "min_learning_rate_mult": 0.0, "constant_fraction": 0.20460776219384424}, {"learning_rate": 0.6260232131396862, "beta1": 0.9940054395007056, "beta2": 0.835210144102467, "epsilon": 2.43094599932903, "use_nesterov": true, "adamw_weight_decay": 0.01048093916592776, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.002522236628370752, "constant_fraction": 0.9317678655161064}, {"learning_rate": 0.015663337711307727, "beta1": 0.08941702049805866, "beta2": 0.9998558430018095, "epsilon": 1.2000029492320807e-08, "use_nesterov": false, "adamw_weight_decay": 0.00036377680537807397, "l2_weight_decay": 0.0, "warmup_fraction": 0.002187727087237649, "min_learning_rate_mult": 2.4175512973321787e-05, "constant_fraction": 0.32313012629732907}, {"learning_rate": 0.004729645552650788, "beta1": 0.9987883509872364, "beta2": 0.85851150371598, "epsilon": 159.62524329372562, "use_nesterov": false, "adamw_weight_decay": 0.07642227310908171, "l2_weight_decay": 0.0, "warmup_fraction": 0.0017183061984680284, "min_learning_rate_mult": 0.0, "constant_fraction": 0.40715973868058974}, {"learning_rate": 0.9240991562009095, "beta1": 0.8611579269748804, "beta2": 0.8950711180627892, "epsilon": 8.124354853466915e-07, "use_nesterov": true, "adamw_weight_decay": 1.185788418355489e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.8043194933503905, "constant_fraction": 0.5886829619953604}, {"learning_rate": 0.0003033444884791146, "beta1": 0.7960016377487121, "beta2": 0.869085551376238, "epsilon": 0.0020915261149098523, "use_nesterov": false, "adamw_weight_decay": 0.007356587309209756, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.47336551908529734}, {"learning_rate": 0.1136185324421944, "beta1": 0.9985529664629275, "beta2": 0.9980006687292727, "epsilon": 0.00011435149936969389, "use_nesterov": false, "adamw_weight_decay": 0.0003458534727006035, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.154389469171214}, {"learning_rate": 0.0017173824059168398, "beta1": 0.9704783023041557, "beta2": 0.9996238829046785, "epsilon": 4.375678622515891e-08, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 4.927934173231157e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0008139197156025356, "constant_fraction": 0.7928361354695909}, {"learning_rate": 0.0003421120561880962, "beta1": 0.2521708077469659, "beta2": 0.9657228789772222, "epsilon": 2.9279649682378377e-07, "use_nesterov": true, "adamw_weight_decay": 0.001318163612300234, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.6381198910693957, "constant_fraction": 0.827345330115475}, {"learning_rate": 0.014737491713623948, "beta1": 0.6976128214293794, "beta2": 0.9991714743546354, "epsilon": 0.00021024992800636115, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00010962279343240942, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8414066287580567}, {"learning_rate": 0.04751773530983137, "beta1": 0.4305673578037347, "beta2": 0.9999585534073142, "epsilon": 0.08501392866525068, "use_nesterov": true, "adamw_weight_decay": 0.019501245054243124, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.31612056730730487}, {"learning_rate": 0.017503941884665915, "beta1": 0.9891314017660419, "beta2": 0.999818318654998, "epsilon": 0.0004172805482202484, "use_nesterov": true, "adamw_weight_decay": 0.06617211674371544, "l2_weight_decay": 0.0, "warmup_fraction": 0.06650991854176097, "min_learning_rate_mult": 0.00411903424834363, "constant_fraction": 0.6451687125448781}, {"learning_rate": 0.1011367887270034, "beta1": 0.5490328154544406, "beta2": 0.9777218869080583, "epsilon": 132.76922422076376, "use_nesterov": true, "adamw_weight_decay": 0.0008828400040857791, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.09743309540624216, "constant_fraction": 0.9673241262542214}, {"learning_rate": 0.006205743994108878, "beta1": 0.4391158524206118, "beta2": 0.9185157287733601, "epsilon": 8.11299667626203e-07, "use_nesterov": true, "adamw_weight_decay": 3.5509623728712005e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.45175417865011347, "constant_fraction": 0.01325819075539203}, {"learning_rate": 0.001605867725881288, "beta1": 0.9935170809773529, "beta2": 0.6257271296860358, "epsilon": 6.105429658264248e-06, "use_nesterov": true, "adamw_weight_decay": 0.02968560540753625, "l2_weight_decay": 0.0, "warmup_fraction": 0.0004246646201760265, "min_learning_rate_mult": 0.002279200105353506, "constant_fraction": 0.3825353164018179}, {"learning_rate": 0.1148328601783143, "beta1": 0.8797021271286377, "beta2": 0.8941654047487779, "epsilon": 7.766744654686835e-07, "use_nesterov": false, "adamw_weight_decay": 0.006977936141781617, "l2_weight_decay": 0.0, "warmup_fraction": 1.670547777334913e-05, "min_learning_rate_mult": 0.32482864277548196, "constant_fraction": 0.7304371025724673}, {"learning_rate": 0.0005497123075312411, "beta1": 0.9673043445341869, "beta2": 0.7982992648166137, "epsilon": 2.1804828650338113e-08, "use_nesterov": true, "adamw_weight_decay": 0.000669178168933356, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.05159423495003801}, {"learning_rate": 0.9467583846281915, "beta1": 0.8779326695570369, "beta2": 0.9996562853292086, "epsilon": 3.276280536742398, "use_nesterov": false, "adamw_weight_decay": 0.0009972411491527455, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.003896217044263458, "constant_fraction": 0.6685808643139575}, {"learning_rate": 0.0019999414797787864, "beta1": 0.9880655576006039, "beta2": 0.929282361639323, "epsilon": 8.340033188303708e-06, "use_nesterov": false, "adamw_weight_decay": 0.0001514553578418961, "l2_weight_decay": 0.0, "warmup_fraction": 8.2997105324652e-05, "min_learning_rate_mult": 0.002941773680902664, "constant_fraction": 0.5854119608704601}, {"learning_rate": 0.033015823907242114, "beta1": 0.9857182274488118, "beta2": 0.7042542715381099, "epsilon": 2.9258886241812982, "use_nesterov": false, "adamw_weight_decay": 0.018486884343241472, "l2_weight_decay": 0.00018108188873674553, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.005836884004030548, "constant_fraction": 0.7884308727226825}, {"learning_rate": 0.31785328952337916, "beta1": 0.32561253888757746, "beta2": 0.8388633965242362, "epsilon": 0.0029319684187637846, "use_nesterov": true, "adamw_weight_decay": 0.013592241864799232, "l2_weight_decay": 0.015136583865082171, "warmup_fraction": 0.005179218315347039, "min_learning_rate_mult": 0.18597564245802953, "constant_fraction": 0.682081348125826}, {"learning_rate": 0.0076628419677251996, "beta1": 0.8753896978132706, "beta2": 0.9979411325278748, "epsilon": 0.001596225554066469, "use_nesterov": false, "adamw_weight_decay": 0.00037376564758808735, "l2_weight_decay": 0.0, "warmup_fraction": 0.00011412461770982954, "min_learning_rate_mult": 0.000528976226545964, "constant_fraction": 0.5678721165052417}, {"learning_rate": 0.0035999620113150495, "beta1": 0.5190254517541821, "beta2": 0.9989306238210193, "epsilon": 0.5002237387696323, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00019815216715163248, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.07336598874594835}, {"learning_rate": 0.00013346263883480994, "beta1": 0.7203565971161854, "beta2": 0.995280335456764, "epsilon": 6.085869773191886e-08, "use_nesterov": false, "adamw_weight_decay": 0.000528316228638813, "l2_weight_decay": 0.0030605735956689777, "warmup_fraction": 0.0016912176348707621, "min_learning_rate_mult": 0.0, "constant_fraction": 0.38820419487543534}, {"learning_rate": 0.002664364053267289, "beta1": 0.22402003602491327, "beta2": 0.9986427775338398, "epsilon": 2.5653081675454804e-05, "use_nesterov": true, "adamw_weight_decay": 0.00683636993154649, "l2_weight_decay": 0.0, "warmup_fraction": 1.0607335999081374e-05, "min_learning_rate_mult": 0.010779646347614604, "constant_fraction": 0.04820700364491837}, {"learning_rate": 0.0718156335233699, "beta1": 0.7869957042634564, "beta2": 0.9998104322185879, "epsilon": 0.00036220938307103496, "use_nesterov": true, "adamw_weight_decay": 0.00024539479273387243, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.00045680817866633044, "constant_fraction": 0.12405613431636453}, {"learning_rate": 0.00039143555347458716, "beta1": 0.7575258795913666, "beta2": 0.9999699005858058, "epsilon": 4.1209405655024936e-05, "use_nesterov": false, "adamw_weight_decay": 0.06060582437858091, "l2_weight_decay": 1.9790543051388825e-05, "warmup_fraction": 2.805334425986782e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.4528205075137348}, {"learning_rate": 0.8419298663194243, "beta1": 0.977812572363824, "beta2": 0.936118495101715, "epsilon": 34.44759228866291, "use_nesterov": false, "adamw_weight_decay": 0.00012976412967801644, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.00030051597098696006, "constant_fraction": 0.2139568195387005}, {"learning_rate": 0.002161876298559898, "beta1": 0.7672347005188771, "beta2": 0.9978736761254035, "epsilon": 0.0011122365421095644, "use_nesterov": true, "adamw_weight_decay": 0.00029229718432163896, "l2_weight_decay": 0.0, "warmup_fraction": 1.7208345505656825e-05, "min_learning_rate_mult": 0.005318478649477114, "constant_fraction": 0.5194586522737443}, {"learning_rate": 4.225214963389206e-05, "beta1": 0.7575390892541631, "beta2": 0.9998981996012044, "epsilon": 1.0070983693721689e-06, "use_nesterov": true, "adamw_weight_decay": 0.0009168374072037859, "l2_weight_decay": 0.0, "warmup_fraction": 2.4497746416198248e-05, "min_learning_rate_mult": 9.462203989155691e-05, "constant_fraction": 0.13032841203596812}, {"learning_rate": 0.019330559786754842, "beta1": 0.09919841634220872, "beta2": 0.992382366608737, "epsilon": 0.0013397996591995595, "use_nesterov": false, "adamw_weight_decay": 0.08466105373058126, "l2_weight_decay": 5.1319689711725545e-05, "warmup_fraction": 0.0012530008855071778, "min_learning_rate_mult": 0.00022437338973586268, "constant_fraction": 0.7791473042319687}, {"learning_rate": 0.05351156077198552, "beta1": 0.40163530922830315, "beta2": 0.9999862512484181, "epsilon": 4.093242096159943e-07, "use_nesterov": false, "adamw_weight_decay": 0.00024222179606165926, "l2_weight_decay": 0.005808337338109108, "warmup_fraction": 0.0002535501211759029, "min_learning_rate_mult": 7.779898231879631e-05, "constant_fraction": 0.0929780345005462}, {"learning_rate": 0.53809912091245, "beta1": 0.9408057510734603, "beta2": 0.9994697389637858, "epsilon": 5.712451629535776, "use_nesterov": false, "adamw_weight_decay": 0.00029108931678062004, "l2_weight_decay": 4.234274171690436e-05, "warmup_fraction": 0.0035455220874599206, "min_learning_rate_mult": 0.03097572663857465, "constant_fraction": 0.15897282405427682}, {"learning_rate": 0.00034288820410029516, "beta1": 0.9921673214347393, "beta2": 0.9997243601132744, "epsilon": 0.0002932756793184255, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 3.757756698154666e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2399539437016751}, {"learning_rate": 0.015122622827514734, "beta1": 0.44792108264659425, "beta2": 0.9998769430986968, "epsilon": 9.182694650746448e-06, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.2520850689666434e-05, "warmup_fraction": 0.000256329301972915, "min_learning_rate_mult": 0.0794586108511552, "constant_fraction": 0.04806462658124999}, {"learning_rate": 0.0029351047798516646, "beta1": 0.9138938764270735, "beta2": 0.9992548574486934, "epsilon": 0.040995128766341336, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0008771711485803694, "warmup_fraction": 2.459212774340668e-05, "min_learning_rate_mult": 1.6550470294921915e-05, "constant_fraction": 0.16142721681108319}, {"learning_rate": 0.005050636545921047, "beta1": 0.850953249004073, "beta2": 0.5957345673653647, "epsilon": 0.37313639722572406, "use_nesterov": false, "adamw_weight_decay": 0.001785103038087073, "l2_weight_decay": 0.0, "warmup_fraction": 0.008181974683958489, "min_learning_rate_mult": 0.027343694463852642, "constant_fraction": 0.3437411410658896}, {"learning_rate": 3.075786080955033e-05, "beta1": 0.8498783525717659, "beta2": 0.9999706367676884, "epsilon": 0.0005064765585556977, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00027236035595055617, "warmup_fraction": 1.8522604928076865e-05, "min_learning_rate_mult": 0.0010175944029615172, "constant_fraction": 0.38065912111848954}, {"learning_rate": 0.0076495198211411234, "beta1": 0.6049789312907772, "beta2": 0.9977402315584586, "epsilon": 3.932804135649151e-06, "use_nesterov": false, "adamw_weight_decay": 0.056270160908660286, "l2_weight_decay": 1.3435011978789584e-05, "warmup_fraction": 0.03063002937137159, "min_learning_rate_mult": 0.0, "constant_fraction": 0.25697623775122225}, {"learning_rate": 0.004985207758347677, "beta1": 0.9494850741666294, "beta2": 0.9565263830588709, "epsilon": 0.002264534569048189, "use_nesterov": false, "adamw_weight_decay": 0.004658530202937909, "l2_weight_decay": 0.00029402380059799873, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.1519940416562766, "constant_fraction": 0.37173959073839424}, {"learning_rate": 0.03034294786292426, "beta1": 0.9061005498226232, "beta2": 0.9999651773498998, "epsilon": 0.004448690350257421, "use_nesterov": true, "adamw_weight_decay": 2.813327719125671e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0008097887247146719, "min_learning_rate_mult": 0.0, "constant_fraction": 0.3133020090381139}, {"learning_rate": 0.028073315511253312, "beta1": 0.8697413026923235, "beta2": 0.7157038318821071, "epsilon": 0.01737342824407588, "use_nesterov": true, "adamw_weight_decay": 0.06677169881431481, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9894495517646844}, {"learning_rate": 0.0013354991047485882, "beta1": 0.9216362057253707, "beta2": 0.8782645154807605, "epsilon": 7.977673184197422e-06, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0004562536031699295, "warmup_fraction": 0.07850892499968037, "min_learning_rate_mult": 0.001697612658170397, "constant_fraction": 0.35982260590145687}, {"learning_rate": 0.0023688725610768405, "beta1": 0.38679888662382333, "beta2": 0.9201597145081466, "epsilon": 5.7245388363903584e-08, "use_nesterov": true, "adamw_weight_decay": 0.0015984762586699808, "l2_weight_decay": 0.0, "warmup_fraction": 0.000150654242650776, "min_learning_rate_mult": 4.240393064234011e-05, "constant_fraction": 0.5244234068643924}, {"learning_rate": 0.02321282328618115, "beta1": 0.9607605879155945, "beta2": 0.9978215987322792, "epsilon": 5.557185090631053e-05, "use_nesterov": true, "adamw_weight_decay": 0.03783444168225039, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7527451305743805}, {"learning_rate": 0.16244912634637107, "beta1": 0.9983271575952054, "beta2": 0.2740114231150945, "epsilon": 9.243487459258198, "use_nesterov": true, "adamw_weight_decay": 0.05493699712143326, "l2_weight_decay": 0.000256452729391225, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.12612578569452493, "constant_fraction": 0.9595070350656295}, {"learning_rate": 0.0005336703683568101, "beta1": 0.20114991557744755, "beta2": 0.9733929876364751, "epsilon": 0.0005930710062186807, "use_nesterov": false, "adamw_weight_decay": 0.007354475517632676, "l2_weight_decay": 0.0, "warmup_fraction": 2.542716902701182e-05, "min_learning_rate_mult": 0.00021621614594183216, "constant_fraction": 0.34466683156078026}, {"learning_rate": 0.017631284230044914, "beta1": 0.9936477459450112, "beta2": 0.9999124614578503, "epsilon": 9.478651265128485e-05, "use_nesterov": false, "adamw_weight_decay": 7.949049170218843e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.08272775324270198}, {"learning_rate": 0.005795262567052012, "beta1": 0.6151843281774845, "beta2": 0.8103501748047303, "epsilon": 6.119960205473376e-06, "use_nesterov": false, "adamw_weight_decay": 0.025124193683596217, "l2_weight_decay": 0.0, "warmup_fraction": 0.0592897510146174, "min_learning_rate_mult": 1.1358671433558616e-05, "constant_fraction": 0.6753501046550373}, {"learning_rate": 0.0007372764295666724, "beta1": 0.880060025127238, "beta2": 0.9966643629526017, "epsilon": 0.00200769784849734, "use_nesterov": false, "adamw_weight_decay": 0.0006891842968407736, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.01884616232618778, "constant_fraction": 0.9882519313433598}, {"learning_rate": 0.03586958380963503, "beta1": 0.3971668360073206, "beta2": 0.9373864160256336, "epsilon": 0.00047606043363390037, "use_nesterov": true, "adamw_weight_decay": 0.04035901235401638, "l2_weight_decay": 2.2864560767947387e-05, "warmup_fraction": 0.05367797033434453, "min_learning_rate_mult": 0.0013982863710566187, "constant_fraction": 0.9742798678833579}, {"learning_rate": 0.022632708728709917, "beta1": 0.9698989351370865, "beta2": 0.7610250511329648, "epsilon": 3.320533902975392, "use_nesterov": true, "adamw_weight_decay": 0.0025120828928063338, "l2_weight_decay": 0.0, "warmup_fraction": 0.0021765942059963146, "min_learning_rate_mult": 1.2071593273200754e-05, "constant_fraction": 0.26228067731204985}, {"learning_rate": 0.05629308698386304, "beta1": 0.5797393297665632, "beta2": 0.9733124961914996, "epsilon": 0.16224040199164919, "use_nesterov": false, "adamw_weight_decay": 0.09113819503286849, "l2_weight_decay": 0.001085533345217514, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.5702687056391453, "constant_fraction": 0.40613292541694246}, {"learning_rate": 0.00035879231144031725, "beta1": 0.4813952846992222, "beta2": 0.8385899318291944, "epsilon": 0.0016124268274594314, "use_nesterov": false, "adamw_weight_decay": 0.00725495311054918, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2565677900057758}, {"learning_rate": 0.004255015818872543, "beta1": 0.958352864134369, "beta2": 0.9792972219066615, "epsilon": 5.648345027550803, "use_nesterov": true, "adamw_weight_decay": 1.091665690398036e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 2.7438763192302623e-05, "constant_fraction": 0.3603337565764513}, {"learning_rate": 0.0024729400625813362, "beta1": 0.9814965016928294, "beta2": 0.9988455030462065, "epsilon": 0.0002889693778641971, "use_nesterov": true, "adamw_weight_decay": 0.0002000949668190974, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6178405496166166}, {"learning_rate": 0.06673219541731416, "beta1": 0.10195156915817005, "beta2": 0.9630142906163145, "epsilon": 0.0030009582220666144, "use_nesterov": true, "adamw_weight_decay": 0.01724109882589828, "l2_weight_decay": 1.8890710983609315e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.35032884315856916}, {"learning_rate": 0.0016490070752883325, "beta1": 0.9943609291230994, "beta2": 0.9836200759270353, "epsilon": 0.0003585162548387341, "use_nesterov": true, "adamw_weight_decay": 0.002923330464909713, "l2_weight_decay": 0.0, "warmup_fraction": 0.0006265857485910409, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2547615534452343}, {"learning_rate": 0.11493054031438858, "beta1": 0.6565897871534989, "beta2": 0.863869716972549, "epsilon": 0.3873665259578022, "use_nesterov": false, "adamw_weight_decay": 7.075679560198932e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.019568851639592686, "constant_fraction": 0.7448474603172126}, {"learning_rate": 0.018609802264796887, "beta1": 0.9607345388452747, "beta2": 0.9647243210127938, "epsilon": 0.0038432290108141856, "use_nesterov": false, "adamw_weight_decay": 1.927438176959627e-05, "l2_weight_decay": 0.0, "warmup_fraction": 8.89880756293437e-05, "min_learning_rate_mult": 9.756660537387331e-05, "constant_fraction": 0.3072774591358324}, {"learning_rate": 0.0007999355078347375, "beta1": 0.8330481928415305, "beta2": 0.9989640052917312, "epsilon": 0.0052857798259683736, "use_nesterov": false, "adamw_weight_decay": 0.004446187589970189, "l2_weight_decay": 0.00013975166471247842, "warmup_fraction": 0.00016098553948860176, "min_learning_rate_mult": 0.0, "constant_fraction": 0.39289267531455674}, {"learning_rate": 0.0002528552862959966, "beta1": 0.26006983973065945, "beta2": 0.6069491779015117, "epsilon": 0.000998155486841036, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.2014969631830218e-05, "warmup_fraction": 0.03600010045058839, "min_learning_rate_mult": 0.0, "constant_fraction": 0.1529252672835949}, {"learning_rate": 0.00013099446765822408, "beta1": 0.9646431455120911, "beta2": 0.9675179659790115, "epsilon": 3.7069681035800034e-08, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 2.7870599703153398e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.3616675102733766}, {"learning_rate": 0.2674253212434599, "beta1": 0.9815897815813792, "beta2": 0.9613601274096737, "epsilon": 6.282778473563094, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00014477233398314416, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.392967059978672}, {"learning_rate": 0.005385064741783187, "beta1": 0.24210575246415977, "beta2": 0.9859510014886128, "epsilon": 1.7418243014866453e-08, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.5960509747292272e-05, "warmup_fraction": 0.03693253428233275, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2730291737305116}, {"learning_rate": 0.022638824965945326, "beta1": 0.15081791432204372, "beta2": 0.9835640038114001, "epsilon": 0.00119937825354544, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 2.0397716209047918e-05, "warmup_fraction": 8.991218916800849e-05, "min_learning_rate_mult": 0.054666229353558526, "constant_fraction": 0.5763402900685655}, {"learning_rate": 0.0004948378917658887, "beta1": 0.9863856168428382, "beta2": 0.9998829472856956, "epsilon": 4.512911545213241e-07, "use_nesterov": false, "adamw_weight_decay": 0.00037977968378583526, "l2_weight_decay": 0.0, "warmup_fraction": 3.6293877410488895e-05, "min_learning_rate_mult": 0.0034838126451083628, "constant_fraction": 0.20114266258472013}, {"learning_rate": 0.007092035551944452, "beta1": 0.994975562610554, "beta2": 0.9988441543620612, "epsilon": 0.00046719820734180957, "use_nesterov": true, "adamw_weight_decay": 3.241560941738795e-05, "l2_weight_decay": 0.0004428645552935252, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0001608487833116635, "constant_fraction": 0.17189839520138472}, {"learning_rate": 0.03535826577107603, "beta1": 0.13772066248534942, "beta2": 0.7966648067237371, "epsilon": 0.1334175132678006, "use_nesterov": true, "adamw_weight_decay": 0.00017600272090871228, "l2_weight_decay": 0.0, "warmup_fraction": 2.122947820576959e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.11637690326585759}, {"learning_rate": 0.00028168357099500027, "beta1": 0.9553779472950821, "beta2": 0.9966512173754323, "epsilon": 0.0007581536054654355, "use_nesterov": true, "adamw_weight_decay": 0.01968540062814908, "l2_weight_decay": 0.0, "warmup_fraction": 1.9086261577600915e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.4671683764185772}, {"learning_rate": 0.0010480202118009123, "beta1": 0.9351418668610336, "beta2": 0.9791420592841489, "epsilon": 0.024184576117285292, "use_nesterov": true, "adamw_weight_decay": 0.0007869533697267028, "l2_weight_decay": 0.0, "warmup_fraction": 0.00043865735900454583, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9351701845357883}, {"learning_rate": 0.0018410728768511533, "beta1": 0.9759641356250115, "beta2": 0.9998449796777209, "epsilon": 0.04490260578906858, "use_nesterov": true, "adamw_weight_decay": 0.00011527177310804488, "l2_weight_decay": 0.00855493640044763, "warmup_fraction": 2.4104776094084335e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2618323851660326}, {"learning_rate": 0.023537099679341433, "beta1": 0.4540831242711527, "beta2": 0.9998966516891556, "epsilon": 0.209864973972594, "use_nesterov": true, "adamw_weight_decay": 0.010515397780791086, "l2_weight_decay": 0.0008148351571165988, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.007454538623536376, "constant_fraction": 0.6563079293826253}, {"learning_rate": 0.0025149317719032377, "beta1": 0.951581103089487, "beta2": 0.9990605573501696, "epsilon": 0.0005318005698373361, "use_nesterov": true, "adamw_weight_decay": 6.0381107579601176e-05, "l2_weight_decay": 0.009795204918348493, "warmup_fraction": 0.01015758485527111, "min_learning_rate_mult": 0.0, "constant_fraction": 0.054384272992565874}, {"learning_rate": 0.00024821804650233413, "beta1": 0.908217419207584, "beta2": 0.9099838475123146, "epsilon": 2.254063493611947e-08, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0010890918894423712, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.14793675913114246}, {"learning_rate": 0.007655398411165242, "beta1": 0.9818225159752517, "beta2": 0.9968611745152369, "epsilon": 5.786955822727182e-06, "use_nesterov": true, "adamw_weight_decay": 0.007907782133444495, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.7739464133732971, "constant_fraction": 0.00797169656493002}, {"learning_rate": 0.0006552203339367358, "beta1": 0.9765662769384855, "beta2": 0.9996107244628482, "epsilon": 2.4741591400660183e-05, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00035944419076198964, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.04124479304259765}, {"learning_rate": 0.005240918941188341, "beta1": 0.9800239734313843, "beta2": 0.9999678114728205, "epsilon": 1.334501420182941e-06, "use_nesterov": false, "adamw_weight_decay": 0.034971418109883586, "l2_weight_decay": 0.0, "warmup_fraction": 0.00015379805952388302, "min_learning_rate_mult": 0.005732510882419294, "constant_fraction": 0.5554937730024632}, {"learning_rate": 0.013645246270366665, "beta1": 0.7949672995072423, "beta2": 0.9999429138059609, "epsilon": 0.023289489850239403, "use_nesterov": false, "adamw_weight_decay": 0.0013231654202281542, "l2_weight_decay": 0.0016090156114426377, "warmup_fraction": 0.0006666927873046041, "min_learning_rate_mult": 0.008123801278862579, "constant_fraction": 0.2308133619014412}, {"learning_rate": 0.0017710450822539558, "beta1": 0.4091046282579912, "beta2": 0.9999828444558054, "epsilon": 3.055432159946844e-06, "use_nesterov": false, "adamw_weight_decay": 1.0576799120141817e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.001163647734979517, "min_learning_rate_mult": 1.0396931006402346e-05, "constant_fraction": 0.6054811786191991}, {"learning_rate": 0.6224654241247495, "beta1": 0.9560725897560507, "beta2": 0.995039858033415, "epsilon": 2.0126510816558933e-06, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.9333459303366055e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2437932883501157}, {"learning_rate": 0.0029605685754178243, "beta1": 0.9798178085043069, "beta2": 0.8619830860175198, "epsilon": 0.6101214361711133, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0023243625615719, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5525451593075731}, {"learning_rate": 0.012905186889196665, "beta1": 0.5259569088825953, "beta2": 0.9999484960492412, "epsilon": 0.1226066122665656, "use_nesterov": true, "adamw_weight_decay": 0.0002411521272746668, "l2_weight_decay": 0.0, "warmup_fraction": 1.7322461903443057e-05, "min_learning_rate_mult": 0.0014950641394429127, "constant_fraction": 0.8946869589928942}, {"learning_rate": 0.2743976120401293, "beta1": 0.99709785734259, "beta2": 0.9013928417941852, "epsilon": 3.4176903967604924, "use_nesterov": false, "adamw_weight_decay": 0.039067226080177486, "l2_weight_decay": 0.0017123788876274495, "warmup_fraction": 0.0004014172591258483, "min_learning_rate_mult": 0.4789356156072599, "constant_fraction": 0.6005565177266565}, {"learning_rate": 0.12897160369203342, "beta1": 0.9634286215132759, "beta2": 0.9841816720036781, "epsilon": 2.7524498175494403e-08, "use_nesterov": true, "adamw_weight_decay": 6.412893613197517e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.09167857770523191}, {"learning_rate": 0.01651285951711436, "beta1": 0.8894232106382379, "beta2": 0.9962085509991604, "epsilon": 1.3681985962630137, "use_nesterov": true, "adamw_weight_decay": 0.0018003853271715373, "l2_weight_decay": 0.0, "warmup_fraction": 0.0020052049086760303, "min_learning_rate_mult": 0.0, "constant_fraction": 0.28759181054720406}, {"learning_rate": 0.0037370464109916855, "beta1": 0.23260253189778057, "beta2": 0.9538156760297238, "epsilon": 1.9347680865973533e-08, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00018089576293281123, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.4510268880954925}, {"learning_rate": 0.0126369844922579, "beta1": 0.9874651350172847, "beta2": 0.9711133985675087, "epsilon": 1.3554747709183285e-06, "use_nesterov": true, "adamw_weight_decay": 0.008065879572815987, "l2_weight_decay": 0.0, "warmup_fraction": 2.4400354749331426e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.4774891554966608}, {"learning_rate": 0.0007301383570644908, "beta1": 0.9352621552787523, "beta2": 0.9987263183452451, "epsilon": 1.28453609569386e-07, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0003720930640337948, "warmup_fraction": 0.00017129526210561983, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5839661981316295}, {"learning_rate": 0.00027521430652426633, "beta1": 0.7992118437180444, "beta2": 0.9959541094138679, "epsilon": 6.614204894493038e-06, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.2658091075509493e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.32292705158287716}, {"learning_rate": 0.013827099054979839, "beta1": 0.9604850932582151, "beta2": 0.9997702884229118, "epsilon": 8.797874243771355e-05, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.013789063520189226, "warmup_fraction": 4.278253706512248e-05, "min_learning_rate_mult": 0.1997659544936631, "constant_fraction": 0.7425506646162805}, {"learning_rate": 0.015260851752553118, "beta1": 0.8822260232776884, "beta2": 0.9979261408017531, "epsilon": 0.3132090384523755, "use_nesterov": false, "adamw_weight_decay": 0.0005372734371991511, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0008403627605445134, "constant_fraction": 0.7559355341938382}, {"learning_rate": 0.010435511867497839, "beta1": 0.9078132196031427, "beta2": 0.968388025964469, "epsilon": 8.85157124476991e-05, "use_nesterov": true, "adamw_weight_decay": 0.00022492519118541202, "l2_weight_decay": 0.0, "warmup_fraction": 2.8898476884053378e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7701245141225076}, {"learning_rate": 0.05988286008946251, "beta1": 0.9989544542213168, "beta2": 0.9977814056532254, "epsilon": 1.3125772447042418e-05, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0024074894050741423, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9451827254236849}, {"learning_rate": 0.0026856903192736827, "beta1": 0.9128134823700957, "beta2": 0.9999875751862817, "epsilon": 0.2560113080761634, "use_nesterov": true, "adamw_weight_decay": 0.0039042774630906655, "l2_weight_decay": 1.5592199126609664e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0015407350228623861, "constant_fraction": 0.06514672045364}, {"learning_rate": 0.02315684084302266, "beta1": 0.0017630609018862708, "beta2": 0.24933653281658263, "epsilon": 87.88478983407299, "use_nesterov": true, "adamw_weight_decay": 0.02936064549428679, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5715060886949156}, {"learning_rate": 0.0014200194408531012, "beta1": 0.9859828330689878, "beta2": 0.9999686300935186, "epsilon": 1.3531445099837233e-07, "use_nesterov": true, "adamw_weight_decay": 0.0011003321621205387, "l2_weight_decay": 0.0, "warmup_fraction": 0.03911696569047552, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8689536967486287}, {"learning_rate": 0.015534599050890186, "beta1": 0.24415124264402144, "beta2": 0.9719356571800822, "epsilon": 4.405119963042532e-07, "use_nesterov": false, "adamw_weight_decay": 6.294348572893663e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9929590671033853}, {"learning_rate": 0.003293414114734189, "beta1": 0.5833936694033075, "beta2": 0.910302804168016, "epsilon": 0.08460127133093737, "use_nesterov": false, "adamw_weight_decay": 1.535968073019442e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.3947094128204991}, {"learning_rate": 0.12511802793578114, "beta1": 0.9770321575658111, "beta2": 0.996049066507413, "epsilon": 0.0012802055415149828, "use_nesterov": false, "adamw_weight_decay": 0.05101725621456468, "l2_weight_decay": 4.480567513856866e-05, "warmup_fraction": 0.00010064465341111626, "min_learning_rate_mult": 0.001327259499708592, "constant_fraction": 0.6237025681872427}, {"learning_rate": 0.24038653013684008, "beta1": 0.9960975384266212, "beta2": 0.9992934125003209, "epsilon": 3.8721020047449417, "use_nesterov": true, "adamw_weight_decay": 0.03528268355846348, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.16838241419556232, "constant_fraction": 0.478192786341995}, {"learning_rate": 0.004987097059061684, "beta1": 0.8716749990061345, "beta2": 0.9998782069955856, "epsilon": 392.8699512438671, "use_nesterov": true, "adamw_weight_decay": 0.03818954949371046, "l2_weight_decay": 0.0, "warmup_fraction": 0.0014429876021980368, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7013674992945794}, {"learning_rate": 0.00012947231860307133, "beta1": 0.97417378212083, "beta2": 0.9589137656379667, "epsilon": 8.073606004738731e-07, "use_nesterov": true, "adamw_weight_decay": 0.015018479557758249, "l2_weight_decay": 0.0, "warmup_fraction": 4.433474054697261e-05, "min_learning_rate_mult": 0.0264220527012815, "constant_fraction": 0.5324899925175024}, {"learning_rate": 0.07867825266725731, "beta1": 0.8508209047742343, "beta2": 0.9986258254601117, "epsilon": 0.22538551678663193, "use_nesterov": false, "adamw_weight_decay": 0.09049882208857753, "l2_weight_decay": 0.0, "warmup_fraction": 0.0003469961169967077, "min_learning_rate_mult": 0.015649906042983157, "constant_fraction": 0.6599492997527072}, {"learning_rate": 0.01076435950462371, "beta1": 0.8479940884819016, "beta2": 0.9999131901303134, "epsilon": 0.008767580644509887, "use_nesterov": false, "adamw_weight_decay": 0.0016786693760900025, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.18616405474078723}, {"learning_rate": 0.0013770222618406608, "beta1": 0.9230529038263418, "beta2": 0.9992684825114927, "epsilon": 0.01723248256662958, "use_nesterov": true, "adamw_weight_decay": 0.0010517413386163636, "l2_weight_decay": 0.0, "warmup_fraction": 0.005832701313753735, "min_learning_rate_mult": 0.5335590413134687, "constant_fraction": 0.6910263557485928}, {"learning_rate": 0.05991253477469478, "beta1": 0.25075308200172963, "beta2": 0.9968287162361673, "epsilon": 6.072022493071219, "use_nesterov": true, "adamw_weight_decay": 2.348108070240037e-05, "l2_weight_decay": 0.0, "warmup_fraction": 6.534886794176106e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7664811181022799}, {"learning_rate": 0.008296836361763127, "beta1": 0.33302975884465646, "beta2": 0.9998122882621882, "epsilon": 7.363920597614585e-05, "use_nesterov": false, "adamw_weight_decay": 0.03596331000118363, "l2_weight_decay": 0.0007797747557129984, "warmup_fraction": 1.2135381659685546e-05, "min_learning_rate_mult": 0.2398589167064265, "constant_fraction": 0.48433106831355466}, {"learning_rate": 0.0010991808773714664, "beta1": 0.9798234866913996, "beta2": 0.9715428341699145, "epsilon": 1.9229944275001372e-06, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0001477755048196289, "warmup_fraction": 3.66974152498129e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9524129138831348}, {"learning_rate": 0.0007757214017264586, "beta1": 0.991277164014007, "beta2": 0.9956301844894834, "epsilon": 5.770887157474783e-06, "use_nesterov": false, "adamw_weight_decay": 0.09049817117347597, "l2_weight_decay": 0.03429263789891721, "warmup_fraction": 0.0011857364247750061, "min_learning_rate_mult": 0.00014185395288030553, "constant_fraction": 0.6020860549171245}, {"learning_rate": 0.018453337594683452, "beta1": 0.9969448486645008, "beta2": 0.9448186396936405, "epsilon": 0.371838308278872, "use_nesterov": false, "adamw_weight_decay": 0.0027804034565577264, "l2_weight_decay": 0.0, "warmup_fraction": 6.175091827959986e-05, "min_learning_rate_mult": 2.289604494579471e-05, "constant_fraction": 0.05927578336058026}, {"learning_rate": 0.6402610283597836, "beta1": 0.9344617388997203, "beta2": 0.9979587879967253, "epsilon": 11.309491583783192, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0008869542139248811, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0005243679574786853, "constant_fraction": 0.5082668477735848}, {"learning_rate": 0.28056294462223763, "beta1": 0.9878005153026121, "beta2": 0.9198628221786413, "epsilon": 0.00027102568140728453, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.4579503665356418e-05, "warmup_fraction": 0.0001199722167836134, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7780825640362854}, {"learning_rate": 0.0012691138609008615, "beta1": 0.9814795498184988, "beta2": 0.9023987834237743, "epsilon": 0.03293526894156421, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0001213980631717083, "warmup_fraction": 0.056233480398215144, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6866175239103398}, {"learning_rate": 0.019381313752157594, "beta1": 0.8723936121736572, "beta2": 0.9752230663198042, "epsilon": 7.141465748275466e-05, "use_nesterov": true, "adamw_weight_decay": 0.0010487996881050725, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.053993759666936314, "constant_fraction": 0.7052502257804253}, {"learning_rate": 0.02329689296068077, "beta1": 0.8873437699861644, "beta2": 0.9968409214695484, "epsilon": 0.0014362583326230569, "use_nesterov": true, "adamw_weight_decay": 9.282238352657935e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.059528839391253405, "min_learning_rate_mult": 0.0006780117193301016, "constant_fraction": 0.6976679460383692}, {"learning_rate": 0.013566987718228953, "beta1": 0.7271265235112772, "beta2": 0.9995729890188512, "epsilon": 0.0009436129394422457, "use_nesterov": false, "adamw_weight_decay": 0.017018934626987687, "l2_weight_decay": 0.0, "warmup_fraction": 5.767904145021253e-05, "min_learning_rate_mult": 0.0014697404133805307, "constant_fraction": 0.3819585205295133}, {"learning_rate": 0.10411767766241817, "beta1": 0.9912522313276194, "beta2": 0.9992476528019947, "epsilon": 8.757913497938685e-08, "use_nesterov": false, "adamw_weight_decay": 5.865937229629765e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.552239638219658}, {"learning_rate": 0.013023495397708992, "beta1": 0.6539419174992374, "beta2": 0.9998263783011304, "epsilon": 3.963934682335024e-07, "use_nesterov": false, "adamw_weight_decay": 0.00032427655690716635, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7431265152353408}, {"learning_rate": 0.0899672999899066, "beta1": 0.3456667377144317, "beta2": 0.8728807908102283, "epsilon": 4.858124259624369e-05, "use_nesterov": true, "adamw_weight_decay": 1.4160455763500624e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.1044504016456066}, {"learning_rate": 0.12192528080611008, "beta1": 0.9243489853877745, "beta2": 0.2986616989580152, "epsilon": 3.029036947373334, "use_nesterov": false, "adamw_weight_decay": 0.05261983194802087, "l2_weight_decay": 0.000794770582832317, "warmup_fraction": 0.0, "min_learning_rate_mult": 4.1757369064920586e-05, "constant_fraction": 0.280915418914609}, {"learning_rate": 0.19967555469534556, "beta1": 0.029531191623897834, "beta2": 0.991090559682028, "epsilon": 8.064193036757631, "use_nesterov": true, "adamw_weight_decay": 0.021548920933331737, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0007552506769237623, "constant_fraction": 0.06863694958728972}, {"learning_rate": 0.3421291827824831, "beta1": 0.839624202118824, "beta2": 0.9989653082450918, "epsilon": 3.8467047480655844e-05, "use_nesterov": false, "adamw_weight_decay": 0.010698676248820366, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 2.917252672991638e-05, "constant_fraction": 0.748273672588207}, {"learning_rate": 0.15105408772922357, "beta1": 0.16412355181783667, "beta2": 0.9983169168696564, "epsilon": 0.6754396038458041, "use_nesterov": false, "adamw_weight_decay": 0.005414444675620732, "l2_weight_decay": 0.0, "warmup_fraction": 0.06838814092003954, "min_learning_rate_mult": 0.0012010540032213084, "constant_fraction": 0.9524154377154802}, {"learning_rate": 0.04192390238617632, "beta1": 0.2326607679928302, "beta2": 0.9999753803192444, "epsilon": 3.5591477993154e-07, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.673480980977649e-05, "warmup_fraction": 2.6125041819935977e-05, "min_learning_rate_mult": 0.000319688041195497, "constant_fraction": 0.87471861348328}, {"learning_rate": 0.0016142190184851232, "beta1": 0.8696063180644511, "beta2": 0.9943543488647871, "epsilon": 230.56225546924566, "use_nesterov": true, "adamw_weight_decay": 0.0006198802527941006, "l2_weight_decay": 0.0006772584124051061, "warmup_fraction": 7.668243652566069e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5612893239864358}, {"learning_rate": 0.16441615149909594, "beta1": 0.8547323178865828, "beta2": 0.9836283487917175, "epsilon": 2651.1170582770033, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.1705800265323498e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.017963073603684435, "constant_fraction": 0.07176641072453893}, {"learning_rate": 0.19907323770298774, "beta1": 0.09510929382116962, "beta2": 0.8800860776739148, "epsilon": 2.0578962778260835e-06, "use_nesterov": true, "adamw_weight_decay": 0.000140146028637295, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6079596908622462}, {"learning_rate": 0.004369142724253012, "beta1": 0.8415187173775391, "beta2": 0.9999397312076621, "epsilon": 0.00036456927789902847, "use_nesterov": true, "adamw_weight_decay": 0.03021500990701344, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0023743545568784314, "constant_fraction": 0.9218482050447006}, {"learning_rate": 0.0073676850750988695, "beta1": 0.995314204934738, "beta2": 0.9375859678777715, "epsilon": 0.7832057432372563, "use_nesterov": false, "adamw_weight_decay": 4.507223373162878e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.05828342580335166}, {"learning_rate": 0.022981705113841358, "beta1": 0.9257641378437944, "beta2": 0.9993607638118357, "epsilon": 0.0001185815367223993, "use_nesterov": true, "adamw_weight_decay": 0.0020540915423214105, "l2_weight_decay": 0.0, "warmup_fraction": 0.03660794861875707, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6211892612444446}, {"learning_rate": 0.00037411786809741197, "beta1": 0.9647652720307804, "beta2": 0.9918020712527764, "epsilon": 6.179194231350513e-07, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0030377485145124078, "warmup_fraction": 0.01499453865345897, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9946822915240985}, {"learning_rate": 2.2920454488161767e-05, "beta1": 0.8401571830611708, "beta2": 0.9997421376499773, "epsilon": 1.3987975168140132e-06, "use_nesterov": true, "adamw_weight_decay": 2.0721411502658612e-05, "l2_weight_decay": 0.0, "warmup_fraction": 4.120622506404625e-05, "min_learning_rate_mult": 0.42607084544349466, "constant_fraction": 0.9838309182561652}, {"learning_rate": 0.00023691939529349681, "beta1": 0.890435914008428, "beta2": 0.99775473513386, "epsilon": 0.0008738186129205545, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.034055521240836474, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5376309790001482}, {"learning_rate": 0.46539216961360813, "beta1": 0.424285129100342, "beta2": 0.7585328798033393, "epsilon": 0.028787925063525607, "use_nesterov": false, "adamw_weight_decay": 3.411318624236937e-05, "l2_weight_decay": 0.0063085365761472514, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.002727885862030008, "constant_fraction": 0.6668942591632034}, {"learning_rate": 0.009751054650813714, "beta1": 0.6956211131931507, "beta2": 0.8085329568514862, "epsilon": 0.003620400944335599, "use_nesterov": false, "adamw_weight_decay": 0.0009093472106598998, "l2_weight_decay": 0.0, "warmup_fraction": 0.0075894808852545615, "min_learning_rate_mult": 1.718098555549216e-05, "constant_fraction": 0.591251851328669}, {"learning_rate": 4.461952041386242e-05, "beta1": 0.9536443180352802, "beta2": 0.9927221844841596, "epsilon": 0.04107885922814439, "use_nesterov": true, "adamw_weight_decay": 0.0012960344097265933, "l2_weight_decay": 0.013030338320919417, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.27772938954631826, "constant_fraction": 0.3245758389999376}, {"learning_rate": 0.3814186857372305, "beta1": 0.9924227849670088, "beta2": 0.9991786676774166, "epsilon": 67.99587450729007, "use_nesterov": false, "adamw_weight_decay": 0.07687872134881311, "l2_weight_decay": 0.0, "warmup_fraction": 0.0009749179203440622, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9396191373862904}, {"learning_rate": 0.9945289112181416, "beta1": 0.8222630965156085, "beta2": 0.9727052651183921, "epsilon": 0.0001594000965295237, "use_nesterov": true, "adamw_weight_decay": 0.0007845349505795048, "l2_weight_decay": 0.0, "warmup_fraction": 0.0009099727225850322, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6476642653403826}, {"learning_rate": 0.0018207275804423253, "beta1": 0.8384772475180772, "beta2": 0.9994065403687725, "epsilon": 0.3448426412399011, "use_nesterov": true, "adamw_weight_decay": 0.0003847543706831789, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7402351596502392}, {"learning_rate": 0.04284435939553709, "beta1": 0.9022541578480916, "beta2": 0.99940684054184, "epsilon": 117.02892632177026, "use_nesterov": true, "adamw_weight_decay": 8.553693328756405e-05, "l2_weight_decay": 0.019416678579409197, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9187503409103914}, {"learning_rate": 0.00020878762979817896, "beta1": 0.9922296879220267, "beta2": 0.9414103882364963, "epsilon": 0.5571082809990765, "use_nesterov": true, "adamw_weight_decay": 0.001881900323458898, "l2_weight_decay": 0.0, "warmup_fraction": 0.0008405562183828854, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5886896084765049}, {"learning_rate": 0.006790257179528508, "beta1": 0.9977850525089806, "beta2": 0.9990904504071343, "epsilon": 0.0019622817788559326, "use_nesterov": false, "adamw_weight_decay": 0.00929592185838287, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.1503516275616702, "constant_fraction": 0.8291180126263541}, {"learning_rate": 0.00822528742071973, "beta1": 0.1675463126888732, "beta2": 0.3443978903037914, "epsilon": 1.6307008072651287e-08, "use_nesterov": true, "adamw_weight_decay": 0.001344663044729704, "l2_weight_decay": 5.121036733197683e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.05390752136105237}, {"learning_rate": 0.003435717681758884, "beta1": 0.9522653550424126, "beta2": 0.9985075820062271, "epsilon": 12.553000070980442, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 7.771353164314125e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.15994664573242412}, {"learning_rate": 0.10311391146567439, "beta1": 0.5083110612663718, "beta2": 0.9997249263354113, "epsilon": 23.307287706410506, "use_nesterov": false, "adamw_weight_decay": 0.0020774643473865898, "l2_weight_decay": 0.000296055440951101, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.34830928181838106}, {"learning_rate": 0.10132678894265121, "beta1": 0.987752225704418, "beta2": 0.9998846335532777, "epsilon": 6.41747112528794e-08, "use_nesterov": true, "adamw_weight_decay": 0.05209389342949178, "l2_weight_decay": 0.0, "warmup_fraction": 0.0006109201431719138, "min_learning_rate_mult": 0.0, "constant_fraction": 0.09593456654385246}, {"learning_rate": 0.0008781565939545333, "beta1": 0.09972820850859443, "beta2": 0.9999282742516604, "epsilon": 0.0011750138403328343, "use_nesterov": false, "adamw_weight_decay": 0.005342728227756276, "l2_weight_decay": 0.0, "warmup_fraction": 0.022767244505491974, "min_learning_rate_mult": 1.0663302071147409e-05, "constant_fraction": 0.07141387366858198}, {"learning_rate": 0.4315445887637084, "beta1": 0.6140202640814005, "beta2": 0.9999162184610435, "epsilon": 0.00013092554115140214, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 6.277221923652387e-05, "warmup_fraction": 6.558289568068631e-05, "min_learning_rate_mult": 0.048494621847040474, "constant_fraction": 0.01723108747531399}, {"learning_rate": 0.00605127671462394, "beta1": 0.8953545644960359, "beta2": 0.9999689932016114, "epsilon": 0.012321390679472688, "use_nesterov": true, "adamw_weight_decay": 0.019208398767777024, "l2_weight_decay": 0.0, "warmup_fraction": 0.012955698251526605, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9985108200071299}, {"learning_rate": 0.020915007652870774, "beta1": 0.9816178968905618, "beta2": 0.9997824349765477, "epsilon": 0.0003575106351994028, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0002596102492536051, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.02745187901022627, "constant_fraction": 0.772960395344114}, {"learning_rate": 0.025102222059680036, "beta1": 0.1260545444488087, "beta2": 0.9427012541483917, "epsilon": 0.08274320415480915, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 5.0350495924988986e-05, "warmup_fraction": 0.0016686111851210077, "min_learning_rate_mult": 0.0, "constant_fraction": 0.3220707443363978}, {"learning_rate": 0.019783918610695873, "beta1": 0.8474310284929465, "beta2": 0.1251730616957274, "epsilon": 1440.6571127165016, "use_nesterov": false, "adamw_weight_decay": 0.0009322022352753782, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0002876100724694453, "constant_fraction": 0.038802103728877935}, {"learning_rate": 0.6322383822567756, "beta1": 0.984593022423469, "beta2": 0.9999504587445255, "epsilon": 1.9836901854509223e-06, "use_nesterov": false, "adamw_weight_decay": 8.522974416984825e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0002366262608670533, "constant_fraction": 0.1256889723724085}, {"learning_rate": 0.003295715688511139, "beta1": 0.9233411587034609, "beta2": 0.9048654945876934, "epsilon": 0.005279525081908732, "use_nesterov": true, "adamw_weight_decay": 0.0004848369148371181, "l2_weight_decay": 5.257228252693113e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.13883021852691974, "constant_fraction": 0.9402456532015023}, {"learning_rate": 0.0009537315130404785, "beta1": 0.9981104206933681, "beta2": 0.9999408052004845, "epsilon": 0.0007156185842629567, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.017384488022176757, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.31412090300077355}, {"learning_rate": 0.16417690383811367, "beta1": 0.9427790987485776, "beta2": 0.7006745309053013, "epsilon": 63.04082878971145, "use_nesterov": false, "adamw_weight_decay": 0.00014576032325304926, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.002315385371169962, "constant_fraction": 0.9609169974031246}, {"learning_rate": 0.09263709517860673, "beta1": 0.9632677790318591, "beta2": 0.9997221053902764, "epsilon": 9.278665604306666e-07, "use_nesterov": true, "adamw_weight_decay": 3.155116481969525e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0012887519417553396, "min_learning_rate_mult": 0.0, "constant_fraction": 0.24666084723094717}, {"learning_rate": 0.01258429000322565, "beta1": 0.9748193858028378, "beta2": 0.9810460517306594, "epsilon": 0.05919290623614127, "use_nesterov": true, "adamw_weight_decay": 0.004230817755779783, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8712580742399231}, {"learning_rate": 0.0018569120614589886, "beta1": 0.8594442444631316, "beta2": 0.6708832618400049, "epsilon": 0.0009609429795475088, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.03164444846304121, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.11871000109582902, "constant_fraction": 0.6888712204875518}, {"learning_rate": 0.0034248115678230787, "beta1": 0.9951073540334433, "beta2": 0.9152436302668332, "epsilon": 1.0541917748941824e-05, "use_nesterov": false, "adamw_weight_decay": 0.06833045828468752, "l2_weight_decay": 0.00018618545617168328, "warmup_fraction": 3.3041198789270416e-05, "min_learning_rate_mult": 0.06556244042106991, "constant_fraction": 0.7263207037314479}, {"learning_rate": 0.48195518325691183, "beta1": 0.8640215617315968, "beta2": 0.9946290101501138, "epsilon": 457.01465005602984, "use_nesterov": false, "adamw_weight_decay": 0.05413164625172243, "l2_weight_decay": 0.0, "warmup_fraction": 0.006613592063766546, "min_learning_rate_mult": 0.3032199142133492, "constant_fraction": 0.8479708626460396}, {"learning_rate": 0.01677207659570755, "beta1": 0.7198052929904057, "beta2": 0.9926988839927356, "epsilon": 1.882710468714079e-08, "use_nesterov": true, "adamw_weight_decay": 6.018915405887649e-05, "l2_weight_decay": 5.306779908586969e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.737590548163097, "constant_fraction": 0.5993183940169932}, {"learning_rate": 0.0137576604800053, "beta1": 0.7270104843964018, "beta2": 0.8918552150418698, "epsilon": 3.438468571772097e-07, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00017317690431456037, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.34448288535286675}, {"learning_rate": 0.0077351241650570075, "beta1": 0.9986600755215074, "beta2": 0.9999892179751438, "epsilon": 3.3673984779296488e-06, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 3.49605130644589e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6394554062309439}, {"learning_rate": 0.025789212993035916, "beta1": 0.9061037008031974, "beta2": 0.9960632752291046, "epsilon": 4.191873980094725, "use_nesterov": true, "adamw_weight_decay": 0.0640760546122682, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 8.514082434066225e-05, "constant_fraction": 0.6126044822378198}, {"learning_rate": 0.019632599068302493, "beta1": 0.9586135618912424, "beta2": 0.9860681178218872, "epsilon": 1.7062924833700837, "use_nesterov": false, "adamw_weight_decay": 3.0324004691195464e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.00017538849463706366, "min_learning_rate_mult": 0.0005249347103009662, "constant_fraction": 0.09706538506229023}, {"learning_rate": 0.5113996921223084, "beta1": 0.9770133537224546, "beta2": 0.9987604696755458, "epsilon": 6.142774677582399e-05, "use_nesterov": true, "adamw_weight_decay": 2.726024800174171e-05, "l2_weight_decay": 0.0, "warmup_fraction": 3.9983458603513536e-05, "min_learning_rate_mult": 2.0363489938675084e-05, "constant_fraction": 0.6141608739283829}, {"learning_rate": 0.009159823356497345, "beta1": 0.9505987145064679, "beta2": 0.9997873438433751, "epsilon": 2.2975881142832392e-08, "use_nesterov": false, "adamw_weight_decay": 1.2992081882149517e-05, "l2_weight_decay": 0.017294310537637483, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0004546349316003164, "constant_fraction": 0.1452918059926961}, {"learning_rate": 0.0941365383560292, "beta1": 0.9972965003871401, "beta2": 0.9995965679825132, "epsilon": 0.00011376715025499686, "use_nesterov": true, "adamw_weight_decay": 0.012086360531888603, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0008844611889412506, "constant_fraction": 0.46983582546687663}, {"learning_rate": 0.006133954293406546, "beta1": 0.9647093056077968, "beta2": 0.7338342451911373, "epsilon": 1.7231872582299593e-05, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00024578801021433506, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.11471547011034322}, {"learning_rate": 0.023270170486803854, "beta1": 0.9868596910863907, "beta2": 0.9996224728968479, "epsilon": 1.703416803482406e-05, "use_nesterov": true, "adamw_weight_decay": 0.02766823292887286, "l2_weight_decay": 2.062394916578441e-05, "warmup_fraction": 1.342264502537682e-05, "min_learning_rate_mult": 0.0015233542037717737, "constant_fraction": 0.7331818298192633}, {"learning_rate": 0.00011435787383411343, "beta1": 0.3091873486517305, "beta2": 0.9881693544880124, "epsilon": 4.4141350498757947e-07, "use_nesterov": false, "adamw_weight_decay": 0.00047442725455745777, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.08601404722624617}, {"learning_rate": 0.01315653314095858, "beta1": 0.8852398912205006, "beta2": 0.9899347266303515, "epsilon": 4.9176775965172866e-05, "use_nesterov": false, "adamw_weight_decay": 0.00011037182489151941, "l2_weight_decay": 0.0, "warmup_fraction": 4.5113910266538476e-05, "min_learning_rate_mult": 0.8142565024816273, "constant_fraction": 0.7194077795982311}, {"learning_rate": 0.006794713364885392, "beta1": 0.8635285728654929, "beta2": 0.9992523027234685, "epsilon": 2.0636595932164825e-08, "use_nesterov": true, "adamw_weight_decay": 0.08328708981648836, "l2_weight_decay": 0.014119154685396155, "warmup_fraction": 1.3737112020094687e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6453259324748636}, {"learning_rate": 0.9570879012208998, "beta1": 0.9533923412439109, "beta2": 0.9999777584969239, "epsilon": 76.4353332107754, "use_nesterov": true, "adamw_weight_decay": 0.03425725947401975, "l2_weight_decay": 0.0, "warmup_fraction": 0.015292925876652813, "min_learning_rate_mult": 0.021544863244142436, "constant_fraction": 0.668612279530753}, {"learning_rate": 0.2396374407781059, "beta1": 0.9777913683096756, "beta2": 0.9999880195706415, "epsilon": 4.882790512421987e-05, "use_nesterov": true, "adamw_weight_decay": 0.0031696218125413993, "l2_weight_decay": 0.02693213003703406, "warmup_fraction": 7.396389601730095e-05, "min_learning_rate_mult": 3.711147751836023e-05, "constant_fraction": 0.5899802526821165}, {"learning_rate": 0.6119705359848147, "beta1": 0.7660719131709677, "beta2": 0.9999492646333403, "epsilon": 0.0009022557841055048, "use_nesterov": false, "adamw_weight_decay": 9.116896416491339e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0065863687697139735, "min_learning_rate_mult": 0.0, "constant_fraction": 0.056189169754257806}, {"learning_rate": 0.09883683787423758, "beta1": 0.992459172907466, "beta2": 0.996618307273998, "epsilon": 0.008944683423570146, "use_nesterov": true, "adamw_weight_decay": 0.0004420000907805581, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.07755501293110245}, {"learning_rate": 0.025280240251477636, "beta1": 0.9685709044287567, "beta2": 0.9999722891288026, "epsilon": 0.000678112574246387, "use_nesterov": false, "adamw_weight_decay": 0.0004764889253591128, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.03915269710353214, "constant_fraction": 0.7599238433827221}, {"learning_rate": 0.0838107131144011, "beta1": 0.6465530162024407, "beta2": 0.9994950278679391, "epsilon": 1.48301970962777, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.001887794609143935, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.00031573077676983244, "constant_fraction": 0.8548415821352753}, {"learning_rate": 0.02054286890327074, "beta1": 0.9877670902941115, "beta2": 0.9852930265352053, "epsilon": 0.00039436078475850076, "use_nesterov": true, "adamw_weight_decay": 0.012277809700643332, "l2_weight_decay": 1.0649147421051284e-05, "warmup_fraction": 0.005358924866864834, "min_learning_rate_mult": 0.014228942660940727, "constant_fraction": 0.8994159919824555}, {"learning_rate": 0.131654846159424, "beta1": 0.9966824188358862, "beta2": 0.999526000842444, "epsilon": 2.964640956629712e-05, "use_nesterov": true, "adamw_weight_decay": 0.043179160765076476, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2506522643438923}, {"learning_rate": 0.22551414281153115, "beta1": 0.9936754930401867, "beta2": 0.9994364737437058, "epsilon": 0.05306339389848217, "use_nesterov": false, "adamw_weight_decay": 0.016538840243138016, "l2_weight_decay": 0.0, "warmup_fraction": 3.7249729843709355e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8192689167995213}, {"learning_rate": 0.4429944509815205, "beta1": 0.9437506975702864, "beta2": 0.9355087884378893, "epsilon": 2.334747095254199e-08, "use_nesterov": true, "adamw_weight_decay": 8.325394090732559e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.702224870887491}, {"learning_rate": 0.10727056375654975, "beta1": 0.9338851352878516, "beta2": 0.7285573474584601, "epsilon": 33.54777391702044, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0016884440003315595, "warmup_fraction": 0.00014103820609793162, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8958530580688326}, {"learning_rate": 0.0005303069676563245, "beta1": 0.9621341643346931, "beta2": 0.9993116629222081, "epsilon": 0.09999215169210834, "use_nesterov": true, "adamw_weight_decay": 5.1729753258383984e-05, "l2_weight_decay": 0.008210068531626587, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0005941064280093637, "constant_fraction": 0.36505927401884497}, {"learning_rate": 0.0012460765566757628, "beta1": 0.9643737174454002, "beta2": 0.9998970009191583, "epsilon": 0.7393180530477765, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0015432577526591311, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.31651839204989307}, {"learning_rate": 0.06219107635281434, "beta1": 0.8010432473176429, "beta2": 0.9999707385274426, "epsilon": 188.65074602003935, "use_nesterov": false, "adamw_weight_decay": 3.2419902781091713e-05, "l2_weight_decay": 0.00023224635613909244, "warmup_fraction": 0.015013450416739972, "min_learning_rate_mult": 0.0, "constant_fraction": 0.21547179185316356}, {"learning_rate": 0.0003443777602351824, "beta1": 0.9915654973366053, "beta2": 0.6381678252221719, "epsilon": 0.02620529779627119, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00014877396306796505, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.02818818328858964, "constant_fraction": 0.1914227985969419}, {"learning_rate": 0.10219194968124987, "beta1": 0.9637535186893267, "beta2": 0.999989260028841, "epsilon": 3972.158489508664, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0011216391542219477, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.6411645077341968, "constant_fraction": 0.7249442054457736}, {"learning_rate": 0.004553127917916583, "beta1": 0.9483489528010572, "beta2": 0.997487332805381, "epsilon": 0.006446247551468225, "use_nesterov": true, "adamw_weight_decay": 0.05245008863087847, "l2_weight_decay": 0.031554511906965885, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.015647754402206584, "constant_fraction": 0.02427292894872657}, {"learning_rate": 0.006688303553773934, "beta1": 0.9982073016834572, "beta2": 0.999985493640601, "epsilon": 6.044453176351436e-06, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00011156333270935727, "warmup_fraction": 1.726101276965304e-05, "min_learning_rate_mult": 0.0005978122720319491, "constant_fraction": 0.1532730918028029}, {"learning_rate": 0.04092642409399911, "beta1": 0.2606527850099992, "beta2": 0.992882565612852, "epsilon": 1.1220814525317918e-07, "use_nesterov": false, "adamw_weight_decay": 1.5041844313088449e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.00017502721457559293, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6849503552291991}, {"learning_rate": 0.0028537812957163864, "beta1": 0.9447978222726168, "beta2": 0.9909012574988224, "epsilon": 110.68057099926948, "use_nesterov": false, "adamw_weight_decay": 6.780158467720605e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0004545797885995719, "min_learning_rate_mult": 0.0047169504918863165, "constant_fraction": 0.3342798181039828}, {"learning_rate": 0.29935447172029467, "beta1": 0.7295300358539047, "beta2": 0.8670410828628053, "epsilon": 13.534222612087172, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.000271265972243285, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.020258565989631737, "constant_fraction": 0.334338861229867}, {"learning_rate": 0.5385759009797144, "beta1": 0.9470203460325338, "beta2": 0.997778860128218, "epsilon": 871.116097556107, "use_nesterov": false, "adamw_weight_decay": 0.011221904300546308, "l2_weight_decay": 3.9522238220698104e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8705582191442393}, {"learning_rate": 0.02770844564248992, "beta1": 0.9673072799568008, "beta2": 0.9877183119723905, "epsilon": 3.0478113934935905e-08, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.005805611691690909, "warmup_fraction": 0.0, "min_learning_rate_mult": 7.619568775120942e-05, "constant_fraction": 0.1607415045027396}, {"learning_rate": 0.0077481757580766, "beta1": 0.9980456679452893, "beta2": 0.9999893050394703, "epsilon": 2.146978965643919e-05, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.013677035077798867, "warmup_fraction": 0.00018919963078531653, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7763799962626241}, {"learning_rate": 0.005789833052900052, "beta1": 0.9963443630921962, "beta2": 0.985965250899819, "epsilon": 2.8882104471596835e-05, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 6.960252456418762e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0012208917324629954, "constant_fraction": 0.5832703174135823}, {"learning_rate": 0.33304879602168547, "beta1": 0.9974057293154148, "beta2": 0.9999718609215839, "epsilon": 5020.159033552083, "use_nesterov": true, "adamw_weight_decay": 0.019702976515631517, "l2_weight_decay": 0.0003208285377299527, "warmup_fraction": 0.0017546243261260433, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8569937176977647}, {"learning_rate": 0.0004327925790844308, "beta1": 0.9690658494404186, "beta2": 0.7430751656836675, "epsilon": 0.1333456539793139, "use_nesterov": false, "adamw_weight_decay": 0.08231039858983227, "l2_weight_decay": 0.0, "warmup_fraction": 3.5033586825666905e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.35456351478708314}, {"learning_rate": 0.0017372022974910541, "beta1": 0.982337904618048, "beta2": 0.9313762240801586, "epsilon": 0.0010190142012240601, "use_nesterov": true, "adamw_weight_decay": 0.016186377619840625, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2840274116154239}, {"learning_rate": 0.023561786696088213, "beta1": 0.9091252630599947, "beta2": 0.9118763408112831, "epsilon": 1.242126509196598e-08, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.015904783825505326, "warmup_fraction": 0.0, "min_learning_rate_mult": 1.8433213353771832e-05, "constant_fraction": 0.0144082340972157}, {"learning_rate": 0.36644290710023925, "beta1": 0.8623858414647336, "beta2": 0.968923492918848, "epsilon": 241.71386845885172, "use_nesterov": false, "adamw_weight_decay": 0.0035157144188948373, "l2_weight_decay": 0.0, "warmup_fraction": 5.7344633627101944e-05, "min_learning_rate_mult": 0.10729228474868995, "constant_fraction": 0.6452918527041421}, {"learning_rate": 0.7008132563616294, "beta1": 0.9878592480323491, "beta2": 0.9256588369827702, "epsilon": 18.53519404968476, "use_nesterov": false, "adamw_weight_decay": 0.025168252642697102, "l2_weight_decay": 0.0, "warmup_fraction": 1.6460083103458405e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.48642320213556256}, {"learning_rate": 0.48372352970151816, "beta1": 0.9090155316640738, "beta2": 0.9999884118024664, "epsilon": 0.001151461458628565, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 5.2878261366441576e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.02165116322477023}, {"learning_rate": 0.00020225634187668405, "beta1": 0.7496316680952213, "beta2": 0.49042440060465453, "epsilon": 0.00011677092260710994, "use_nesterov": false, "adamw_weight_decay": 0.0524640322770648, "l2_weight_decay": 0.006008794364428511, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7562738292129023}, {"learning_rate": 0.0016533010683733877, "beta1": 0.3254475099356062, "beta2": 0.4297686511472817, "epsilon": 0.001984269295556009, "use_nesterov": true, "adamw_weight_decay": 0.003363402434071319, "l2_weight_decay": 0.019433564642694183, "warmup_fraction": 1.687324038905163e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8104351866668116}, {"learning_rate": 0.046825896404436865, "beta1": 0.9790825817933471, "beta2": 0.9995445382356376, "epsilon": 6.125121597650108e-07, "use_nesterov": false, "adamw_weight_decay": 5.100076135070402e-05, "l2_weight_decay": 0.01952088165537641, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.054030232004832236, "constant_fraction": 0.021975992313512105}, {"learning_rate": 0.16677387000589103, "beta1": 0.9871726368638661, "beta2": 0.9994606933147668, "epsilon": 2.3211576724011113e-06, "use_nesterov": false, "adamw_weight_decay": 0.000267455682008456, "l2_weight_decay": 0.0040525724537173085, "warmup_fraction": 0.0002508406967344943, "min_learning_rate_mult": 0.0, "constant_fraction": 0.3634201157153999}, {"learning_rate": 0.047295874752145084, "beta1": 0.9775785954248002, "beta2": 0.8361770657369894, "epsilon": 5.258076466034855, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.011587961571459469, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.31693848415917447}, {"learning_rate": 0.3301151442111616, "beta1": 0.9250552393356208, "beta2": 0.9999738772185292, "epsilon": 0.05981018936387042, "use_nesterov": false, "adamw_weight_decay": 0.00018615740415244223, "l2_weight_decay": 0.01495511753755806, "warmup_fraction": 2.7238063587520665e-05, "min_learning_rate_mult": 0.015245992471951152, "constant_fraction": 0.9996181549582421}, {"learning_rate": 0.0023809290451303057, "beta1": 0.905825649306108, "beta2": 0.5918549197866138, "epsilon": 0.0477701314910599, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0006128454973817304, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.3758131589373942}, {"learning_rate": 0.0278647581360894, "beta1": 0.7707837210283497, "beta2": 0.27146500226502457, "epsilon": 7.908614842979522e-05, "use_nesterov": true, "adamw_weight_decay": 0.0003649107185929682, "l2_weight_decay": 2.0161008990883107e-05, "warmup_fraction": 0.0001550150927655711, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2363174770675318}, {"learning_rate": 0.013668063350747968, "beta1": 0.9986787452822233, "beta2": 0.9995258187267485, "epsilon": 1.8702151329534609e-06, "use_nesterov": false, "adamw_weight_decay": 0.0009431503660976783, "l2_weight_decay": 0.0, "warmup_fraction": 1.4586587338820387e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7624100487397523}, {"learning_rate": 0.06657639947550524, "beta1": 0.9985511876959209, "beta2": 0.977828557998213, "epsilon": 3.4436985382282893e-07, "use_nesterov": true, "adamw_weight_decay": 0.00012671429844426498, "l2_weight_decay": 0.0, "warmup_fraction": 0.006079617888457069, "min_learning_rate_mult": 0.001604462899760954, "constant_fraction": 0.7675467516519692}, {"learning_rate": 0.0038133143170788054, "beta1": 0.7492477457906155, "beta2": 0.9406919427293288, "epsilon": 0.00033088903636754364, "use_nesterov": false, "adamw_weight_decay": 0.01589964885560454, "l2_weight_decay": 0.014916604923284485, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.00016651767303288946, "constant_fraction": 0.02737022461774874}, {"learning_rate": 0.3367821291043801, "beta1": 0.9524980607011501, "beta2": 0.9996863967161917, "epsilon": 0.0009046418501331737, "use_nesterov": true, "adamw_weight_decay": 0.002543431875978067, "l2_weight_decay": 0.00019423347759966547, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.0028913438955439075}, {"learning_rate": 0.1754631134707925, "beta1": 0.9554902372489301, "beta2": 0.9985964219070712, "epsilon": 4.3673900504515244e-07, "use_nesterov": true, "adamw_weight_decay": 3.317227636456343e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.04620676047025919, "min_learning_rate_mult": 0.00033257478590026336, "constant_fraction": 0.49429442829867687}, {"learning_rate": 0.6668003113933759, "beta1": 0.9686812039577606, "beta2": 0.9995541251619776, "epsilon": 1.698903158327959e-06, "use_nesterov": false, "adamw_weight_decay": 0.06726358805333882, "l2_weight_decay": 0.04515815331388229, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.15561315966137462, "constant_fraction": 0.06716830213314051}, {"learning_rate": 0.05995074858978631, "beta1": 0.9490495584014185, "beta2": 0.667998094090951, "epsilon": 6859.06714404996, "use_nesterov": true, "adamw_weight_decay": 0.00025570261696060485, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 8.968787859331875e-05, "constant_fraction": 0.42258470374428714}, {"learning_rate": 0.8887859791582561, "beta1": 0.9584391293690215, "beta2": 0.999879008416271, "epsilon": 0.0025803622574945883, "use_nesterov": true, "adamw_weight_decay": 0.0021600912651529463, "l2_weight_decay": 0.00189947718509891, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6440429904681843}, {"learning_rate": 0.39441573081737796, "beta1": 0.6173437763654944, "beta2": 0.5626398171118911, "epsilon": 13.147258314103503, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.013461730861940798, "warmup_fraction": 2.9250419964102373e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5473911960274326}, {"learning_rate": 0.06027690378346685, "beta1": 0.5279152282546589, "beta2": 0.9994832240192252, "epsilon": 0.00010374077866748973, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.006609991047030713, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7947465321058239}, {"learning_rate": 0.3136347149956882, "beta1": 0.8878481457312091, "beta2": 0.9999816424067114, "epsilon": 2.8740464308600017e-05, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.013245065916416254, "warmup_fraction": 4.5097404284098764e-05, "min_learning_rate_mult": 0.0933859842611187, "constant_fraction": 0.25933746855309614}, {"learning_rate": 0.0835371454743225, "beta1": 0.8389167058306451, "beta2": 0.9976174711518323, "epsilon": 0.016134863358299417, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.011033299621293584, "warmup_fraction": 0.0006472529701250368, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5533734269637456}, {"learning_rate": 0.04985475739311088, "beta1": 0.9172813454726811, "beta2": 0.9992938620124079, "epsilon": 8.981060436609483e-08, "use_nesterov": true, "adamw_weight_decay": 0.0006521656067860081, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.00028247056845258665, "constant_fraction": 0.7436005911157851}, {"learning_rate": 0.004584946479652896, "beta1": 0.984618307841541, "beta2": 0.99867425772834, "epsilon": 0.6513314980981108, "use_nesterov": true, "adamw_weight_decay": 0.00656461587643647, "l2_weight_decay": 0.0, "warmup_fraction": 0.022339609799585176, "min_learning_rate_mult": 0.0, "constant_fraction": 0.23119255141657546}, {"learning_rate": 0.02698315737452664, "beta1": 0.9966410779019276, "beta2": 0.9937875307781808, "epsilon": 0.007943882046691818, "use_nesterov": false, "adamw_weight_decay": 0.00020434984644541015, "l2_weight_decay": 0.0, "warmup_fraction": 0.021729183962972104, "min_learning_rate_mult": 0.43972157436041, "constant_fraction": 0.2580386514214691}, {"learning_rate": 0.001125398101323347, "beta1": 0.9987056855293349, "beta2": 0.9999378844228235, "epsilon": 0.391178418428464, "use_nesterov": true, "adamw_weight_decay": 0.058732307180066966, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.001693244833379363, "constant_fraction": 0.7513900018533294}, {"learning_rate": 0.00011140347014868668, "beta1": 0.9859574682067698, "beta2": 0.9805563444191531, "epsilon": 0.005782444272796924, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.012155070903546743, "warmup_fraction": 0.0005772673444947373, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5457168557927827}, {"learning_rate": 0.0008731214312661583, "beta1": 0.996436844620599, "beta2": 0.4856436590866604, "epsilon": 0.000624938004931852, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.003837087856488632, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0007260620404277924, "constant_fraction": 0.15097718083209788}, {"learning_rate": 0.006872996242162062, "beta1": 0.9169597844259907, "beta2": 0.9997835119658569, "epsilon": 1041.0953030742373, "use_nesterov": true, "adamw_weight_decay": 4.410761051021962e-05, "l2_weight_decay": 0.00026370309634584515, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.20051016129851146, "constant_fraction": 0.8423180076336422}, {"learning_rate": 0.0004201802240582025, "beta1": 0.990834763802036, "beta2": 0.9862330059650068, "epsilon": 0.30313264253485583, "use_nesterov": true, "adamw_weight_decay": 0.0014428806891222034, "l2_weight_decay": 0.0001437946355170288, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.34220755137217385}, {"learning_rate": 2.8403433803148767e-05, "beta1": 0.3407473841139177, "beta2": 0.9999882398078606, "epsilon": 1738.779479396756, "use_nesterov": false, "adamw_weight_decay": 6.306877730205347e-05, "l2_weight_decay": 3.0154717108607436e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7085899040614267}, {"learning_rate": 0.2114693964522307, "beta1": 0.9158861098585881, "beta2": 0.9912890739859026, "epsilon": 1.075990329256662e-07, "use_nesterov": false, "adamw_weight_decay": 0.00010790470074937376, "l2_weight_decay": 2.1494514420873464e-05, "warmup_fraction": 0.000609167155102501, "min_learning_rate_mult": 0.0004667696683897301, "constant_fraction": 0.14577721208900407}, {"learning_rate": 0.01861904981450399, "beta1": 0.9988086436633122, "beta2": 0.9999899567620552, "epsilon": 2.3291476495539785, "use_nesterov": false, "adamw_weight_decay": 0.03150436127577518, "l2_weight_decay": 0.0010071157065768075, "warmup_fraction": 0.0, "min_learning_rate_mult": 1.876870070060126e-05, "constant_fraction": 0.828246374354574}, {"learning_rate": 0.31299550807775334, "beta1": 0.858327317795561, "beta2": 0.44744061549147207, "epsilon": 3.1620773310937225e-08, "use_nesterov": true, "adamw_weight_decay": 0.02125783526758575, "l2_weight_decay": 7.507416245703697e-05, "warmup_fraction": 0.09409871943043953, "min_learning_rate_mult": 0.0, "constant_fraction": 0.37929004806499134}, {"learning_rate": 0.038238845487270995, "beta1": 0.9855992982301374, "beta2": 0.454837529422943, "epsilon": 0.0001708790846617894, "use_nesterov": false, "adamw_weight_decay": 4.548924462690162e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.34872158651888197}, {"learning_rate": 0.0011004752842778951, "beta1": 0.7866624253080114, "beta2": 0.9999840790956753, "epsilon": 0.34456354552456026, "use_nesterov": false, "adamw_weight_decay": 0.05303466064350949, "l2_weight_decay": 0.0, "warmup_fraction": 0.07268472541761435, "min_learning_rate_mult": 0.0008631118564768212, "constant_fraction": 0.1448256483369572}, {"learning_rate": 0.30005261297780783, "beta1": 0.992716961829122, "beta2": 0.9999597933075914, "epsilon": 2.667694756454634e-05, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0003367232274234232, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.04052462987798559, "constant_fraction": 0.5079904008966848}, {"learning_rate": 0.000466676754694087, "beta1": 0.9944930222689273, "beta2": 0.9993380513000001, "epsilon": 1.2610292878690257, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 6.436488058199524e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 5.9723417295201795e-05, "constant_fraction": 0.4119522133488872}, {"learning_rate": 0.6244950036270002, "beta1": 0.9859146363285608, "beta2": 0.9999828424447572, "epsilon": 5.997964118789791, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 6.021432136844076e-05, "warmup_fraction": 0.038436110323877865, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8573246252956911}, {"learning_rate": 0.0018948318787109849, "beta1": 0.9962685184787237, "beta2": 0.9988587731583137, "epsilon": 7163.864455480194, "use_nesterov": false, "adamw_weight_decay": 0.07399306110937089, "l2_weight_decay": 0.0, "warmup_fraction": 0.0040679589546772105, "min_learning_rate_mult": 0.00458579251358751, "constant_fraction": 0.8764714884862916}, {"learning_rate": 0.016995678554690943, "beta1": 0.9351347833863599, "beta2": 0.9964974972967524, "epsilon": 3.793140187975404e-06, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.058907741316623685, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.34785361775998247}, {"learning_rate": 0.0010389504095032176, "beta1": 0.9413689697150365, "beta2": 0.993473242887443, "epsilon": 7362.873650979379, "use_nesterov": false, "adamw_weight_decay": 0.0015223393543994553, "l2_weight_decay": 0.0, "warmup_fraction": 0.0015511184093374294, "min_learning_rate_mult": 0.24424963324543303, "constant_fraction": 0.8387344829263127}, {"learning_rate": 0.07928802322811165, "beta1": 0.9632593826719605, "beta2": 0.2661109977049073, "epsilon": 27.20130876202258, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.006210848203941328, "warmup_fraction": 0.06355197954304927, "min_learning_rate_mult": 0.001036708566020025, "constant_fraction": 0.4656963739937563}, {"learning_rate": 0.012026517264052686, "beta1": 0.9983552654183508, "beta2": 0.9999064061245823, "epsilon": 0.1726256363671029, "use_nesterov": false, "adamw_weight_decay": 0.05570858193400012, "l2_weight_decay": 0.09382761559874786, "warmup_fraction": 7.665607905625367e-05, "min_learning_rate_mult": 1.7186399698160296e-05, "constant_fraction": 0.3558824970506035}, {"learning_rate": 0.00025119967158780074, "beta1": 0.9682529880139529, "beta2": 0.9386724319479858, "epsilon": 133.4948640239797, "use_nesterov": true, "adamw_weight_decay": 0.04207800088769654, "l2_weight_decay": 0.0003673237515137192, "warmup_fraction": 0.0, "min_learning_rate_mult": 3.388390425144935e-05, "constant_fraction": 0.4552820932392191}, {"learning_rate": 0.007176467412618538, "beta1": 0.9907853958327537, "beta2": 0.5266113360150725, "epsilon": 500.43925353131186, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.008990085539639156, "warmup_fraction": 0.006631426639598046, "min_learning_rate_mult": 0.00010843864119007111, "constant_fraction": 0.2913104978765829}, {"learning_rate": 0.013370480517047728, "beta1": 0.9964948340445584, "beta2": 0.9998352592071472, "epsilon": 416.3682216687159, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00010382580694984943, "warmup_fraction": 0.02118347181274819, "min_learning_rate_mult": 0.0, "constant_fraction": 0.3379334877455237}, {"learning_rate": 9.163183955919964e-05, "beta1": 0.9677042373862264, "beta2": 0.6729982710089979, "epsilon": 1.3804560330792302e-08, "use_nesterov": false, "adamw_weight_decay": 0.06367706478419946, "l2_weight_decay": 0.0, "warmup_fraction": 0.00019773592908685987, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8939133780939167}, {"learning_rate": 4.3488207848878524e-05, "beta1": 0.8924614804542979, "beta2": 0.9994916304525914, "epsilon": 30.235800870436783, "use_nesterov": false, "adamw_weight_decay": 0.003059481130544422, "l2_weight_decay": 3.3853784718720135e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.01376996261299286, "constant_fraction": 0.6537445412372384}, {"learning_rate": 9.069325177866014e-05, "beta1": 0.9851008974007976, "beta2": 0.9780316396176365, "epsilon": 1024.0531503132452, "use_nesterov": true, "adamw_weight_decay": 3.2688794853610166e-05, "l2_weight_decay": 5.488124141531666e-05, "warmup_fraction": 3.654585103476019e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6562452848006932}, {"learning_rate": 0.1375101296033968, "beta1": 0.7145297311287678, "beta2": 0.6846157308142673, "epsilon": 462.4154053799867, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00014298311668644437, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.000189400109201416, "constant_fraction": 0.9748356947280172}, {"learning_rate": 1.5937070603492694e-05, "beta1": 0.9888680062250855, "beta2": 0.9639267398420464, "epsilon": 883.7242604567668, "use_nesterov": false, "adamw_weight_decay": 0.00012023510928971041, "l2_weight_decay": 0.0, "warmup_fraction": 1.1739824252376392e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.807666843845354}, {"learning_rate": 0.820934760438444, "beta1": 0.9431295736458315, "beta2": 0.9998839539724373, "epsilon": 0.000907977289490479, "use_nesterov": true, "adamw_weight_decay": 0.014676231524667545, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.43266275872318305}, {"learning_rate": 0.7753890414232453, "beta1": 0.41532499337850404, "beta2": 0.9997620032790744, "epsilon": 0.6197920933382269, "use_nesterov": false, "adamw_weight_decay": 0.06268590708680236, "l2_weight_decay": 0.0, "warmup_fraction": 0.0003578067325733004, "min_learning_rate_mult": 0.0, "constant_fraction": 0.33670027124600843}, {"learning_rate": 0.0006683558198140228, "beta1": 0.8384564175645739, "beta2": 0.9999736377673049, "epsilon": 4.674705855606126, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.012451490456871318, "warmup_fraction": 0.0, "min_learning_rate_mult": 1.1475082999257992e-05, "constant_fraction": 0.138192174792089}, {"learning_rate": 0.08129391209212311, "beta1": 0.5419168957465377, "beta2": 0.9577117900244295, "epsilon": 1.4922012110554835e-05, "use_nesterov": false, "adamw_weight_decay": 0.0007639046172491491, "l2_weight_decay": 0.04079660939183887, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7034824810904439}, {"learning_rate": 0.008406273859401275, "beta1": 0.9965740733813586, "beta2": 0.9999520234675126, "epsilon": 3.2319639547429357, "use_nesterov": false, "adamw_weight_decay": 0.019051061170028957, "l2_weight_decay": 0.0010424827797776925, "warmup_fraction": 0.006413421980387978, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5864817407608234}, {"learning_rate": 0.6226583194004327, "beta1": 0.8566779532152214, "beta2": 0.9999455839788711, "epsilon": 100.75980593288277, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0002825452414836558, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9237910794610038}, {"learning_rate": 0.1488100966121965, "beta1": 0.926921896057771, "beta2": 0.2614055971473538, "epsilon": 4.956584152652382e-05, "use_nesterov": true, "adamw_weight_decay": 0.0005433445585306165, "l2_weight_decay": 0.00468632659334109, "warmup_fraction": 0.03743363110418479, "min_learning_rate_mult": 0.0, "constant_fraction": 0.59333401696363}, {"learning_rate": 4.7659066087437245e-05, "beta1": 0.998952263075961, "beta2": 0.9997457660445163, "epsilon": 3.5908924701527253e-06, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.04815636444880412, "warmup_fraction": 0.0, "min_learning_rate_mult": 7.887315937201103e-05, "constant_fraction": 0.5406115689168121}, {"learning_rate": 0.05130707976484287, "beta1": 0.9980448826815751, "beta2": 0.9999893077511991, "epsilon": 47.55738470772021, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00012420319818282576, "warmup_fraction": 0.00023193485585274544, "min_learning_rate_mult": 0.0, "constant_fraction": 0.48717990334389416}, {"learning_rate": 0.09114732165134878, "beta1": 0.9982883682712059, "beta2": 0.9682688810303828, "epsilon": 9.446214515861679e-08, "use_nesterov": false, "adamw_weight_decay": 0.00795504224273, "l2_weight_decay": 0.0, "warmup_fraction": 0.00017783399145797617, "min_learning_rate_mult": 0.0, "constant_fraction": 0.625786950733936}, {"learning_rate": 0.001156232648214024, "beta1": 0.9979092862997715, "beta2": 0.99998351410326, "epsilon": 0.4928768834095508, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00022204982474261317, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.34265946456084045, "constant_fraction": 0.7114425971940492}, {"learning_rate": 0.8068101895575366, "beta1": 0.9735998751695841, "beta2": 0.9999859458322505, "epsilon": 1.4000135746540062e-07, "use_nesterov": true, "adamw_weight_decay": 3.2026471972770275e-05, "l2_weight_decay": 0.0033590712452769384, "warmup_fraction": 0.00016104434280870636, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5804675186403739}, {"learning_rate": 0.05056553040393424, "beta1": 0.4490949867715822, "beta2": 0.73560633518602, "epsilon": 0.0006765168239286473, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0002115172365790771, "warmup_fraction": 0.0033453644936483557, "min_learning_rate_mult": 5.4346524615227444e-05, "constant_fraction": 0.1761198298239398}, {"learning_rate": 8.034752425579177e-05, "beta1": 0.9934138080489328, "beta2": 0.2680253644218573, "epsilon": 0.004220754454743408, "use_nesterov": false, "adamw_weight_decay": 0.0006114064599721975, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.05722163157051493, "constant_fraction": 0.9309013199451506}, {"learning_rate": 0.00010895918455029036, "beta1": 0.9529452045486783, "beta2": 0.9992954809220868, "epsilon": 1.2013004773477416, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0024294358732730873, "warmup_fraction": 7.306422827517748e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6278753110706454}, {"learning_rate": 0.0004903019107001204, "beta1": 0.9904628695781644, "beta2": 0.9998924485656415, "epsilon": 3144.330429958289, "use_nesterov": false, "adamw_weight_decay": 0.010613350601533053, "l2_weight_decay": 0.003752447561034353, "warmup_fraction": 0.0005906692774193561, "min_learning_rate_mult": 0.0, "constant_fraction": 0.17732130796621304}, {"learning_rate": 0.004506519824219216, "beta1": 0.7702861898821542, "beta2": 0.9801331369569521, "epsilon": 0.013711248660870558, "use_nesterov": true, "adamw_weight_decay": 1.0179935038086953e-05, "l2_weight_decay": 0.049671108852348614, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.09914024777188912}, {"learning_rate": 0.07551042615602264, "beta1": 0.5622441726404451, "beta2": 0.9953982654922727, "epsilon": 0.3969869809583905, "use_nesterov": true, "adamw_weight_decay": 1.9942242017511656e-05, "l2_weight_decay": 0.00044508461218179787, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.003805148699141289, "constant_fraction": 0.7590367030036856}, {"learning_rate": 0.02503839928534141, "beta1": 0.9985578970809886, "beta2": 0.9995395007193929, "epsilon": 0.01664027877812291, "use_nesterov": false, "adamw_weight_decay": 0.00010884876232276745, "l2_weight_decay": 1.287394600748136e-05, "warmup_fraction": 0.04469063063573968, "min_learning_rate_mult": 0.0, "constant_fraction": 0.012621199182168752}, {"learning_rate": 2.2053470970740652e-05, "beta1": 0.4266967179861224, "beta2": 0.9989066679443313, "epsilon": 0.0001270011704185884, "use_nesterov": false, "adamw_weight_decay": 0.024731211564005325, "l2_weight_decay": 0.0, "warmup_fraction": 0.00014785141184924083, "min_learning_rate_mult": 0.0, "constant_fraction": 0.559607084059825}, {"learning_rate": 0.00032062353110472945, "beta1": 0.994115758047093, "beta2": 0.9990085432853842, "epsilon": 6.586068697307845e-07, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.012448617572696214, "warmup_fraction": 0.08682970711209027, "min_learning_rate_mult": 8.19346549681992e-05, "constant_fraction": 0.1784197818238772}, {"learning_rate": 0.002002672427786374, "beta1": 0.6794301680528645, "beta2": 0.9988881081174189, "epsilon": 0.0001385896134479562, "use_nesterov": false, "adamw_weight_decay": 1.6419323276977053e-05, "l2_weight_decay": 0.0009487353020141956, "warmup_fraction": 0.00126667317508435, "min_learning_rate_mult": 0.006065566717226003, "constant_fraction": 0.6043460669575206}, {"learning_rate": 1.532091965875813e-05, "beta1": 0.9070245950991649, "beta2": 0.9819903919107402, "epsilon": 2707.6601865531975, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 5.9600057359861434e-05, "warmup_fraction": 0.002987049960720601, "min_learning_rate_mult": 0.004574543833880066, "constant_fraction": 0.5506961177964221}, {"learning_rate": 0.07576019071553294, "beta1": 0.9372904884336007, "beta2": 0.9999790371750418, "epsilon": 1.4630415645090063e-05, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.007206052798016881, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5269064143089695}, {"learning_rate": 1.3145889095174035e-05, "beta1": 0.9587266795780162, "beta2": 0.9999665680253814, "epsilon": 0.28672759340962917, "use_nesterov": false, "adamw_weight_decay": 0.012072919386601823, "l2_weight_decay": 0.0010279108876173374, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6676854671734553}, {"learning_rate": 0.007310827306090061, "beta1": 0.9983631821652917, "beta2": 0.9995941362042182, "epsilon": 1975.4060219138514, "use_nesterov": false, "adamw_weight_decay": 0.005686351516501697, "l2_weight_decay": 0.0018899654455264282, "warmup_fraction": 8.543474113764858e-05, "min_learning_rate_mult": 0.18785529503216486, "constant_fraction": 0.6812241096106758}, {"learning_rate": 0.02784974620772499, "beta1": 0.6989758782999029, "beta2": 0.9999893111140546, "epsilon": 0.6721009253216835, "use_nesterov": false, "adamw_weight_decay": 3.624673167970563e-05, "l2_weight_decay": 0.011215220139316286, "warmup_fraction": 0.006914192390026763, "min_learning_rate_mult": 0.0118129012805374, "constant_fraction": 0.600432272301936}, {"learning_rate": 0.00011488375816680019, "beta1": 0.9856406647185606, "beta2": 0.4001259285474583, "epsilon": 2.2233133731065197e-08, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.012116516825550523, "warmup_fraction": 3.919814900817333e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.3751372383732231}, {"learning_rate": 0.019684724307589364, "beta1": 0.998297388248413, "beta2": 0.9998632770926416, "epsilon": 843.4209708745113, "use_nesterov": false, "adamw_weight_decay": 0.00038629022979604804, "l2_weight_decay": 0.0, "warmup_fraction": 2.0108955165475032e-05, "min_learning_rate_mult": 0.03524821322630688, "constant_fraction": 0.561404094624595}, {"learning_rate": 0.08386951932989806, "beta1": 0.9954014649268009, "beta2": 0.9968700639324443, "epsilon": 81.97062736401037, "use_nesterov": false, "adamw_weight_decay": 0.0003695467366388471, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.285027683925935, "constant_fraction": 0.3659759457806968}, {"learning_rate": 0.2814008861826485, "beta1": 0.9988013634248339, "beta2": 0.9999373051097881, "epsilon": 84.38330480681157, "use_nesterov": true, "adamw_weight_decay": 4.8751996322373095e-05, "l2_weight_decay": 0.000949454240953452, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6516227331885169}, {"learning_rate": 0.03598365905038542, "beta1": 0.9985425108015832, "beta2": 0.9991791358078623, "epsilon": 0.5677370372971922, "use_nesterov": true, "adamw_weight_decay": 1.2873464949502165e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.002454794416634076, "constant_fraction": 0.7722976114370796}, {"learning_rate": 1.4219589202193695e-05, "beta1": 0.9913987404180445, "beta2": 0.9999888020313752, "epsilon": 0.013206843562851647, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 7.333198967558657e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.1174641502309588}, {"learning_rate": 6.699501358932056e-05, "beta1": 0.718549685504354, "beta2": 0.9999360021233121, "epsilon": 0.9599227637228999, "use_nesterov": false, "adamw_weight_decay": 0.001512220502534823, "l2_weight_decay": 0.0006796496423098444, "warmup_fraction": 7.463411289057901e-05, "min_learning_rate_mult": 0.36030967912977696, "constant_fraction": 0.5542887986007424}, {"learning_rate": 1.022049063371937e-05, "beta1": 0.02458838078187997, "beta2": 0.9450989404018092, "epsilon": 0.01987828189998521, "use_nesterov": true, "adamw_weight_decay": 0.00010178613079332301, "l2_weight_decay": 0.01995353874971719, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.06680249227165856, "constant_fraction": 0.4317292903218336}, {"learning_rate": 0.09457308499245332, "beta1": 0.7630603853391921, "beta2": 0.9860780454161263, "epsilon": 4.119708660708564e-05, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0005933250865955295, "warmup_fraction": 0.0, "min_learning_rate_mult": 3.643076323833318e-05, "constant_fraction": 0.9043500753054071}, {"learning_rate": 1.3345657257695992e-05, "beta1": 0.9986096184836969, "beta2": 0.9990117364536384, "epsilon": 8.492822907577073e-06, "use_nesterov": true, "adamw_weight_decay": 3.690769607897085e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.10487527461686699, "constant_fraction": 0.6105992554607647}, {"learning_rate": 0.0002657936798247948, "beta1": 0.029247913570183526, "beta2": 0.6661844223993723, "epsilon": 0.00010107818723345976, "use_nesterov": false, "adamw_weight_decay": 6.371378741079396e-05, "l2_weight_decay": 0.05307119063100354, "warmup_fraction": 0.020026029618414546, "min_learning_rate_mult": 0.0, "constant_fraction": 0.1350559189749928}, {"learning_rate": 0.00014543029407501444, "beta1": 0.9945689074268044, "beta2": 0.9971026146203898, "epsilon": 118.41123650367041, "use_nesterov": true, "adamw_weight_decay": 1.455172856235826e-05, "l2_weight_decay": 0.0002833592582148114, "warmup_fraction": 0.0065112295646424226, "min_learning_rate_mult": 0.821894655162309, "constant_fraction": 0.30594539179558}, {"learning_rate": 5.9379696444596155e-05, "beta1": 0.9989396564733413, "beta2": 0.8715139695378881, "epsilon": 9.48167516141664, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.005676995402963017, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5817003967677096}, {"learning_rate": 1.0673643333922883e-05, "beta1": 0.8932106935951781, "beta2": 0.9999755152585608, "epsilon": 4.6728499853910525e-05, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.001065905768247375, "warmup_fraction": 4.6120136744985675e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.031605183217433885}, {"learning_rate": 0.00019693820757923545, "beta1": 0.9820043428452243, "beta2": 0.12514592157859306, "epsilon": 203.6348720100544, "use_nesterov": false, "adamw_weight_decay": 0.00039573027183869517, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0002475580854008591, "constant_fraction": 0.6490157144867111}, {"learning_rate": 0.04156438754653971, "beta1": 0.9788306128690641, "beta2": 0.8352099413756829, "epsilon": 6.36102492730566e-08, "use_nesterov": false, "adamw_weight_decay": 3.6174646256841996e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.00021339075911626647, "constant_fraction": 0.019482367794813382}, {"learning_rate": 0.004392100860985699, "beta1": 0.4647096616507018, "beta2": 0.9157118378487258, "epsilon": 4.253038248208292, "use_nesterov": true, "adamw_weight_decay": 0.09901714522300598, "l2_weight_decay": 0.0, "warmup_fraction": 3.1451174367219e-05, "min_learning_rate_mult": 0.00028977571396976513, "constant_fraction": 0.9657319753038562}, {"learning_rate": 0.06390182889531293, "beta1": 0.9926498622184026, "beta2": 0.9702498094785663, "epsilon": 1.212733505410799e-07, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0007178036670522372, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0011350199757023966, "constant_fraction": 0.6233573035690348}, {"learning_rate": 0.00018307011519830694, "beta1": 0.8813327288082196, "beta2": 0.9999588938425509, "epsilon": 0.00023041197805944273, "use_nesterov": true, "adamw_weight_decay": 0.0010321860796457807, "l2_weight_decay": 0.0, "warmup_fraction": 9.151064419747315e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.1726755227778367}, {"learning_rate": 0.09576883028865969, "beta1": 0.988175159040144, "beta2": 0.7069467561473605, "epsilon": 6106.545923552775, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.02675457260148463, "warmup_fraction": 0.0, "min_learning_rate_mult": 1.0126636945985122e-05, "constant_fraction": 0.25062457653584713}, {"learning_rate": 0.00032821449587901625, "beta1": 0.8983999232369745, "beta2": 0.9999843505661776, "epsilon": 719.7073400891419, "use_nesterov": false, "adamw_weight_decay": 0.0043808159621560264, "l2_weight_decay": 0.013819048169863138, "warmup_fraction": 0.0002587263948481761, "min_learning_rate_mult": 0.9597615274476176, "constant_fraction": 0.9520649790931932}, {"learning_rate": 0.00170199123487788, "beta1": 0.42108910067481764, "beta2": 0.9999519924920202, "epsilon": 0.008328344391494566, "use_nesterov": false, "adamw_weight_decay": 0.029597132654895268, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.4358263454930832, "constant_fraction": 0.26149943800159803}, {"learning_rate": 0.004288641021498701, "beta1": 0.9987931426613702, "beta2": 0.9483498193367184, "epsilon": 0.027576143205674915, "use_nesterov": true, "adamw_weight_decay": 0.000377348800390435, "l2_weight_decay": 0.06290963663890593, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.4204315528811393}, {"learning_rate": 0.00037580031953518133, "beta1": 0.9942306961872942, "beta2": 0.999734999202418, "epsilon": 0.0003103653131957618, "use_nesterov": false, "adamw_weight_decay": 0.000270814207733495, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.00026610886263314393, "constant_fraction": 0.550205688210136}, {"learning_rate": 0.09884405509034513, "beta1": 0.9776961521031857, "beta2": 0.9944116133188875, "epsilon": 8398.942336441169, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 3.090394366284513e-05, "warmup_fraction": 0.006297220331610897, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6966358214492594}, {"learning_rate": 0.00015605261390857234, "beta1": 0.9897750261410359, "beta2": 0.9998500208399087, "epsilon": 2.537549193243438, "use_nesterov": true, "adamw_weight_decay": 0.0009120384424226963, "l2_weight_decay": 2.1545570543629354e-05, "warmup_fraction": 1.5109965434587505e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8276071570858236}, {"learning_rate": 0.004018168181427074, "beta1": 0.9778311311392015, "beta2": 0.9999434260266665, "epsilon": 0.028286927783902727, "use_nesterov": false, "adamw_weight_decay": 0.0007447345691340124, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8388797278406646}, {"learning_rate": 2.5366691007794933e-05, "beta1": 0.9987401319928374, "beta2": 0.9970687915631368, "epsilon": 0.018459923787747898, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00016035637816339535, "warmup_fraction": 0.00012044680367320243, "min_learning_rate_mult": 0.0, "constant_fraction": 0.10989329654894453}, {"learning_rate": 0.7734178492568113, "beta1": 0.9508094957329636, "beta2": 0.9993309537397715, "epsilon": 0.11232924420289055, "use_nesterov": false, "adamw_weight_decay": 0.08387119822781336, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0009195946169865449, "constant_fraction": 0.8982004388047752}, {"learning_rate": 0.03539059499483128, "beta1": 0.9897005811321858, "beta2": 0.9885584762273593, "epsilon": 5226.142173529346, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00016536806409190246, "warmup_fraction": 0.012398298202629415, "min_learning_rate_mult": 0.0, "constant_fraction": 0.3051719886456191}, {"learning_rate": 7.68442643588484e-05, "beta1": 0.5729699458958615, "beta2": 0.9999795799797492, "epsilon": 5.670758404659329, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.033427810330456824, "warmup_fraction": 0.0026100965678541024, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7721265916326487}, {"learning_rate": 0.0007727545498124005, "beta1": 0.9972852221819988, "beta2": 0.9999831432714368, "epsilon": 0.0005881097561695584, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.014436360200516465, "warmup_fraction": 1.6287814941802814e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.4758876132164479}, {"learning_rate": 0.00016166792202977888, "beta1": 0.9899406438524726, "beta2": 0.9966581268696953, "epsilon": 0.0003685411272776454, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 3.7031088594585666e-05, "warmup_fraction": 0.0004844458637000725, "min_learning_rate_mult": 0.061714901543336066, "constant_fraction": 0.8151658302901095}, {"learning_rate": 0.02812138071166694, "beta1": 0.9978613243890624, "beta2": 0.9926010901603651, "epsilon": 78.53911008217045, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 2.1101918568037518e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.19615887258691378}, {"learning_rate": 4.493737539292717e-05, "beta1": 0.11752239287017752, "beta2": 0.9995537865053588, "epsilon": 724.1067060228979, "use_nesterov": false, "adamw_weight_decay": 0.011628645367230227, "l2_weight_decay": 0.0, "warmup_fraction": 0.004960925581712661, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6191129250791947}, {"learning_rate": 0.17265517895573837, "beta1": 0.9966666004861554, "beta2": 0.9952865066412435, "epsilon": 0.0183352251220297, "use_nesterov": true, "adamw_weight_decay": 0.00013065850511676102, "l2_weight_decay": 1.3937049755342298e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.000814443729075556, "constant_fraction": 0.34580163885855963}, {"learning_rate": 0.2733947744854976, "beta1": 0.972728959618751, "beta2": 0.45449056659740306, "epsilon": 1.9829055764517578e-07, "use_nesterov": false, "adamw_weight_decay": 0.06494276602354043, "l2_weight_decay": 0.012870757916308794, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.00011170516125826466, "constant_fraction": 0.22774622877736095}, {"learning_rate": 5.669629512214168e-05, "beta1": 0.9974620561608633, "beta2": 0.999962811178103, "epsilon": 5.186574566761839, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 2.9356369836208108e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.5935906546760441, "constant_fraction": 0.21981102942767772}, {"learning_rate": 2.4997453498776016e-05, "beta1": 0.9987069494728104, "beta2": 0.9992698395399476, "epsilon": 0.006141899856995343, "use_nesterov": false, "adamw_weight_decay": 0.010418859273212955, "l2_weight_decay": 0.0, "warmup_fraction": 0.00013507281964089432, "min_learning_rate_mult": 0.0, "constant_fraction": 0.08830464148151684}, {"learning_rate": 1.9924590725673e-05, "beta1": 0.3892497662083656, "beta2": 0.9999081872897078, "epsilon": 0.00018745768337454584, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0016882026959734074, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.008565199349248046, "constant_fraction": 0.36505564636565535}, {"learning_rate": 0.0009842189148135223, "beta1": 0.94651574759016, "beta2": 0.9998607262585981, "epsilon": 23.51252277517702, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00020620474522529397, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9164121098995625}, {"learning_rate": 4.0219774083301055e-05, "beta1": 0.3666709844577579, "beta2": 0.9157890905609376, "epsilon": 89.88931559786744, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 2.048988748488349e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0003565952838587183, "constant_fraction": 0.9448064452458975}, {"learning_rate": 1.1569804349583841e-05, "beta1": 0.9971325047316639, "beta2": 0.9996215377616267, "epsilon": 5.027361995116921e-07, "use_nesterov": true, "adamw_weight_decay": 0.001885262603101397, "l2_weight_decay": 0.000739054378372838, "warmup_fraction": 0.002822390200149852, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5940195015178741}, {"learning_rate": 1.0852603796458478e-05, "beta1": 0.3007600253127658, "beta2": 0.8759149792984013, "epsilon": 0.0033095976029413484, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.022657070428601055, "warmup_fraction": 0.0001271933140894986, "min_learning_rate_mult": 0.0, "constant_fraction": 0.23632711784202298}, {"learning_rate": 0.0007162633912253167, "beta1": 0.9989171802156962, "beta2": 0.95694428688404, "epsilon": 0.00010274681487747752, "use_nesterov": true, "adamw_weight_decay": 0.001472345324254681, "l2_weight_decay": 0.030657869802871093, "warmup_fraction": 0.0, "min_learning_rate_mult": 8.353444186606395e-05, "constant_fraction": 0.4442365015267288}, {"learning_rate": 2.8215270602289254e-05, "beta1": 0.9947491477797441, "beta2": 0.3954074744833336, "epsilon": 1.4307736638266088e-07, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.001623150171149677, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.04114157098166926}, {"learning_rate": 7.450646614151382e-05, "beta1": 0.9989156856643318, "beta2": 0.8963136108019556, "epsilon": 1.2059712655949254e-07, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.048914744595379485, "warmup_fraction": 2.930581316903262e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8577327062018985}, {"learning_rate": 1.6769091059331226e-05, "beta1": 0.71709708529259, "beta2": 0.937374330450984, "epsilon": 4.4495080936715726e-06, "use_nesterov": true, "adamw_weight_decay": 1.3481516352168464e-05, "l2_weight_decay": 0.0003010634622630666, "warmup_fraction": 0.050849396348855234, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8521786519068554}, {"learning_rate": 8.054514713977168e-05, "beta1": 0.983868725841856, "beta2": 0.9999055663986515, "epsilon": 608.2023376626722, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00277583286529234, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9277666853153175}, {"learning_rate": 0.6377055367225362, "beta1": 0.9979398227036278, "beta2": 0.9998970902832014, "epsilon": 1.0832226568381885e-06, "use_nesterov": false, "adamw_weight_decay": 0.0011762763920022705, "l2_weight_decay": 0.00011871649822520991, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6017694459763011}, {"learning_rate": 0.0002139149676840168, "beta1": 0.9972026463262926, "beta2": 0.9046216601206449, "epsilon": 2.102313065727758e-05, "use_nesterov": false, "adamw_weight_decay": 0.0002162646124017754, "l2_weight_decay": 0.0, "warmup_fraction": 0.0002072997016069292, "min_learning_rate_mult": 0.0019148614377363935, "constant_fraction": 0.3212758875281517}, {"learning_rate": 1.4953325323315652e-05, "beta1": 0.9950810167941807, "beta2": 0.9995094128268065, "epsilon": 0.0019829935948056402, "use_nesterov": false, "adamw_weight_decay": 0.00025048425473720587, "l2_weight_decay": 0.001987414284929346, "warmup_fraction": 0.0, "min_learning_rate_mult": 7.866446491603098e-05, "constant_fraction": 0.4222146618223276}, {"learning_rate": 0.05028334299941158, "beta1": 0.9514751290581651, "beta2": 0.9900302078635603, "epsilon": 3.839488076199265e-06, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.002996989965812699, "warmup_fraction": 0.001076434211011302, "min_learning_rate_mult": 0.9820148330258691, "constant_fraction": 0.8889168187701979}, {"learning_rate": 0.045583990072661215, "beta1": 0.9676198221876651, "beta2": 0.9257596197979705, "epsilon": 5010.129597974867, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00012714066151535327, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.00019828976351559194, "constant_fraction": 0.8602832999341775}, {"learning_rate": 0.03925750601525622, "beta1": 0.9899879006222343, "beta2": 0.9993963162935503, "epsilon": 0.0003002977260806783, "use_nesterov": true, "adamw_weight_decay": 0.014857313070892888, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0005189265814038618, "constant_fraction": 0.8566780261825233}, {"learning_rate": 0.2615545983050384, "beta1": 0.2723814457867325, "beta2": 0.999187141799463, "epsilon": 392.7456658084946, "use_nesterov": true, "adamw_weight_decay": 0.0035401813577238908, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9014309442276632}, {"learning_rate": 0.061846672270955756, "beta1": 0.812505209181548, "beta2": 0.9962163593048048, "epsilon": 5.323221717462392, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.029123437220814404, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.058248850841829104, "constant_fraction": 0.9552774444784183}, {"learning_rate": 0.013088601285270937, "beta1": 0.9927003475582047, "beta2": 0.9884712811743919, "epsilon": 0.0007863570964555409, "use_nesterov": false, "adamw_weight_decay": 0.005672038100033439, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 4.3460099647923614e-05, "constant_fraction": 0.8103626367206453}, {"learning_rate": 1.0681862306349509e-05, "beta1": 0.4245379047767269, "beta2": 0.9999894626908725, "epsilon": 1.836610001029924e-06, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0018122186283111485, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.001674203515334875, "constant_fraction": 0.37974594824318264}, {"learning_rate": 0.02511879935465365, "beta1": 0.9873624879129935, "beta2": 0.41366056252272165, "epsilon": 0.00020540013066066597, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.06202074813469012, "warmup_fraction": 0.005198025387809378, "min_learning_rate_mult": 0.00018890362583448783, "constant_fraction": 0.5850424589084879}, {"learning_rate": 0.0024752027371094084, "beta1": 0.8551466084020514, "beta2": 0.9991280839055179, "epsilon": 5.819129049338152e-08, "use_nesterov": true, "adamw_weight_decay": 0.0007678265218878735, "l2_weight_decay": 0.020055227986943466, "warmup_fraction": 0.005595007253939452, "min_learning_rate_mult": 0.0011741103474576888, "constant_fraction": 0.31045881578951684}, {"learning_rate": 0.0044897833650418915, "beta1": 0.9981887032828827, "beta2": 0.3586118733067791, "epsilon": 0.00010327320539393058, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.023401540337527012, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.007338757663487333, "constant_fraction": 0.04738248442821058}, {"learning_rate": 0.36773644298353014, "beta1": 0.6362263722939135, "beta2": 0.9999294479326444, "epsilon": 0.0017830511243456962, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0004936824004418885, "warmup_fraction": 0.013704056800093706, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5461115772339424}, {"learning_rate": 0.0022047479973742296, "beta1": 0.14155876399722056, "beta2": 0.9989085711758282, "epsilon": 0.9682842414474462, "use_nesterov": false, "adamw_weight_decay": 0.04189595496283904, "l2_weight_decay": 0.0010340123789073711, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.06411530315948089}, {"learning_rate": 0.009349730071803786, "beta1": 0.9950348581289398, "beta2": 0.8390545109212662, "epsilon": 0.0020927765603113613, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.006470891502199188, "warmup_fraction": 0.0003815959210832205, "min_learning_rate_mult": 0.31478359000253475, "constant_fraction": 0.053584794531799096}, {"learning_rate": 0.00012800118508402654, "beta1": 0.8984847808082502, "beta2": 0.9357492055361215, "epsilon": 0.021759141569843158, "use_nesterov": true, "adamw_weight_decay": 0.0013428114210981149, "l2_weight_decay": 0.001627880393869421, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9378060049254}, {"learning_rate": 0.31069006017257816, "beta1": 0.9963320358510267, "beta2": 0.9302868255304727, "epsilon": 601.0487900550694, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.012084607244167692, "warmup_fraction": 0.0016102840941798306, "min_learning_rate_mult": 0.0008450344232373543, "constant_fraction": 0.5204479758632768}, {"learning_rate": 0.0007996140772392538, "beta1": 0.9981583471080211, "beta2": 0.9994359463672353, "epsilon": 0.11187330546709434, "use_nesterov": true, "adamw_weight_decay": 0.00039337930002194, "l2_weight_decay": 0.0, "warmup_fraction": 0.02684885705763259, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7815562369821453}, {"learning_rate": 0.0325627351125573, "beta1": 0.9672211846236949, "beta2": 0.9947333660637748, "epsilon": 1496.4534576909373, "use_nesterov": false, "adamw_weight_decay": 0.0031287199756988245, "l2_weight_decay": 0.001338540772851294, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.41520899253476873}, {"learning_rate": 5.9563579399373896e-05, "beta1": 0.9912305273157465, "beta2": 0.9997962409438348, "epsilon": 28.80813991166612, "use_nesterov": false, "adamw_weight_decay": 0.01572329155811353, "l2_weight_decay": 3.924846437453497e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 2.177586020718093e-05, "constant_fraction": 0.8624956540326072}, {"learning_rate": 4.476309082022166e-05, "beta1": 0.9937411904534748, "beta2": 0.9999632570862297, "epsilon": 0.1332544321248041, "use_nesterov": true, "adamw_weight_decay": 0.07039146926628931, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.027268700723024897, "constant_fraction": 0.947266328554967}, {"learning_rate": 2.5341037335087848e-05, "beta1": 0.994675412932621, "beta2": 0.9999580568816822, "epsilon": 3.789944896864214e-08, "use_nesterov": true, "adamw_weight_decay": 0.08935969318555272, "l2_weight_decay": 0.023550965820150815, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.10161983244423066, "constant_fraction": 0.5984540963406323}, {"learning_rate": 0.18423550608792696, "beta1": 0.9968118745987524, "beta2": 0.9992345250604753, "epsilon": 6.907610446719499e-07, "use_nesterov": true, "adamw_weight_decay": 0.044176436226420215, "l2_weight_decay": 0.05680494423619285, "warmup_fraction": 0.0013116086261951404, "min_learning_rate_mult": 0.24216562521556284, "constant_fraction": 0.9467349958385552}, {"learning_rate": 9.828371112519713e-05, "beta1": 0.9890996710613894, "beta2": 0.9999871850796298, "epsilon": 2.9991607874490107, "use_nesterov": true, "adamw_weight_decay": 0.0015724618277796708, "l2_weight_decay": 0.00020569734823310982, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.782240929916094}, {"learning_rate": 0.0037530477860836502, "beta1": 0.9986848468480207, "beta2": 0.9998899345099934, "epsilon": 0.0009383140900204217, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 6.65467613379731e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 4.986182375668412e-05, "constant_fraction": 0.34980615892886435}, {"learning_rate": 1.214464264937742e-05, "beta1": 0.46965199245747324, "beta2": 0.9985739576801873, "epsilon": 0.016199614306416463, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.014636893627990716, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.41655917638393414}, {"learning_rate": 0.0017887220295297655, "beta1": 0.9986523203957988, "beta2": 0.9774316855243319, "epsilon": 73.28981862311942, "use_nesterov": true, "adamw_weight_decay": 0.004969014791525844, "l2_weight_decay": 2.6201968857920516e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.690313118947009}, {"learning_rate": 0.16895812798017035, "beta1": 0.8333115265139209, "beta2": 0.9980099066245002, "epsilon": 5.696929881147833e-06, "use_nesterov": false, "adamw_weight_decay": 5.425283919829837e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.20590558679317184}, {"learning_rate": 0.013339023155487868, "beta1": 0.8772460272561292, "beta2": 0.6997079269927124, "epsilon": 5646.7768363791065, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0009530178364265956, "warmup_fraction": 0.03843389565459758, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6938236115628553}, {"learning_rate": 0.03584131639550316, "beta1": 0.8394554650553652, "beta2": 0.9991158319202075, "epsilon": 0.5996464750148159, "use_nesterov": true, "adamw_weight_decay": 6.153279913532162e-05, "l2_weight_decay": 0.03566453986792376, "warmup_fraction": 6.80670804519652e-05, "min_learning_rate_mult": 0.0019579630547007375, "constant_fraction": 0.19067789349542197}, {"learning_rate": 0.0022560160213354625, "beta1": 0.3134172831729821, "beta2": 0.9822313595510433, "epsilon": 1.787202646474074, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.01796309542301316, "warmup_fraction": 0.00251722445582774, "min_learning_rate_mult": 1.1593502263459836e-05, "constant_fraction": 0.4757092875982579}, {"learning_rate": 3.76555882170645e-05, "beta1": 0.9925076926884936, "beta2": 0.9942574994137252, "epsilon": 2.234943335054811e-07, "use_nesterov": true, "adamw_weight_decay": 0.0011740591988258038, "l2_weight_decay": 0.012964773747961483, "warmup_fraction": 0.0001245114064163121, "min_learning_rate_mult": 0.0, "constant_fraction": 0.1791696853700292}, {"learning_rate": 8.844928926466121e-05, "beta1": 0.6987705643970186, "beta2": 0.8810813957281685, "epsilon": 0.5813725084457466, "use_nesterov": true, "adamw_weight_decay": 0.011880221692796953, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2154198419362474}, {"learning_rate": 0.0003697949144441597, "beta1": 0.9533045551712472, "beta2": 0.9984558374661429, "epsilon": 28.563677817481345, "use_nesterov": true, "adamw_weight_decay": 0.028308440846170832, "l2_weight_decay": 4.094245151769986e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9238634186925818}, {"learning_rate": 6.225127618111153e-05, "beta1": 0.9764376230626652, "beta2": 0.9824052117792915, "epsilon": 0.5589946437025044, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.02375253155806047, "warmup_fraction": 0.05070299645888822, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2473184202685642}, {"learning_rate": 0.00012915241746262436, "beta1": 0.9929475569152562, "beta2": 0.9949778837808113, "epsilon": 3.8711059915722936, "use_nesterov": true, "adamw_weight_decay": 0.029780927993200333, "l2_weight_decay": 1.955480370736167e-05, "warmup_fraction": 1.146598125607089e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.594041457961027}, {"learning_rate": 7.248643825201349e-05, "beta1": 0.9944160062131489, "beta2": 0.9970994631247664, "epsilon": 0.02487766287108851, "use_nesterov": true, "adamw_weight_decay": 0.024294138955137413, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7046037430442432}, {"learning_rate": 3.6320600296680235e-05, "beta1": 0.966302279231746, "beta2": 0.9972734695840538, "epsilon": 3.771335359495574e-05, "use_nesterov": true, "adamw_weight_decay": 0.022584767793418954, "l2_weight_decay": 8.321548913660184e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6884769232539149}, {"learning_rate": 0.7624421492036078, "beta1": 0.9918107308389682, "beta2": 0.9983599112469898, "epsilon": 0.006392137200785426, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00016945884129271192, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7874384575526875}, {"learning_rate": 1.0521045212516575e-05, "beta1": 0.9496971040440005, "beta2": 0.9944724721413932, "epsilon": 7.995602514614722, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 4.646819454387938e-05, "warmup_fraction": 6.879901306382299e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8961937664273317}, {"learning_rate": 0.0006810756604358635, "beta1": 0.9937647578196501, "beta2": 0.9998940423639543, "epsilon": 2.4540197355174643e-07, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0007731039467565046, "warmup_fraction": 0.047520879267062464, "min_learning_rate_mult": 0.0002299069830624156, "constant_fraction": 0.7904170127574637}, {"learning_rate": 1.5272318714270615e-05, "beta1": 0.44583893284278975, "beta2": 0.9998626897664439, "epsilon": 3709.0912824578177, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 6.0482067211325096e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0004266204698871537, "constant_fraction": 0.6479274338338492}, {"learning_rate": 0.01637653940005997, "beta1": 0.8853334605566153, "beta2": 0.9999073833968196, "epsilon": 2052.2394822077736, "use_nesterov": false, "adamw_weight_decay": 1.3072146457144287e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8061276205950726}, {"learning_rate": 0.008546896581639929, "beta1": 0.9969760169906653, "beta2": 0.9999150162960175, "epsilon": 3.566315030639487e-06, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0006305225741224833, "warmup_fraction": 0.01493743542241144, "min_learning_rate_mult": 0.1382276934688122, "constant_fraction": 0.4046069376202419}, {"learning_rate": 0.016043436953459396, "beta1": 0.9962013843924813, "beta2": 0.9991281866689485, "epsilon": 2060.708508463648, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00020537214831732687, "warmup_fraction": 0.003631297841118542, "min_learning_rate_mult": 0.0, "constant_fraction": 0.16067461994004661}, {"learning_rate": 0.20974817023751274, "beta1": 0.6456623887359726, "beta2": 0.9993339582027844, "epsilon": 1320.41764489082, "use_nesterov": false, "adamw_weight_decay": 4.9615919433060643e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.2501580792608986, "constant_fraction": 0.8230429433341123}, {"learning_rate": 8.38780386600525e-05, "beta1": 0.9958006308949275, "beta2": 0.9999743011378112, "epsilon": 425.7733507955501, "use_nesterov": true, "adamw_weight_decay": 0.06784919756419362, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2296863616140309}, {"learning_rate": 0.004431771946768311, "beta1": 0.6039543589515792, "beta2": 0.8753275974743968, "epsilon": 1321.2474926184589, "use_nesterov": false, "adamw_weight_decay": 9.838509459869302e-05, "l2_weight_decay": 2.9309776949965563e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8790667843152113}, {"learning_rate": 0.007125968559804296, "beta1": 0.06039113938677154, "beta2": 0.8771886474501213, "epsilon": 0.008324419099153664, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 5.391187545664084e-05, "warmup_fraction": 0.00017759156121275793, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9795225856068038}, {"learning_rate": 1.831272078916418e-05, "beta1": 0.9432399297851054, "beta2": 0.9441962753794975, "epsilon": 1.713801215088547e-06, "use_nesterov": false, "adamw_weight_decay": 0.08346914342987115, "l2_weight_decay": 0.0, "warmup_fraction": 1.1775905970861931e-05, "min_learning_rate_mult": 0.017092848741849916, "constant_fraction": 0.6381219820926074}, {"learning_rate": 2.2519436572354903e-05, "beta1": 0.9931845992429021, "beta2": 0.9843739473236951, "epsilon": 0.06842695530143984, "use_nesterov": true, "adamw_weight_decay": 0.002237269912268732, "l2_weight_decay": 0.0048180865491586795, "warmup_fraction": 2.8211768526243236e-05, "min_learning_rate_mult": 0.00036173001681144947, "constant_fraction": 0.5790146412984896}, {"learning_rate": 0.30242795899893526, "beta1": 0.6660660464900847, "beta2": 0.999977106375269, "epsilon": 2869.099734740961, "use_nesterov": true, "adamw_weight_decay": 0.006973682830321543, "l2_weight_decay": 0.0, "warmup_fraction": 0.00019836642865806762, "min_learning_rate_mult": 0.0, "constant_fraction": 0.12435766614150312}, {"learning_rate": 0.011519609790216372, "beta1": 0.9945786628555128, "beta2": 0.9952289333928893, "epsilon": 0.00025619149099746877, "use_nesterov": true, "adamw_weight_decay": 0.0011186844484058686, "l2_weight_decay": 0.03870669640218932, "warmup_fraction": 0.022932858171833995, "min_learning_rate_mult": 0.0, "constant_fraction": 0.20821711782143648}, {"learning_rate": 7.909838605187666e-05, "beta1": 0.6350272510039268, "beta2": 0.9999498422144614, "epsilon": 444.64260168379235, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.002295045914908692, "warmup_fraction": 0.0031753185152776564, "min_learning_rate_mult": 0.00019765729830294106, "constant_fraction": 0.8275261699514136}, {"learning_rate": 0.09882124151891682, "beta1": 0.9969517485950602, "beta2": 0.9999213628688438, "epsilon": 33.68226253966892, "use_nesterov": false, "adamw_weight_decay": 0.0002988983351843276, "l2_weight_decay": 0.0, "warmup_fraction": 1.2388525327044496e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.17611460405052937}, {"learning_rate": 0.28915252013326476, "beta1": 0.9872691251359172, "beta2": 0.9990877912285722, "epsilon": 0.01136528006758568, "use_nesterov": true, "adamw_weight_decay": 1.9683392933042787e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.028931304380948653, "constant_fraction": 0.7579706326889994}, {"learning_rate": 0.03793437355483491, "beta1": 0.9988119377379922, "beta2": 0.9999731289659097, "epsilon": 0.0002722612496020362, "use_nesterov": true, "adamw_weight_decay": 0.007835327029781394, "l2_weight_decay": 0.0017060580201600946, "warmup_fraction": 7.569203673530571e-05, "min_learning_rate_mult": 0.008741026283013915, "constant_fraction": 0.4860160087647577}, {"learning_rate": 3.45527046565045e-05, "beta1": 0.986869714342842, "beta2": 0.2045236801005167, "epsilon": 3.447394542306494e-05, "use_nesterov": false, "adamw_weight_decay": 0.006799660094019831, "l2_weight_decay": 0.0, "warmup_fraction": 0.001021354580115546, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6305678217902212}, {"learning_rate": 2.1343691013669864e-05, "beta1": 0.99722569009007, "beta2": 0.9998753786358908, "epsilon": 6.702472440835023, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.0550319825273372e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.028739491994114193, "constant_fraction": 0.9366562663932797}, {"learning_rate": 0.16102247257937732, "beta1": 0.9926287370347574, "beta2": 0.999859429580853, "epsilon": 292.7031982709721, "use_nesterov": true, "adamw_weight_decay": 0.0034970478309281827, "l2_weight_decay": 3.6865684622733606e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6774109203756421}, {"learning_rate": 0.0005302001208889189, "beta1": 0.800129246995437, "beta2": 0.9984208728479638, "epsilon": 162.7214490526932, "use_nesterov": true, "adamw_weight_decay": 3.214206906201691e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.71305725468194}, {"learning_rate": 0.00013628846280370034, "beta1": 0.9985060212946155, "beta2": 0.9788345892955661, "epsilon": 0.06198769877782303, "use_nesterov": false, "adamw_weight_decay": 0.0011529411720594255, "l2_weight_decay": 7.501741055602981e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.8292929279308142, "constant_fraction": 0.6241211572025865}, {"learning_rate": 0.14911147803374955, "beta1": 0.972847998558128, "beta2": 0.9986871665426197, "epsilon": 3.039203724513246e-05, "use_nesterov": true, "adamw_weight_decay": 0.001362320482369395, "l2_weight_decay": 0.0012954291073634914, "warmup_fraction": 2.0276467714678657e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.925859096784433}, {"learning_rate": 0.007683212636385746, "beta1": 0.8827618084230089, "beta2": 0.9999376653954826, "epsilon": 1.137575918065841, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00012999318118444387, "warmup_fraction": 0.08719976366587028, "min_learning_rate_mult": 0.0, "constant_fraction": 0.12146041002235042}, {"learning_rate": 0.5538440919800999, "beta1": 0.13769095169778345, "beta2": 0.9999868979846164, "epsilon": 0.004205392343382271, "use_nesterov": true, "adamw_weight_decay": 0.00012655048312570281, "l2_weight_decay": 0.0, "warmup_fraction": 1.1507404476562256e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7604752422249449}, {"learning_rate": 0.02376003681225914, "beta1": 0.9897951056357981, "beta2": 0.5617570220430143, "epsilon": 846.1001056029232, "use_nesterov": false, "adamw_weight_decay": 0.0022320959642908407, "l2_weight_decay": 0.0021736376778192976, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.69986393328263}, {"learning_rate": 0.9808636054653961, "beta1": 0.5901145114182004, "beta2": 0.9989796613395219, "epsilon": 4.4147684763924026e-05, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.057516191049538916, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2719158705796789}, {"learning_rate": 0.005490962415211446, "beta1": 0.9935899758592708, "beta2": 0.9875878483995596, "epsilon": 4.646330685708923e-05, "use_nesterov": false, "adamw_weight_decay": 0.0035994045252809893, "l2_weight_decay": 0.08816527883790716, "warmup_fraction": 0.0002837730401872178, "min_learning_rate_mult": 0.006402537451998484, "constant_fraction": 0.9708141869397184}, {"learning_rate": 7.62239340047126e-05, "beta1": 0.9988044272465847, "beta2": 0.9998064185357735, "epsilon": 8.012880932688383e-06, "use_nesterov": false, "adamw_weight_decay": 0.00023853513225312073, "l2_weight_decay": 0.0022914854772127613, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5573720320388376}, {"learning_rate": 0.3357035810081224, "beta1": 0.9982196175608385, "beta2": 0.996556671092559, "epsilon": 2.939586291309441e-08, "use_nesterov": false, "adamw_weight_decay": 1.629029844822613e-05, "l2_weight_decay": 0.07518349059598269, "warmup_fraction": 0.0001328752261301094, "min_learning_rate_mult": 0.0001827896671310396, "constant_fraction": 0.3973015922950053}, {"learning_rate": 0.0024552073110330995, "beta1": 0.9986635494138182, "beta2": 0.9995890376288472, "epsilon": 4401.502738560305, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 2.1248615189952403e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0001457302441347315, "constant_fraction": 0.6163643843429732}, {"learning_rate": 0.08233559738258157, "beta1": 0.9988538531773754, "beta2": 0.9918048773296669, "epsilon": 2.0180410026934213e-05, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.002997545248805927, "warmup_fraction": 1.4360411812157642e-05, "min_learning_rate_mult": 0.00014001540742016093, "constant_fraction": 0.5094376273476062}, {"learning_rate": 0.5498569825284523, "beta1": 0.35610185728984134, "beta2": 0.9963510207030689, "epsilon": 0.0016914957249051835, "use_nesterov": true, "adamw_weight_decay": 0.0690842069929862, "l2_weight_decay": 0.0, "warmup_fraction": 1.2376754822713583e-05, "min_learning_rate_mult": 0.0012888598119468247, "constant_fraction": 0.810132471708561}, {"learning_rate": 1.5326749741380235e-05, "beta1": 0.9946688871833562, "beta2": 0.9938860535615398, "epsilon": 0.00012477044242288618, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0006511746906285882, "warmup_fraction": 0.0066657284525216, "min_learning_rate_mult": 0.00016286742350405097, "constant_fraction": 0.5612709431534806}, {"learning_rate": 4.017807263244162e-05, "beta1": 0.9887829729159131, "beta2": 0.9993154092900862, "epsilon": 0.8381818921238815, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.1536670189740288e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.03076998968795827, "constant_fraction": 0.9992136203556568}, {"learning_rate": 0.16410092368429044, "beta1": 0.9948669784597299, "beta2": 0.999987136592776, "epsilon": 5.516820448201073, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0016191947729543897, "warmup_fraction": 0.0019855758419887516, "min_learning_rate_mult": 0.0, "constant_fraction": 0.17852427875489418}, {"learning_rate": 0.0031912129777838245, "beta1": 0.9989325874170182, "beta2": 0.9990639574536708, "epsilon": 48.03330296448983, "use_nesterov": false, "adamw_weight_decay": 0.0003266521339847212, "l2_weight_decay": 0.0, "warmup_fraction": 3.22056292800301e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.671392871665639}, {"learning_rate": 0.02138571374305623, "beta1": 0.9368832964106403, "beta2": 0.9999881545175042, "epsilon": 0.032782918013639264, "use_nesterov": false, "adamw_weight_decay": 1.738411434221514e-05, "l2_weight_decay": 0.0031316046792941228, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7167303844884497}, {"learning_rate": 0.00010212916927871752, "beta1": 0.9564794330127985, "beta2": 0.9390524070192383, "epsilon": 1.2773868050392018e-07, "use_nesterov": false, "adamw_weight_decay": 0.00011326904674302757, "l2_weight_decay": 2.5261003617835683e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.00012050671465411394, "constant_fraction": 0.7167358002288488}, {"learning_rate": 0.17805592104396045, "beta1": 0.9665573133549223, "beta2": 0.15223868677350405, "epsilon": 0.01682594026897968, "use_nesterov": true, "adamw_weight_decay": 0.0002091200627740905, "l2_weight_decay": 0.0004880214919562334, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7544484930735964}, {"learning_rate": 0.04015244211604988, "beta1": 0.9458991945666353, "beta2": 0.999987681690943, "epsilon": 26.056407329709042, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0038277089401067225, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.19821796779646195}, {"learning_rate": 0.5936152951337726, "beta1": 0.3622367420589482, "beta2": 0.9922172823857687, "epsilon": 0.0005092327792992177, "use_nesterov": true, "adamw_weight_decay": 0.0006576900703389787, "l2_weight_decay": 0.0, "warmup_fraction": 0.00776891459971948, "min_learning_rate_mult": 0.0, "constant_fraction": 0.899009001101913}, {"learning_rate": 7.47383329305523e-05, "beta1": 0.5026651197753146, "beta2": 0.9999561322391187, "epsilon": 3.4347495037623686e-06, "use_nesterov": true, "adamw_weight_decay": 0.004010185027248033, "l2_weight_decay": 0.0, "warmup_fraction": 0.003862785367250584, "min_learning_rate_mult": 0.3329030990060723, "constant_fraction": 0.05043430661263282}, {"learning_rate": 0.00028258590508700607, "beta1": 0.9912369309242292, "beta2": 0.8594314819418565, "epsilon": 500.34890808895756, "use_nesterov": true, "adamw_weight_decay": 0.0006178812685289673, "l2_weight_decay": 0.01775024378643101, "warmup_fraction": 0.007445883461918307, "min_learning_rate_mult": 0.0, "constant_fraction": 0.22313010241470466}, {"learning_rate": 0.0001112736469063851, "beta1": 0.9911983467935414, "beta2": 0.9970204750747228, "epsilon": 1.630057392690269e-07, "use_nesterov": false, "adamw_weight_decay": 3.271722368074644e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.00022187368208575805, "min_learning_rate_mult": 0.0026280457340001917, "constant_fraction": 0.715475349337666}, {"learning_rate": 0.0008253428070377102, "beta1": 0.10424134060512813, "beta2": 0.6966948919053101, "epsilon": 8740.743094264977, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.005940254052919288, "warmup_fraction": 2.8782958909433597e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9256057569348282}, {"learning_rate": 0.0002282020071911179, "beta1": 0.9989757379354788, "beta2": 0.9936957489523625, "epsilon": 314.64541671722225, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0005521837965300396, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.5463560343743707, "constant_fraction": 0.5185303963315965}, {"learning_rate": 6.0648205821143345e-05, "beta1": 0.7823332761474457, "beta2": 0.999051165605713, "epsilon": 0.06276256348388458, "use_nesterov": true, "adamw_weight_decay": 0.015898283195490897, "l2_weight_decay": 4.0832172098408656e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8796981474690118}, {"learning_rate": 6.306428921264133e-05, "beta1": 0.9815931208723533, "beta2": 0.7599711222461637, "epsilon": 1.1245390335382044, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.009205398911232907, "warmup_fraction": 5.648658097754081e-05, "min_learning_rate_mult": 0.39486902937643154, "constant_fraction": 0.23510950693064836}, {"learning_rate": 0.7653254264340544, "beta1": 0.9894672822756501, "beta2": 0.9254852604782362, "epsilon": 6.013213543591692e-05, "use_nesterov": false, "adamw_weight_decay": 0.05260204859261757, "l2_weight_decay": 0.0027128494366592073, "warmup_fraction": 0.006951134090478177, "min_learning_rate_mult": 0.00012637536272342803, "constant_fraction": 0.8489728814510088}, {"learning_rate": 7.843715175143875e-05, "beta1": 0.7937927499335167, "beta2": 0.22116280894375273, "epsilon": 0.059304351666423935, "use_nesterov": false, "adamw_weight_decay": 9.387504303890384e-05, "l2_weight_decay": 0.00027261469254643965, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.4990449183267538}, {"learning_rate": 0.0053678329019364035, "beta1": 0.9927984471212988, "beta2": 0.9847028254685708, "epsilon": 3.1304289730814824e-05, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.005284772124971204, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0003343932885681134, "constant_fraction": 0.3788562531447075}, {"learning_rate": 5.7598737930205595e-05, "beta1": 0.9875482671950256, "beta2": 0.9989023441067508, "epsilon": 300.44895246414194, "use_nesterov": false, "adamw_weight_decay": 0.000177393967476232, "l2_weight_decay": 0.0, "warmup_fraction": 0.0001796561537191753, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9890091893799037}, {"learning_rate": 0.8601362961091618, "beta1": 0.9949127609007702, "beta2": 0.9975312716949363, "epsilon": 0.2786394291018055, "use_nesterov": false, "adamw_weight_decay": 1.6372127248337716e-05, "l2_weight_decay": 0.0, "warmup_fraction": 1.9786562703599634e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6263819668207528}, {"learning_rate": 0.957162041915142, "beta1": 0.9931138826237556, "beta2": 0.9835530037225414, "epsilon": 0.15722599106099883, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 3.470908452511609e-05, "warmup_fraction": 9.45651825573908e-05, "min_learning_rate_mult": 0.0001841923102068693, "constant_fraction": 0.7658745816117201}, {"learning_rate": 0.006356946083203916, "beta1": 0.9923887220978013, "beta2": 0.999981652393998, "epsilon": 108.57643192315975, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 8.544672472745506e-05, "warmup_fraction": 0.0001531153043518029, "min_learning_rate_mult": 1.2036974199149832e-05, "constant_fraction": 0.03797675622573482}, {"learning_rate": 0.2613169090177041, "beta1": 0.945019472427461, "beta2": 0.9998950427743104, "epsilon": 7226.475971604108, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.6512001795666684e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0004897857637287275, "constant_fraction": 0.1355179964108344}, {"learning_rate": 0.012680538600070077, "beta1": 0.9866814972121609, "beta2": 0.4299672781363525, "epsilon": 6952.923751443349, "use_nesterov": true, "adamw_weight_decay": 0.00012275647471314693, "l2_weight_decay": 0.0, "warmup_fraction": 0.0007135260743743379, "min_learning_rate_mult": 0.0, "constant_fraction": 0.01660747452517841}, {"learning_rate": 3.097818098660811e-05, "beta1": 0.8903655223914928, "beta2": 0.9998255780711064, "epsilon": 0.0006408954406357277, "use_nesterov": true, "adamw_weight_decay": 5.489953166564693e-05, "l2_weight_decay": 5.2235275755318736e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.37132956041398507, "constant_fraction": 0.6997935295191818}, {"learning_rate": 7.720431766937712e-05, "beta1": 0.3517216137040585, "beta2": 0.999986073673069, "epsilon": 1.3561540268862626, "use_nesterov": true, "adamw_weight_decay": 0.0020980844831033443, "l2_weight_decay": 0.00019275690642900532, "warmup_fraction": 0.0, "min_learning_rate_mult": 1.058497171258805e-05, "constant_fraction": 0.7966839492404932}, {"learning_rate": 0.005200184353580875, "beta1": 0.6922189839900328, "beta2": 0.9732370404630762, "epsilon": 7743.891106333356, "use_nesterov": false, "adamw_weight_decay": 0.004628484917287984, "l2_weight_decay": 0.016793450663819324, "warmup_fraction": 0.0006283509571894367, "min_learning_rate_mult": 0.028062289635148487, "constant_fraction": 0.1307576827297181}, {"learning_rate": 0.00131154226300022, "beta1": 0.991148617546453, "beta2": 0.9999536667873767, "epsilon": 0.00023024974942258044, "use_nesterov": true, "adamw_weight_decay": 3.8452681215195286e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9932584208976665}, {"learning_rate": 0.9175918746008406, "beta1": 0.9869608329174023, "beta2": 0.4968716855846794, "epsilon": 11.843897057402613, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.011468082836200254, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5041025451704676}, {"learning_rate": 0.09111861995814573, "beta1": 0.7771934122018913, "beta2": 0.9994986790165903, "epsilon": 1.3410134922532295, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.001402043895689164, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6132652260389094}, {"learning_rate": 0.00471517435085035, "beta1": 0.9808695830238614, "beta2": 0.9999521441538781, "epsilon": 4.886625932984867e-05, "use_nesterov": false, "adamw_weight_decay": 2.2078880200066138e-05, "l2_weight_decay": 0.00075936412072233, "warmup_fraction": 0.012098004977358133, "min_learning_rate_mult": 0.9490097353774577, "constant_fraction": 0.478388634982432}, {"learning_rate": 1.2627009366552325e-05, "beta1": 0.4652222798034963, "beta2": 0.9999564433992058, "epsilon": 1131.8457919837294, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 5.5189583699193204e-05, "warmup_fraction": 0.007916575126335017, "min_learning_rate_mult": 0.0011830248455240698, "constant_fraction": 0.598100479366304}, {"learning_rate": 0.28649064247020617, "beta1": 0.9869846615414583, "beta2": 0.9845362047771481, "epsilon": 209.982640648495, "use_nesterov": false, "adamw_weight_decay": 2.595285415315067e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8708063545475103}, {"learning_rate": 0.8536597378679915, "beta1": 0.8121545167857178, "beta2": 0.7481898416181012, "epsilon": 0.5356311025245134, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00033783891834184346, "warmup_fraction": 0.0013960495174835772, "min_learning_rate_mult": 0.0, "constant_fraction": 0.29127043750693493}, {"learning_rate": 0.0366178272773394, "beta1": 0.9665477862034945, "beta2": 0.9957040034750587, "epsilon": 1.987509723119354e-07, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 4.314514122340363e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7483125592058321}, {"learning_rate": 0.00036003105256364595, "beta1": 0.7150089314270774, "beta2": 0.9988388329875264, "epsilon": 6.323994469041008e-08, "use_nesterov": false, "adamw_weight_decay": 0.007118485017832658, "l2_weight_decay": 0.09918946038308225, "warmup_fraction": 0.0026168903764689088, "min_learning_rate_mult": 0.0141527749848422, "constant_fraction": 0.5305403487825785}, {"learning_rate": 4.2950383210255114e-05, "beta1": 0.33099966462806407, "beta2": 0.994823263204482, "epsilon": 2.1346938607797306, "use_nesterov": true, "adamw_weight_decay": 0.00028306079779619875, "l2_weight_decay": 0.0, "warmup_fraction": 1.738046474207586e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9757422982435554}, {"learning_rate": 0.0002485951360076637, "beta1": 0.36990131962894135, "beta2": 0.5843653799839834, "epsilon": 0.001345967114365581, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 6.915317098146145e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 1.8985812933648974e-05, "constant_fraction": 0.3734720752663371}, {"learning_rate": 0.00011483943349572463, "beta1": 0.9988998840943069, "beta2": 0.999891361801411, "epsilon": 3.1949256999674034e-08, "use_nesterov": true, "adamw_weight_decay": 0.0068276716824655055, "l2_weight_decay": 0.00013858589153242822, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5710718395181347}, {"learning_rate": 6.232034624111315e-05, "beta1": 0.7833453372842125, "beta2": 0.9999774722658036, "epsilon": 7.764977470477154e-05, "use_nesterov": false, "adamw_weight_decay": 0.019038639694177024, "l2_weight_decay": 0.0, "warmup_fraction": 0.00074483246961435, "min_learning_rate_mult": 0.0009775964588679962, "constant_fraction": 0.5666949968652031}, {"learning_rate": 0.004402629865173251, "beta1": 0.980224647050432, "beta2": 0.9998908681186573, "epsilon": 282.46660930624915, "use_nesterov": true, "adamw_weight_decay": 0.00010067175307837581, "l2_weight_decay": 1.8330644902430837e-05, "warmup_fraction": 0.0015562056862498833, "min_learning_rate_mult": 2.317643880558142e-05, "constant_fraction": 0.21328897797238122}, {"learning_rate": 0.07202508290937591, "beta1": 0.9726543939715926, "beta2": 0.999988159646071, "epsilon": 8.551379244968756e-07, "use_nesterov": true, "adamw_weight_decay": 5.484838891616215e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6178299275455342}, {"learning_rate": 0.0017644881376746443, "beta1": 0.9818714607473549, "beta2": 0.9999519925102033, "epsilon": 2.215383326570832e-07, "use_nesterov": false, "adamw_weight_decay": 0.00725505239272043, "l2_weight_decay": 0.0005740583721489348, "warmup_fraction": 0.0003079423821349844, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5766057609461084}, {"learning_rate": 0.00021607765112165747, "beta1": 0.24162253894162466, "beta2": 0.9999696619758686, "epsilon": 0.003193759233824065, "use_nesterov": true, "adamw_weight_decay": 0.008553448684140022, "l2_weight_decay": 0.0, "warmup_fraction": 0.000985406379740836, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6538633953933071}, {"learning_rate": 5.4204380708769846e-05, "beta1": 0.9956011692051703, "beta2": 0.9712200656716008, "epsilon": 0.012903910354956402, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.006266751212390608, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.10029041385829932, "constant_fraction": 0.13907220665766196}, {"learning_rate": 0.28707738228721175, "beta1": 0.9769533773941488, "beta2": 0.9493169663981779, "epsilon": 3.2480511104035496e-08, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0048203660951666475, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.23078200852070163}, {"learning_rate": 1.7764938838585116e-05, "beta1": 0.07498696471061284, "beta2": 0.9826641251356445, "epsilon": 6.918518209779241e-07, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.009571941726505202, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.00014536068965822314, "constant_fraction": 0.9583150965737638}, {"learning_rate": 0.0001768471374460242, "beta1": 0.9715063272612559, "beta2": 0.9976222267324218, "epsilon": 2.3003667693420153, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 3.126378291114844e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.513805726817965}, {"learning_rate": 5.202649925843598e-05, "beta1": 0.9796392195111976, "beta2": 0.999982421761267, "epsilon": 0.059430141044277816, "use_nesterov": false, "adamw_weight_decay": 0.06066527394382188, "l2_weight_decay": 8.285574421819333e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.018696726575711798, "constant_fraction": 0.5988913902118008}, {"learning_rate": 0.02535378225689493, "beta1": 0.6418515110748824, "beta2": 0.9997554219352259, "epsilon": 125.16463022937295, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 5.1939287496776445e-05, "warmup_fraction": 0.01569990827681069, "min_learning_rate_mult": 0.0, "constant_fraction": 0.009484865020033761}, {"learning_rate": 0.1833021694607107, "beta1": 0.993476147082401, "beta2": 0.9999790299637341, "epsilon": 0.0004697026736450301, "use_nesterov": true, "adamw_weight_decay": 1.2324281310321709e-05, "l2_weight_decay": 0.005525346905067978, "warmup_fraction": 1.6292094639279448e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9428391189280598}, {"learning_rate": 9.091138881852359e-05, "beta1": 0.5878342373110477, "beta2": 0.9604232279762215, "epsilon": 1.64302690262604e-05, "use_nesterov": true, "adamw_weight_decay": 9.574556802055981e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0012210016580598466, "constant_fraction": 0.682336690595303}, {"learning_rate": 0.0005513416175771913, "beta1": 0.9971346129504763, "beta2": 0.9982924196445951, "epsilon": 26.554612629154715, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0003544954435945734, "warmup_fraction": 0.04836816397054053, "min_learning_rate_mult": 0.002736070143110126, "constant_fraction": 0.05148039085606382}, {"learning_rate": 0.0009551683590886598, "beta1": 0.6458339136875497, "beta2": 0.9986664473532302, "epsilon": 2436.9888469359666, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.07374978081225673, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.006881204697934288, "constant_fraction": 0.5757703444398831}, {"learning_rate": 0.006115103953299133, "beta1": 0.0725725033728577, "beta2": 0.9999803960338887, "epsilon": 329.10023777688116, "use_nesterov": false, "adamw_weight_decay": 0.00010167466953320674, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 1.3830387409592812e-05, "constant_fraction": 0.07046095492702253}, {"learning_rate": 0.00013253134955188982, "beta1": 0.9975249132525627, "beta2": 0.999789370390599, "epsilon": 3.4660244370681337, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0035381581394937113, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0001717603677907106, "constant_fraction": 0.8921859308642364}, {"learning_rate": 0.05582211245510444, "beta1": 0.9862515654719601, "beta2": 0.9942822958440981, "epsilon": 3.8625114588284195e-08, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.04429910972622699, "warmup_fraction": 5.995592205081576e-05, "min_learning_rate_mult": 3.207749127731321e-05, "constant_fraction": 0.7244264943923319}, {"learning_rate": 0.016105349263933106, "beta1": 0.7841261919305398, "beta2": 0.9999312633023925, "epsilon": 19.330058804820617, "use_nesterov": false, "adamw_weight_decay": 0.0002029624831452395, "l2_weight_decay": 0.0030926992761758196, "warmup_fraction": 8.098541623472968e-05, "min_learning_rate_mult": 0.0012519059967426266, "constant_fraction": 0.47313511217803605}, {"learning_rate": 0.186104218255701, "beta1": 0.9980297630972892, "beta2": 0.9998003425029622, "epsilon": 10.393189660571302, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0010407225935496695, "warmup_fraction": 7.447935508256545e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7907467105201533}, {"learning_rate": 0.9921264182097522, "beta1": 0.9739126460012365, "beta2": 0.9876431854012738, "epsilon": 0.04685163102654306, "use_nesterov": false, "adamw_weight_decay": 0.0012565924884604398, "l2_weight_decay": 0.04586879410503247, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.005627211765420174, "constant_fraction": 0.20236288909586708}, {"learning_rate": 0.04521272039108537, "beta1": 0.5237524947026636, "beta2": 0.9880570102931765, "epsilon": 33.520836859684884, "use_nesterov": true, "adamw_weight_decay": 1.9711725185953847e-05, "l2_weight_decay": 0.0563019753061221, "warmup_fraction": 0.0, "min_learning_rate_mult": 7.961829036703987e-05, "constant_fraction": 0.6060624691111425}, {"learning_rate": 0.012250080016067205, "beta1": 0.9418758988732708, "beta2": 0.9996953228816177, "epsilon": 3.9906888012475648, "use_nesterov": true, "adamw_weight_decay": 0.00015471987948501186, "l2_weight_decay": 0.0006926552252155988, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9105428897077981}, {"learning_rate": 0.3910706870644346, "beta1": 0.9061802659980913, "beta2": 0.9479646553499157, "epsilon": 0.0003460423295899584, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 2.0122636532070906e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.12720493226342144, "constant_fraction": 0.673399839658001}, {"learning_rate": 0.2499851807550562, "beta1": 0.9901217325638896, "beta2": 0.9986014274017192, "epsilon": 1.1681133715838719, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0006329361559764824, "warmup_fraction": 0.0002560155808950335, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5040262689570258}, {"learning_rate": 0.002941369486501652, "beta1": 0.9876063862861368, "beta2": 0.9999475853911728, "epsilon": 0.025247147051145634, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0010655381473687, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8298621826205412}, {"learning_rate": 0.00017988069382152093, "beta1": 0.9502952402757069, "beta2": 0.9999884003957685, "epsilon": 3.3965774878725434, "use_nesterov": false, "adamw_weight_decay": 0.0026346968019176553, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2826526011129933}, {"learning_rate": 0.0036884225525994968, "beta1": 0.23531443075307812, "beta2": 0.9999890766053607, "epsilon": 883.1258622952907, "use_nesterov": true, "adamw_weight_decay": 3.54939350768059e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.00016600198071163325, "min_learning_rate_mult": 0.10521581750258203, "constant_fraction": 0.040395863263345655}, {"learning_rate": 0.0010557917567298699, "beta1": 0.757063826976422, "beta2": 0.9994536559737652, "epsilon": 3.3833463334845115, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0006016178982844296, "warmup_fraction": 0.00019099360693178977, "min_learning_rate_mult": 0.6633653201531874, "constant_fraction": 0.21230414721999558}, {"learning_rate": 0.042292339236647124, "beta1": 0.8526210950397477, "beta2": 0.9999859285466922, "epsilon": 7134.418544713838, "use_nesterov": true, "adamw_weight_decay": 0.020338792941443817, "l2_weight_decay": 0.0, "warmup_fraction": 0.012405442119562926, "min_learning_rate_mult": 0.009786119943805453, "constant_fraction": 0.46476441005310476}, {"learning_rate": 0.050845983933307755, "beta1": 0.9981005682700799, "beta2": 0.7164816188330072, "epsilon": 7723.658259952292, "use_nesterov": true, "adamw_weight_decay": 0.009237497822899557, "l2_weight_decay": 0.00018560086230184558, "warmup_fraction": 0.007196755033281666, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2478307280771228}, {"learning_rate": 0.8018685040527282, "beta1": 0.9362799807398676, "beta2": 0.9989180196603074, "epsilon": 0.003502458259156597, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.004590858657485709, "warmup_fraction": 0.0352354238069754, "min_learning_rate_mult": 0.00024889075961346163, "constant_fraction": 0.9733050264470916}, {"learning_rate": 0.0001076928300450341, "beta1": 0.9063575604775158, "beta2": 0.9999884257488948, "epsilon": 7084.427954359263, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.015972763312802795, "warmup_fraction": 0.0, "min_learning_rate_mult": 2.6322827344680846e-05, "constant_fraction": 0.618722320868769}, {"learning_rate": 0.0001345093444080637, "beta1": 0.4070561771056236, "beta2": 0.9214531380491845, "epsilon": 0.15089633190528717, "use_nesterov": true, "adamw_weight_decay": 0.07008323822349814, "l2_weight_decay": 0.0, "warmup_fraction": 0.00163512520589643, "min_learning_rate_mult": 0.0, "constant_fraction": 0.3110813136365519}, {"learning_rate": 2.982287816553904e-05, "beta1": 0.6812698126486676, "beta2": 0.09402749728501525, "epsilon": 1.2571596939245928, "use_nesterov": true, "adamw_weight_decay": 0.01659649209131383, "l2_weight_decay": 0.0001944849817242997, "warmup_fraction": 9.636115071738025e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5516584161115266}, {"learning_rate": 0.40700360053932433, "beta1": 0.8876129898327777, "beta2": 0.9982032289270398, "epsilon": 4.24564388257147e-06, "use_nesterov": true, "adamw_weight_decay": 0.00790259851642279, "l2_weight_decay": 0.0076118697361470585, "warmup_fraction": 1.5555211443275062e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7965175951113994}, {"learning_rate": 1.0633414044560634e-05, "beta1": 0.9892899767438452, "beta2": 0.9999263829561419, "epsilon": 1.5615056851806941e-06, "use_nesterov": false, "adamw_weight_decay": 0.00011291232254827871, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.18338066317788604}, {"learning_rate": 0.2942588136335709, "beta1": 0.9969258593349817, "beta2": 0.9975567321825187, "epsilon": 0.022810025463248135, "use_nesterov": false, "adamw_weight_decay": 0.00019929063750826547, "l2_weight_decay": 0.0, "warmup_fraction": 0.013292105287786097, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6544817335919817}, {"learning_rate": 0.0004489559097012545, "beta1": 0.9918401213713596, "beta2": 0.8476166106526857, "epsilon": 0.9388331624017332, "use_nesterov": true, "adamw_weight_decay": 0.06919274024993659, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.11676918906984235}, {"learning_rate": 0.032766467889234215, "beta1": 0.9779892467695256, "beta2": 0.9918506377530475, "epsilon": 109.31378880559511, "use_nesterov": false, "adamw_weight_decay": 1.7499732069008034e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0045327514912770275, "min_learning_rate_mult": 0.6458519402128488, "constant_fraction": 0.3927606238431284}, {"learning_rate": 0.03588394296894301, "beta1": 0.2229381534576751, "beta2": 0.8629637994179242, "epsilon": 2.9494225585626906e-05, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0002588286822337671, "warmup_fraction": 0.00027159546697996616, "min_learning_rate_mult": 0.2567141461252629, "constant_fraction": 0.3846843714674226}, {"learning_rate": 0.07930061702282418, "beta1": 0.9727468577896069, "beta2": 0.952898618552175, "epsilon": 1.3626601408403889e-07, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.000317189559493341, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.015641172600574134, "constant_fraction": 0.2799480641074109}, {"learning_rate": 0.13684104769497302, "beta1": 0.9524877750263702, "beta2": 0.999007047202531, "epsilon": 4.331541894399849e-08, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0019035220226489313, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.4324286729569925}, {"learning_rate": 0.0006925688367497116, "beta1": 0.9795333637744869, "beta2": 0.7054144666955852, "epsilon": 2238.175445810647, "use_nesterov": false, "adamw_weight_decay": 0.00018111851048876803, "l2_weight_decay": 0.0, "warmup_fraction": 0.036096571921792976, "min_learning_rate_mult": 8.581805741226378e-05, "constant_fraction": 0.4317895047877509}, {"learning_rate": 4.8144956400915616e-05, "beta1": 0.826338423459615, "beta2": 0.9999572966271213, "epsilon": 727.8916368520369, "use_nesterov": true, "adamw_weight_decay": 0.007210410365939807, "l2_weight_decay": 0.0442035799609412, "warmup_fraction": 0.008795827225355816, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5532525020768582}, {"learning_rate": 0.0031334255424162417, "beta1": 0.7064164341003139, "beta2": 0.28347905472019896, "epsilon": 0.0078422263925981, "use_nesterov": true, "adamw_weight_decay": 6.158128160541717e-05, "l2_weight_decay": 0.015472035932725121, "warmup_fraction": 0.05655757402539798, "min_learning_rate_mult": 0.0027364093758020717, "constant_fraction": 0.7496318035232679}, {"learning_rate": 0.05639942122562145, "beta1": 0.9986519027131475, "beta2": 0.9999093755696894, "epsilon": 0.0002595050910724847, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 4.125278298940614e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 2.5711457700943273e-05, "constant_fraction": 0.8511723755691694}, {"learning_rate": 0.00019656556883700167, "beta1": 0.708119813244962, "beta2": 0.9994435438787863, "epsilon": 2.7022830885200158, "use_nesterov": true, "adamw_weight_decay": 0.0018316901541283095, "l2_weight_decay": 0.0, "warmup_fraction": 4.354106669128726e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.021609023001578964}, {"learning_rate": 0.08637289096323869, "beta1": 0.9980850626476486, "beta2": 0.8940743478011058, "epsilon": 4635.876159947905, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.014269617359724403, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6309698147564052}, {"learning_rate": 3.641413706925684e-05, "beta1": 0.9985841401035528, "beta2": 0.99961527605994, "epsilon": 0.06681434134287254, "use_nesterov": false, "adamw_weight_decay": 0.00029363019861293986, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0003834301714287493, "constant_fraction": 0.36152934302056927}, {"learning_rate": 0.009075056994736373, "beta1": 0.9951120132832658, "beta2": 0.9999529636925543, "epsilon": 0.002252573762266706, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0030850198905983824, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6678992539370858}, {"learning_rate": 0.026916327794731205, "beta1": 0.9945215864531803, "beta2": 0.999747135017799, "epsilon": 0.00010590488570992774, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0017175280170147553, "warmup_fraction": 2.5029766596578843e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9741533333507638}, {"learning_rate": 0.03133948678508111, "beta1": 0.40303416805617254, "beta2": 0.9999389937254066, "epsilon": 0.06395479126151063, "use_nesterov": false, "adamw_weight_decay": 0.0003323508675785316, "l2_weight_decay": 0.0009743345190051412, "warmup_fraction": 0.043713510661838435, "min_learning_rate_mult": 0.0101423250957228, "constant_fraction": 0.9188540784535393}, {"learning_rate": 0.0007477658685576898, "beta1": 0.9969695210164229, "beta2": 0.9804055472480514, "epsilon": 1.3271869700054504e-07, "use_nesterov": true, "adamw_weight_decay": 3.9292316981378336e-05, "l2_weight_decay": 0.09978881572445983, "warmup_fraction": 0.03537228293556087, "min_learning_rate_mult": 0.0, "constant_fraction": 0.48861155952715074}, {"learning_rate": 3.0468289302266842e-05, "beta1": 0.4808433309454959, "beta2": 0.9712579963673235, "epsilon": 0.9714992999734426, "use_nesterov": false, "adamw_weight_decay": 5.9140430266882845e-05, "l2_weight_decay": 0.028067527073925035, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7151731941925739}, {"learning_rate": 0.02033776358289902, "beta1": 0.9836707587974077, "beta2": 0.9999857139477965, "epsilon": 9.099394048296245e-06, "use_nesterov": false, "adamw_weight_decay": 0.0001390919937957036, "l2_weight_decay": 0.00043060649265366725, "warmup_fraction": 0.002174749579564076, "min_learning_rate_mult": 0.09043584835967633, "constant_fraction": 0.8203910846252422}, {"learning_rate": 0.051058247255003346, "beta1": 0.9980940922292076, "beta2": 0.9998992221837112, "epsilon": 9.246466234835836e-06, "use_nesterov": false, "adamw_weight_decay": 0.00018810838147781877, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0011064971976116832, "constant_fraction": 0.38685173494779057}, {"learning_rate": 0.3106247438038283, "beta1": 0.07355399219658376, "beta2": 0.9999163552116884, "epsilon": 54.23879779133018, "use_nesterov": true, "adamw_weight_decay": 6.692811896639284e-05, "l2_weight_decay": 0.0, "warmup_fraction": 8.275868461022482e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.4217009810371497}, {"learning_rate": 0.8972280450808423, "beta1": 0.9649817557734592, "beta2": 0.9972310928589263, "epsilon": 5.983275623765303e-08, "use_nesterov": false, "adamw_weight_decay": 0.000977579932700855, "l2_weight_decay": 0.0, "warmup_fraction": 9.379359001242392e-05, "min_learning_rate_mult": 0.19998685977577255, "constant_fraction": 0.08346188110702168}, {"learning_rate": 0.00017100201743317335, "beta1": 0.9956214794311014, "beta2": 0.9991923525297128, "epsilon": 0.01022388627120098, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00011034213547817818, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6590435952828336}, {"learning_rate": 1.5682318768595324e-05, "beta1": 0.34680906910742937, "beta2": 0.9948589529521572, "epsilon": 106.90433580658714, "use_nesterov": false, "adamw_weight_decay": 0.0013279798820605064, "l2_weight_decay": 2.923147548175546e-05, "warmup_fraction": 0.0011295982118293554, "min_learning_rate_mult": 0.05407839194907621, "constant_fraction": 0.2781722169049672}, {"learning_rate": 0.10547997249069684, "beta1": 0.9886841585288761, "beta2": 0.9997738973034046, "epsilon": 1.6480207216808672e-05, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.02256345159513458, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.6282046774978968, "constant_fraction": 0.5721348046766757}, {"learning_rate": 1.64328942999653e-05, "beta1": 0.993387996427224, "beta2": 0.9999620159476585, "epsilon": 0.022562497171308385, "use_nesterov": true, "adamw_weight_decay": 0.00419784333615386, "l2_weight_decay": 6.546658749771756e-05, "warmup_fraction": 8.087904501966026e-05, "min_learning_rate_mult": 2.1205511025032255e-05, "constant_fraction": 0.8585285263708421}, {"learning_rate": 3.3162528624835805e-05, "beta1": 0.9956120907719097, "beta2": 0.21535698574815942, "epsilon": 0.04630646535588624, "use_nesterov": false, "adamw_weight_decay": 0.0784364624072841, "l2_weight_decay": 0.011494709821940903, "warmup_fraction": 0.01259218763004615, "min_learning_rate_mult": 0.00012311362862244774, "constant_fraction": 0.6935740475828108}, {"learning_rate": 4.098810449755443e-05, "beta1": 0.9894766963034324, "beta2": 0.8533433581799867, "epsilon": 11.472093018435986, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 3.3417072669312396e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.0525370332240066}, {"learning_rate": 0.003961368291154268, "beta1": 0.9986528171064025, "beta2": 0.19604653739447575, "epsilon": 1694.3106560496904, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00010124719992003593, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.007068289483845422, "constant_fraction": 0.008319008831747632}, {"learning_rate": 0.01681363728867728, "beta1": 0.9953289591445765, "beta2": 0.9788483221889567, "epsilon": 0.010390199705240575, "use_nesterov": false, "adamw_weight_decay": 0.0002824328402059881, "l2_weight_decay": 0.0, "warmup_fraction": 0.0002708604556725719, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7235605041502168}, {"learning_rate": 0.01822561988978418, "beta1": 0.9964140117448008, "beta2": 0.2627853332697778, "epsilon": 0.00010407120254290316, "use_nesterov": false, "adamw_weight_decay": 0.0002525633559085751, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.40413609371278203}, {"learning_rate": 1.072785201780718e-05, "beta1": 0.9940754839418592, "beta2": 0.9986577511407568, "epsilon": 1.2309747444248595e-05, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.05102872889676917, "warmup_fraction": 0.0002482434917312556, "min_learning_rate_mult": 0.39693881057616737, "constant_fraction": 0.9005904570636976}, {"learning_rate": 0.04974164749376038, "beta1": 0.7960729450057764, "beta2": 0.9999242075158137, "epsilon": 2.1257633257234935e-06, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.02347600194689407, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.2040127287079877, "constant_fraction": 0.9812602878237994}, {"learning_rate": 0.0003464277078587084, "beta1": 0.9980320957005094, "beta2": 0.9990468465965725, "epsilon": 4761.608191258724, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0058610011332698156, "warmup_fraction": 0.00024186678530480884, "min_learning_rate_mult": 0.0, "constant_fraction": 0.03654476937815232}, {"learning_rate": 0.020416903099275793, "beta1": 0.9636611791785369, "beta2": 0.9754446680654487, "epsilon": 119.6300982323418, "use_nesterov": false, "adamw_weight_decay": 0.007778179115232713, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5338925847323945}, {"learning_rate": 3.0443581653246438e-05, "beta1": 0.9815215979066545, "beta2": 0.9973566570128214, "epsilon": 0.0029400547303146526, "use_nesterov": true, "adamw_weight_decay": 2.127736574724868e-05, "l2_weight_decay": 0.001016907966862073, "warmup_fraction": 0.00016561167915649184, "min_learning_rate_mult": 0.0, "constant_fraction": 0.4252543490359195}, {"learning_rate": 0.0060971516920105785, "beta1": 0.981912330621328, "beta2": 0.9999779965623982, "epsilon": 0.016144110415182704, "use_nesterov": false, "adamw_weight_decay": 0.041218647519836754, "l2_weight_decay": 1.6533477605887808e-05, "warmup_fraction": 1.6477425094313484e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9387609968410683}, {"learning_rate": 0.3133546722367019, "beta1": 0.9276656538421847, "beta2": 0.8640827847027877, "epsilon": 489.94710615266246, "use_nesterov": false, "adamw_weight_decay": 0.004185501760672127, "l2_weight_decay": 0.0012255421580733253, "warmup_fraction": 2.4950998262765978e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6185365344115655}, {"learning_rate": 2.4835747250695835e-05, "beta1": 0.404811165729148, "beta2": 0.9999834417554397, "epsilon": 5.799462739972109e-05, "use_nesterov": false, "adamw_weight_decay": 3.6098897459139826e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.006028574250337154, "min_learning_rate_mult": 0.043681099465163506, "constant_fraction": 0.1320545069824156}, {"learning_rate": 2.3746888342412193e-05, "beta1": 0.9987295644755284, "beta2": 0.9974041545812405, "epsilon": 0.013610851235546492, "use_nesterov": false, "adamw_weight_decay": 0.00026740823959958487, "l2_weight_decay": 6.710402836169093e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6282613733492708}, {"learning_rate": 4.949613862297368e-05, "beta1": 0.7158323156529209, "beta2": 0.033028947116596874, "epsilon": 426.15246427789265, "use_nesterov": true, "adamw_weight_decay": 0.0003037380144814719, "l2_weight_decay": 0.0, "warmup_fraction": 2.2297870604431815e-05, "min_learning_rate_mult": 0.02505449538861154, "constant_fraction": 0.43710426738056496}, {"learning_rate": 0.012075433372865733, "beta1": 0.9799265178966712, "beta2": 0.9980265165335671, "epsilon": 5.0487758521217465, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.051388784841857056, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.42682649160783437}, {"learning_rate": 0.00019312759623570796, "beta1": 0.9938446493322962, "beta2": 0.9999821811394943, "epsilon": 2.9259401658749767e-05, "use_nesterov": true, "adamw_weight_decay": 0.0015969504697043058, "l2_weight_decay": 0.008668618085624302, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5308855842941667}, {"learning_rate": 6.879403652864611e-05, "beta1": 0.9612768347795299, "beta2": 0.9989947054099667, "epsilon": 0.9669781433167832, "use_nesterov": false, "adamw_weight_decay": 2.4896856391919995e-05, "l2_weight_decay": 0.09988985943493695, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.003196238294149325, "constant_fraction": 0.9946365692163901}, {"learning_rate": 9.607938235430516e-05, "beta1": 0.965365053579354, "beta2": 0.9999484282224528, "epsilon": 0.009550849450141313, "use_nesterov": false, "adamw_weight_decay": 0.0017599666492817312, "l2_weight_decay": 0.00012321083841963505, "warmup_fraction": 0.0010677243982637186, "min_learning_rate_mult": 0.40087937644039423, "constant_fraction": 0.888033316116464}, {"learning_rate": 0.04861112044313665, "beta1": 0.9977572814914633, "beta2": 0.9994165572341259, "epsilon": 62.303376585266506, "use_nesterov": false, "adamw_weight_decay": 0.00034897102974722216, "l2_weight_decay": 0.0, "warmup_fraction": 0.00016145413866186956, "min_learning_rate_mult": 0.04448932734186709, "constant_fraction": 0.6823237663882255}, {"learning_rate": 1.3006405291305291e-05, "beta1": 0.9975609492103915, "beta2": 0.9999815111586382, "epsilon": 3.86354522657321e-08, "use_nesterov": false, "adamw_weight_decay": 3.9650426342589896e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.877887057886451}, {"learning_rate": 0.2579193113574557, "beta1": 0.9980448288882778, "beta2": 0.5978340386570351, "epsilon": 0.017426954144305142, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 9.963400802618664e-05, "warmup_fraction": 1.0391523335761155e-05, "min_learning_rate_mult": 0.00021245519638832987, "constant_fraction": 0.09728149967822575}, {"learning_rate": 3.862103829668565e-05, "beta1": 0.9934593303568636, "beta2": 0.9968021483328294, "epsilon": 1.7518457019974233e-07, "use_nesterov": false, "adamw_weight_decay": 0.025986679803074602, "l2_weight_decay": 0.0, "warmup_fraction": 0.006796910591913633, "min_learning_rate_mult": 0.05010951187902261, "constant_fraction": 0.3944931716823634}, {"learning_rate": 0.8908079568295801, "beta1": 0.9901993059592025, "beta2": 0.9996521975572173, "epsilon": 11.77691529998012, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.007258532597445361, "warmup_fraction": 1.969850082614025e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6022664709334342}, {"learning_rate": 0.1313733112645222, "beta1": 0.9880256147571239, "beta2": 0.5875470299839893, "epsilon": 33.74651790445787, "use_nesterov": false, "adamw_weight_decay": 0.00684307868313034, "l2_weight_decay": 0.0226785799151996, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.00019409041014887095, "constant_fraction": 0.21311970607363095}, {"learning_rate": 0.00021350871797401136, "beta1": 0.9440345518516046, "beta2": 0.999661957705603, "epsilon": 137.26826378272293, "use_nesterov": false, "adamw_weight_decay": 0.0012605036140461443, "l2_weight_decay": 0.0, "warmup_fraction": 9.57658320632341e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.05221782951849718}, {"learning_rate": 0.00012457896779561247, "beta1": 0.85079687764218, "beta2": 0.3954000894032892, "epsilon": 0.00031989416333072783, "use_nesterov": false, "adamw_weight_decay": 0.00013170307230396232, "l2_weight_decay": 0.0, "warmup_fraction": 0.00014826031621245481, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2808157924057043}, {"learning_rate": 0.577016575820496, "beta1": 0.997063476527743, "beta2": 0.9696603139304905, "epsilon": 2.2476611563802582e-08, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00020103157127576186, "warmup_fraction": 9.077004162571812e-05, "min_learning_rate_mult": 0.0007785902064211627, "constant_fraction": 0.9208956011276351}, {"learning_rate": 0.26315246142521687, "beta1": 0.9893721981627972, "beta2": 0.9999737428759315, "epsilon": 0.6957361994486779, "use_nesterov": false, "adamw_weight_decay": 1.1652491852304488e-05, "l2_weight_decay": 3.053277139130936e-05, "warmup_fraction": 0.001069020201009015, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7031127195154002}, {"learning_rate": 3.0323653937969636e-05, "beta1": 0.9968877048088579, "beta2": 0.6285138542969244, "epsilon": 0.6002566475678418, "use_nesterov": false, "adamw_weight_decay": 3.0834715715859866e-05, "l2_weight_decay": 0.059023794889308534, "warmup_fraction": 4.348013832717239e-05, "min_learning_rate_mult": 0.001896043760646072, "constant_fraction": 0.9734511234297539}, {"learning_rate": 6.139569865963594e-05, "beta1": 0.9329333500544131, "beta2": 0.9997385416067177, "epsilon": 31.3981681886998, "use_nesterov": true, "adamw_weight_decay": 0.00016317305909176625, "l2_weight_decay": 3.1043352821319416e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.19920822876411293}, {"learning_rate": 0.0003952703931187249, "beta1": 0.9732880532488154, "beta2": 0.9999888275405534, "epsilon": 0.15798737219252978, "use_nesterov": false, "adamw_weight_decay": 0.011234995354883776, "l2_weight_decay": 0.0, "warmup_fraction": 4.830099011145886e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.648167160988611}, {"learning_rate": 0.03150095906367942, "beta1": 0.26899373918017777, "beta2": 0.998543252825601, "epsilon": 200.58996615329932, "use_nesterov": false, "adamw_weight_decay": 0.0013863060970781354, "l2_weight_decay": 0.00553706730307226, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.07671649521426675, "constant_fraction": 0.40324393350652243}, {"learning_rate": 0.005794805359350821, "beta1": 0.9892007470656901, "beta2": 0.9999844098035208, "epsilon": 0.0036448741796968475, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00021387978915418632, "warmup_fraction": 1.9075606765022015e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.32491602214194837}, {"learning_rate": 0.05719196123893273, "beta1": 0.7033977330672462, "beta2": 0.9999011562064379, "epsilon": 0.4172298783742308, "use_nesterov": true, "adamw_weight_decay": 0.0002875288886464492, "l2_weight_decay": 0.04401253064706936, "warmup_fraction": 0.0, "min_learning_rate_mult": 1.2330547179164033e-05, "constant_fraction": 0.17876088841722126}, {"learning_rate": 7.52122988553821e-05, "beta1": 0.7371967819616057, "beta2": 0.7162984492624632, "epsilon": 1.3232124048624796e-05, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0009573527005531541, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.017492255787383407, "constant_fraction": 0.9767119585290758}, {"learning_rate": 0.0015406005993107601, "beta1": 0.970060154665522, "beta2": 0.8167321913594777, "epsilon": 1.4141931237085585, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.000139631632601764, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8759007132656178}, {"learning_rate": 0.39594276302599046, "beta1": 0.46431724073510716, "beta2": 0.9555963606469141, "epsilon": 6.175440608927152e-08, "use_nesterov": true, "adamw_weight_decay": 0.00010692082341622225, "l2_weight_decay": 4.8072207080392245e-05, "warmup_fraction": 0.0005652163369297657, "min_learning_rate_mult": 4.8183803939382746e-05, "constant_fraction": 0.8302437162123829}, {"learning_rate": 0.02193107175699833, "beta1": 0.9886817037928741, "beta2": 0.3566638071823808, "epsilon": 17.99628001432311, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.0809535200157304e-05, "warmup_fraction": 0.07838584969886196, "min_learning_rate_mult": 0.07387338927402373, "constant_fraction": 0.7885327082480355}, {"learning_rate": 0.048678466081847296, "beta1": 0.8299392432062062, "beta2": 0.9999170069383932, "epsilon": 49.851957758557575, "use_nesterov": true, "adamw_weight_decay": 0.0005048298180732819, "l2_weight_decay": 0.0029464447595867397, "warmup_fraction": 3.364857653957725e-05, "min_learning_rate_mult": 0.01564207240308126, "constant_fraction": 0.4125871887657885}, {"learning_rate": 0.024804419983299943, "beta1": 0.9524412428144352, "beta2": 0.9997634278088273, "epsilon": 8.615457141414261, "use_nesterov": false, "adamw_weight_decay": 0.00034434359704627065, "l2_weight_decay": 0.0, "warmup_fraction": 0.038935597575983125, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2113275312368108}, {"learning_rate": 0.0011661847334958303, "beta1": 0.689202832636836, "beta2": 0.9994180685454838, "epsilon": 3094.976108953656, "use_nesterov": false, "adamw_weight_decay": 0.07127876655173955, "l2_weight_decay": 0.000735979131021045, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0005467740894548731, "constant_fraction": 0.15462270181330018}, {"learning_rate": 0.017788886459917715, "beta1": 0.37012915504854493, "beta2": 0.9999770127443623, "epsilon": 2473.969418559052, "use_nesterov": true, "adamw_weight_decay": 0.005858183590115538, "l2_weight_decay": 0.00035404478078600586, "warmup_fraction": 0.09146514000554933, "min_learning_rate_mult": 0.0, "constant_fraction": 0.963153800801189}, {"learning_rate": 0.00015489283825594137, "beta1": 0.9866846005407961, "beta2": 0.9999318524178559, "epsilon": 1.1587314664294012e-08, "use_nesterov": false, "adamw_weight_decay": 0.0001877326824643919, "l2_weight_decay": 0.00010800359652508568, "warmup_fraction": 0.016412137289416758, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7114587819600582}, {"learning_rate": 9.605663782699606e-05, "beta1": 0.9436301121196915, "beta2": 0.9994701415100034, "epsilon": 0.0004994278942314395, "use_nesterov": false, "adamw_weight_decay": 0.030237585187900824, "l2_weight_decay": 0.0028531432408763504, "warmup_fraction": 0.010839983775168332, "min_learning_rate_mult": 0.0, "constant_fraction": 0.42655378874055194}, {"learning_rate": 2.201081983920161e-05, "beta1": 0.2802010973638288, "beta2": 0.9999873977074707, "epsilon": 3.3355044942891463, "use_nesterov": false, "adamw_weight_decay": 0.030017852285536793, "l2_weight_decay": 0.0, "warmup_fraction": 0.034791860536920814, "min_learning_rate_mult": 0.00013614654484431422, "constant_fraction": 0.731675940083692}, {"learning_rate": 0.0031823028631218653, "beta1": 0.9898126003636096, "beta2": 0.5356175847881057, "epsilon": 131.52669222665708, "use_nesterov": false, "adamw_weight_decay": 0.004872515555089976, "l2_weight_decay": 4.272757087429652e-05, "warmup_fraction": 0.054255257150695665, "min_learning_rate_mult": 0.0, "constant_fraction": 0.11025191133309675}, {"learning_rate": 0.001494207794017953, "beta1": 0.021303787507392813, "beta2": 0.1925540164812085, "epsilon": 6928.717268281263, "use_nesterov": true, "adamw_weight_decay": 0.0003911467031183724, "l2_weight_decay": 0.0003420003709635163, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.6528930290905363, "constant_fraction": 0.12389617773610151}, {"learning_rate": 0.00030277915023599637, "beta1": 0.2563496698531522, "beta2": 0.9998785758815201, "epsilon": 0.8945084325919924, "use_nesterov": true, "adamw_weight_decay": 0.00010990181534104597, "l2_weight_decay": 0.01742262576143221, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6223997551991534}, {"learning_rate": 0.0014416646282616233, "beta1": 0.07578261406086817, "beta2": 0.8623248859818075, "epsilon": 9.753849671794715e-07, "use_nesterov": false, "adamw_weight_decay": 1.0108152291877258e-05, "l2_weight_decay": 0.008721987993488315, "warmup_fraction": 0.0018103928233481482, "min_learning_rate_mult": 0.0, "constant_fraction": 0.11776708676473246}, {"learning_rate": 8.510300110356963e-05, "beta1": 0.7072953057960158, "beta2": 0.9997108139984052, "epsilon": 2.1698956139439692e-07, "use_nesterov": true, "adamw_weight_decay": 0.0015285197847622039, "l2_weight_decay": 0.0, "warmup_fraction": 1.8883394554227552e-05, "min_learning_rate_mult": 0.8503026397530704, "constant_fraction": 0.35232841318304375}, {"learning_rate": 0.00010984664818641348, "beta1": 0.9867052318792776, "beta2": 0.9999788786560232, "epsilon": 9.852486407075835, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0001330081931501912, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.006376861887261894, "constant_fraction": 0.8261434597437463}, {"learning_rate": 0.010504643607658945, "beta1": 0.9872619405479538, "beta2": 0.999812816496904, "epsilon": 0.517423128310937, "use_nesterov": false, "adamw_weight_decay": 0.04985353150074078, "l2_weight_decay": 0.0, "warmup_fraction": 3.834493621474819e-05, "min_learning_rate_mult": 0.9769329575381616, "constant_fraction": 0.5077300712401756}, {"learning_rate": 4.600727666497762e-05, "beta1": 0.9958550720096591, "beta2": 0.9995017708222868, "epsilon": 1.007242873617808e-05, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 6.46320141938125e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0022711145732585564, "constant_fraction": 0.8310590939265197}, {"learning_rate": 1.2375528163477208e-05, "beta1": 0.9525597667096563, "beta2": 0.9997284771853032, "epsilon": 4.5071720635688654e-06, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.5239777335860706e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0007631857060271253, "constant_fraction": 0.9729769356698004}, {"learning_rate": 0.0005987688148282236, "beta1": 0.998515675318826, "beta2": 0.9997054975832605, "epsilon": 27.64927678564993, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.1247429515855267e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.279862561284709}, {"learning_rate": 0.005890503396275024, "beta1": 0.9988577501164313, "beta2": 0.9477111195477631, "epsilon": 1.9616986678661485e-06, "use_nesterov": false, "adamw_weight_decay": 0.0035290407782421845, "l2_weight_decay": 5.129422032102949e-05, "warmup_fraction": 0.031743372529347356, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9531909356176579}, {"learning_rate": 0.00013043019947775472, "beta1": 0.6184381722189567, "beta2": 0.9994057151352359, "epsilon": 5.7755507421823396e-05, "use_nesterov": false, "adamw_weight_decay": 0.010296116606084241, "l2_weight_decay": 0.000569334985961975, "warmup_fraction": 0.014360184808201766, "min_learning_rate_mult": 0.0, "constant_fraction": 0.25251538281125563}, {"learning_rate": 0.022946321211584835, "beta1": 0.9978999480277204, "beta2": 0.9376450751762991, "epsilon": 0.0010584739626311138, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.08888352462059074, "warmup_fraction": 0.0, "min_learning_rate_mult": 4.43006579951043e-05, "constant_fraction": 0.5231733962977629}, {"learning_rate": 6.29220185034161e-05, "beta1": 0.9988170147956796, "beta2": 0.9998719358425483, "epsilon": 190.97622314690813, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0027793729744707376, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7100105721674731}, {"learning_rate": 1.8427094081771736e-05, "beta1": 0.8935582195618407, "beta2": 0.9952756985574426, "epsilon": 0.4439195226169429, "use_nesterov": true, "adamw_weight_decay": 0.0046686916029813385, "l2_weight_decay": 0.00013807941536934912, "warmup_fraction": 0.06510051096864021, "min_learning_rate_mult": 0.30724094241679784, "constant_fraction": 0.7789922131354876}, {"learning_rate": 2.857561592202935e-05, "beta1": 0.9215393271589082, "beta2": 0.9998507385227254, "epsilon": 395.717750533544, "use_nesterov": true, "adamw_weight_decay": 0.010399959455151002, "l2_weight_decay": 0.0110901200078207, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.012032661514105576, "constant_fraction": 0.8672007273386679}, {"learning_rate": 0.00015773168572574166, "beta1": 0.9817092450777015, "beta2": 0.9969623187508487, "epsilon": 3393.143277512044, "use_nesterov": true, "adamw_weight_decay": 0.02798344992956961, "l2_weight_decay": 0.0, "warmup_fraction": 0.0007924819073886004, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5407043641089901}, {"learning_rate": 0.007694385363174248, "beta1": 0.9958339162046098, "beta2": 0.987267162682801, "epsilon": 4.2698552737846836e-05, "use_nesterov": true, "adamw_weight_decay": 0.0003276201902750138, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6497287066191215}, {"learning_rate": 0.00020765542767103075, "beta1": 0.8871537038189777, "beta2": 0.9827395228711121, "epsilon": 1172.874804463869, "use_nesterov": false, "adamw_weight_decay": 0.0022744234314257053, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5302564273682384}, {"learning_rate": 0.0003991638186555547, "beta1": 0.2306901580856201, "beta2": 0.999987078676567, "epsilon": 7.222436978288791e-07, "use_nesterov": false, "adamw_weight_decay": 0.00014418229156445004, "l2_weight_decay": 2.279902917445453e-05, "warmup_fraction": 1.671384868995393e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2208774754718682}, {"learning_rate": 0.009590087697570904, "beta1": 0.9976302821712957, "beta2": 0.8511971604394338, "epsilon": 5.2927161575009796e-06, "use_nesterov": true, "adamw_weight_decay": 0.014313567848309701, "l2_weight_decay": 1.1278697149647402e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5009273598783235}, {"learning_rate": 0.030365207106898783, "beta1": 0.9974536250541056, "beta2": 0.9744717509543515, "epsilon": 1915.182751582718, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 2.7591770584201992e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9103723652200597}, {"learning_rate": 0.005233595477897234, "beta1": 0.998955160901265, "beta2": 0.07591218684566603, "epsilon": 0.025833494807725135, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.009375922745501475, "warmup_fraction": 0.046656607827494735, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8240994375776223}, {"learning_rate": 0.012770631031878147, "beta1": 0.38649904475193597, "beta2": 0.9998718546700226, "epsilon": 0.005777884772228059, "use_nesterov": true, "adamw_weight_decay": 3.326691501364484e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.026736646254402464, "min_learning_rate_mult": 0.0, "constant_fraction": 0.349699198133289}, {"learning_rate": 0.5116004266122558, "beta1": 0.7724388880840333, "beta2": 0.9951815854322453, "epsilon": 0.000751632535395938, "use_nesterov": false, "adamw_weight_decay": 0.00014551256512862368, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 6.190760142523668e-05, "constant_fraction": 0.8266890447709249}, {"learning_rate": 0.0004514861824367785, "beta1": 0.9899832372130539, "beta2": 0.9999688283606577, "epsilon": 3.5237956886945847, "use_nesterov": false, "adamw_weight_decay": 0.00609411852938818, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.1896852986776437, "constant_fraction": 0.8926640588791567}, {"learning_rate": 0.013119517886312446, "beta1": 0.9927963819558989, "beta2": 0.9357410870320892, "epsilon": 0.0018522670532445666, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.001938619822372555, "warmup_fraction": 1.551229287670581e-05, "min_learning_rate_mult": 0.010489357255724283, "constant_fraction": 0.021037235595057546}, {"learning_rate": 0.0005281443686940033, "beta1": 0.9933138415964666, "beta2": 0.9949158066415243, "epsilon": 509.77815101322716, "use_nesterov": true, "adamw_weight_decay": 8.386552702057842e-05, "l2_weight_decay": 0.0016198254648905881, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.02057513082274052, "constant_fraction": 0.32204953468578446}, {"learning_rate": 0.1305091016343287, "beta1": 0.8826020214414212, "beta2": 0.9941811545775732, "epsilon": 3.0055901847864034e-07, "use_nesterov": true, "adamw_weight_decay": 0.002044839846827245, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.12389438803721448, "constant_fraction": 0.5813986523653657}, {"learning_rate": 7.04521659921647e-05, "beta1": 0.7486781227669241, "beta2": 0.9958249505705518, "epsilon": 1126.7979780510686, "use_nesterov": false, "adamw_weight_decay": 0.014656644009318329, "l2_weight_decay": 2.8137632705551205e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5607003808645289}, {"learning_rate": 0.0012790128821048381, "beta1": 0.936259517738355, "beta2": 0.9322098527390937, "epsilon": 3928.5583602535426, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.002181939595566497, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.32775626661970936}, {"learning_rate": 5.783860741630972e-05, "beta1": 0.998433797954564, "beta2": 0.9960920566773614, "epsilon": 0.003312618568264337, "use_nesterov": false, "adamw_weight_decay": 1.8346644157694453e-05, "l2_weight_decay": 0.019456711105677517, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.45306477151860614}, {"learning_rate": 0.00016165774483968177, "beta1": 0.9465706495512046, "beta2": 0.9999548825963597, "epsilon": 0.0011768179942789063, "use_nesterov": true, "adamw_weight_decay": 5.158368239981761e-05, "l2_weight_decay": 0.0048817276598762125, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.03712249616222533, "constant_fraction": 0.9207587516766743}, {"learning_rate": 0.352831849787503, "beta1": 0.6188339374142412, "beta2": 0.8686637058166911, "epsilon": 3.266830491654063e-08, "use_nesterov": true, "adamw_weight_decay": 6.232219183508962e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.00011261150841957426, "min_learning_rate_mult": 4.6331019553595926e-05, "constant_fraction": 0.39702487348297266}, {"learning_rate": 0.003089789692891654, "beta1": 0.9672236962848565, "beta2": 0.9999886445018071, "epsilon": 6.834010728036599, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.01505108565242218, "warmup_fraction": 0.0002563137020554592, "min_learning_rate_mult": 0.0, "constant_fraction": 0.23825621936525088}, {"learning_rate": 0.10600379582659981, "beta1": 0.11887093444756014, "beta2": 0.3594523733074714, "epsilon": 16.587088248836, "use_nesterov": false, "adamw_weight_decay": 0.02557798502210518, "l2_weight_decay": 0.025580964618158654, "warmup_fraction": 1.0594759020551306e-05, "min_learning_rate_mult": 0.0027424924017803516, "constant_fraction": 0.92660126007269}, {"learning_rate": 0.0025588219963979327, "beta1": 0.9643119731243632, "beta2": 0.9999884508143033, "epsilon": 66.43607404549985, "use_nesterov": false, "adamw_weight_decay": 2.0104007736191424e-05, "l2_weight_decay": 2.8980699648445675e-05, "warmup_fraction": 6.258965545952821e-05, "min_learning_rate_mult": 0.011572586276910464, "constant_fraction": 0.8662377806135502}, {"learning_rate": 0.0004817812886825056, "beta1": 0.9925847142148719, "beta2": 0.8166191614013536, "epsilon": 4072.582769627591, "use_nesterov": true, "adamw_weight_decay": 1.9526270584585065e-05, "l2_weight_decay": 0.08278655548238471, "warmup_fraction": 0.009680141324031138, "min_learning_rate_mult": 0.0, "constant_fraction": 0.33831908664927823}, {"learning_rate": 0.004733881608973759, "beta1": 0.9948343993970171, "beta2": 0.9190104268663657, "epsilon": 2019.4354820772685, "use_nesterov": false, "adamw_weight_decay": 0.0006947507217143738, "l2_weight_decay": 0.00032177729876473255, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.22924040900363118}, {"learning_rate": 1.0187554967177508e-05, "beta1": 0.9880675956045214, "beta2": 0.9983158894348738, "epsilon": 3645.088586856746, "use_nesterov": false, "adamw_weight_decay": 0.005098422074426053, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.02838159599630548, "constant_fraction": 0.5012465900981609}, {"learning_rate": 0.019070379030985633, "beta1": 0.9734326202953241, "beta2": 0.9853745989905871, "epsilon": 0.0012231201782433585, "use_nesterov": false, "adamw_weight_decay": 2.285643766545676e-05, "l2_weight_decay": 1.5715071450241585e-05, "warmup_fraction": 0.020226632608851793, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8137010782330665}, {"learning_rate": 5.569151363094566e-05, "beta1": 0.9903656483477754, "beta2": 0.9993190970321469, "epsilon": 212.59787157314165, "use_nesterov": true, "adamw_weight_decay": 0.006180238125869742, "l2_weight_decay": 0.0, "warmup_fraction": 0.00029220047482062867, "min_learning_rate_mult": 0.23349642042625637, "constant_fraction": 0.6567783877345781}, {"learning_rate": 0.003563342086350844, "beta1": 0.6506994974589638, "beta2": 0.9997929369490232, "epsilon": 5.101366244854219e-06, "use_nesterov": false, "adamw_weight_decay": 0.03276996074195554, "l2_weight_decay": 0.0012697563303100963, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7462930319849224}, {"learning_rate": 2.3296631358606585e-05, "beta1": 0.9886969745696502, "beta2": 0.999920849109931, "epsilon": 0.31353928667616215, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0002443053286614798, "warmup_fraction": 1.0238154051617973e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5266908495672629}, {"learning_rate": 0.007285560688074645, "beta1": 0.9976506067077398, "beta2": 0.9997818452197155, "epsilon": 0.0010813660994243566, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0012100898706884783, "warmup_fraction": 3.096729466977915e-05, "min_learning_rate_mult": 0.9513930663254565, "constant_fraction": 0.30390507642167786}, {"learning_rate": 0.013153392012060285, "beta1": 0.9909303642636685, "beta2": 0.9998807033910283, "epsilon": 0.007419100798081219, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0009019406802237848, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.3406141570173191}, {"learning_rate": 1.4644368208234374e-05, "beta1": 0.9921700798272415, "beta2": 0.9992965213212038, "epsilon": 1336.9210859666969, "use_nesterov": true, "adamw_weight_decay": 0.00030844859112219363, "l2_weight_decay": 0.0, "warmup_fraction": 0.0005245037434994419, "min_learning_rate_mult": 0.0007941855785639235, "constant_fraction": 0.302878197173426}, {"learning_rate": 0.03434728958921487, "beta1": 0.9985108429534802, "beta2": 0.995856522802259, "epsilon": 504.70058796634277, "use_nesterov": true, "adamw_weight_decay": 2.7542866526429747e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.006434743750985726, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6735670024230126}, {"learning_rate": 0.022642200416011712, "beta1": 0.9691516670830862, "beta2": 0.6163700826390757, "epsilon": 0.0001660721610809923, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0019074491883267325, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2851836662863304}, {"learning_rate": 0.05060681862496109, "beta1": 0.12076865910702783, "beta2": 0.998225735475007, "epsilon": 81.33244258257419, "use_nesterov": true, "adamw_weight_decay": 0.0006562804332738368, "l2_weight_decay": 0.00011660965866164784, "warmup_fraction": 0.0017848614770944041, "min_learning_rate_mult": 0.0, "constant_fraction": 0.32889954172598546}, {"learning_rate": 2.0599494037383947e-05, "beta1": 0.9805493474523704, "beta2": 0.999632428087089, "epsilon": 8.117824144603973e-07, "use_nesterov": true, "adamw_weight_decay": 5.483001811009986e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.08793676205903508, "min_learning_rate_mult": 1.618874513673556e-05, "constant_fraction": 0.8850577344123829}, {"learning_rate": 0.001003407277482095, "beta1": 0.995524101879756, "beta2": 0.2581332197219759, "epsilon": 0.0009290232531632786, "use_nesterov": false, "adamw_weight_decay": 7.989170333371477e-05, "l2_weight_decay": 0.007069797483506982, "warmup_fraction": 0.010205730609724625, "min_learning_rate_mult": 0.7226956589052433, "constant_fraction": 0.2021062485943108}, {"learning_rate": 0.04099079318367949, "beta1": 0.9574218491474271, "beta2": 0.9999543179432636, "epsilon": 0.05545726186055952, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.007428124655554959, "warmup_fraction": 6.561087316028967e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8123081547698381}, {"learning_rate": 1.1946871628331291e-05, "beta1": 0.9983682674450302, "beta2": 0.9999531578748457, "epsilon": 0.00012422341854545314, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.08771535641774188, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9972960466461379}, {"learning_rate": 2.4704197391033307e-05, "beta1": 0.9987819537739016, "beta2": 0.5212112575055801, "epsilon": 0.18325776169718114, "use_nesterov": false, "adamw_weight_decay": 0.013820035998276217, "l2_weight_decay": 0.03674379280573783, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2684965751826972}, {"learning_rate": 0.00021657004870542847, "beta1": 0.9484744779967806, "beta2": 0.9997315353119711, "epsilon": 0.014749098196677484, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0006679786695234719, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.28656933975011895, "constant_fraction": 0.024691683426002253}, {"learning_rate": 0.17689523645862829, "beta1": 0.9791286280449008, "beta2": 0.9999372606145436, "epsilon": 2.0896032207999677e-06, "use_nesterov": false, "adamw_weight_decay": 0.08760851761454731, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.028028971728077685, "constant_fraction": 0.7817994241368444}, {"learning_rate": 0.013731299824189719, "beta1": 0.9978103589855064, "beta2": 0.788511526521836, "epsilon": 8113.4268983305055, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.3243605633396325e-05, "warmup_fraction": 0.0001232706564369459, "min_learning_rate_mult": 0.03527585890510545, "constant_fraction": 0.9844677967375304}, {"learning_rate": 0.10855076646001202, "beta1": 0.9963313200955763, "beta2": 0.9788150310652108, "epsilon": 1.9265237451352024e-07, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.3054188705318482e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5959636547761435}, {"learning_rate": 2.1474860655703872e-05, "beta1": 0.9629300766827747, "beta2": 0.9999819065971989, "epsilon": 0.0019104902168881966, "use_nesterov": false, "adamw_weight_decay": 1.4243767762700389e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0025696414591907996, "constant_fraction": 0.4769488980103965}, {"learning_rate": 0.0018140854679486182, "beta1": 0.9981699658789185, "beta2": 0.9981965036300974, "epsilon": 2.247218488972721, "use_nesterov": true, "adamw_weight_decay": 0.0001971790220707151, "l2_weight_decay": 1.861999317345307e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9230934764736358}, {"learning_rate": 0.02653650343960735, "beta1": 0.6358379230234724, "beta2": 0.9997831335300593, "epsilon": 1.760179045294452e-05, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.03678355359307519, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.04991501896198063, "constant_fraction": 0.4273614022958976}, {"learning_rate": 0.014358466822012996, "beta1": 0.6234007169103588, "beta2": 0.9989304248582006, "epsilon": 7.144343291357533e-06, "use_nesterov": true, "adamw_weight_decay": 1.0754517338560414e-05, "l2_weight_decay": 0.00012967488921458036, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9744800232598811}, {"learning_rate": 0.11649725457123303, "beta1": 0.6329408238196852, "beta2": 0.9849398910766165, "epsilon": 13.654176429425696, "use_nesterov": true, "adamw_weight_decay": 0.018162808852589307, "l2_weight_decay": 4.279356170527052e-05, "warmup_fraction": 6.397043228124866e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9032828811297953}, {"learning_rate": 2.204397732001797e-05, "beta1": 0.9852944475572655, "beta2": 0.9994315523928975, "epsilon": 2309.446664102062, "use_nesterov": false, "adamw_weight_decay": 0.0003968544315500345, "l2_weight_decay": 1.029424673456062e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.01064678842665257, "constant_fraction": 0.24162206943089315}, {"learning_rate": 0.0006460629712909633, "beta1": 0.9968563183750384, "beta2": 0.9931239505869617, "epsilon": 0.31985739720901785, "use_nesterov": true, "adamw_weight_decay": 2.8112419577409957e-05, "l2_weight_decay": 0.010616057725775967, "warmup_fraction": 0.02181173792837917, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2319508971480423}, {"learning_rate": 0.0007206182252614333, "beta1": 0.9975953246312094, "beta2": 0.9972105281335492, "epsilon": 1405.3363993029234, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 2.2035994991047492e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 5.3916220899358806e-05, "constant_fraction": 0.5727931383155452}, {"learning_rate": 0.012849103622993421, "beta1": 0.976803143075097, "beta2": 0.7501854101007671, "epsilon": 4.139061013529382e-06, "use_nesterov": true, "adamw_weight_decay": 4.586168950389506e-05, "l2_weight_decay": 0.0, "warmup_fraction": 1.62563887680943e-05, "min_learning_rate_mult": 0.34183403387884215, "constant_fraction": 0.30245739848120434}, {"learning_rate": 0.0015172843278536, "beta1": 0.9968308823375459, "beta2": 0.9966720760921219, "epsilon": 1.881944272194643e-08, "use_nesterov": false, "adamw_weight_decay": 8.365117327739057e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.9661643758902908, "constant_fraction": 0.7211315039117491}, {"learning_rate": 0.14150168526038087, "beta1": 0.9985911690879962, "beta2": 0.97524815504287, "epsilon": 0.01915875213955494, "use_nesterov": true, "adamw_weight_decay": 0.00017857064265427967, "l2_weight_decay": 0.0, "warmup_fraction": 0.0042791257691429194, "min_learning_rate_mult": 0.0, "constant_fraction": 0.834640208346516}, {"learning_rate": 0.3772912719973449, "beta1": 0.8855959409141514, "beta2": 0.9999895316655832, "epsilon": 2.5004949285842082e-05, "use_nesterov": false, "adamw_weight_decay": 0.00015377591669889955, "l2_weight_decay": 0.07212223058031628, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8880167877552909}, {"learning_rate": 0.02003537853667577, "beta1": 0.3991926475928692, "beta2": 0.9720812793874318, "epsilon": 0.0890517350567906, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0011293602689962181, "warmup_fraction": 0.032410463260400035, "min_learning_rate_mult": 0.13210039567860032, "constant_fraction": 0.5493173255826206}, {"learning_rate": 7.015489351313324e-05, "beta1": 0.9680519833045824, "beta2": 0.9999526392039226, "epsilon": 0.002941223101881354, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0005818951243356588, "warmup_fraction": 1.9450547725632277e-05, "min_learning_rate_mult": 0.0133775908170019, "constant_fraction": 0.8021024153907496}, {"learning_rate": 0.0024698693084121877, "beta1": 0.010219941835986623, "beta2": 0.9995957801968881, "epsilon": 0.008476262637359677, "use_nesterov": false, "adamw_weight_decay": 0.0003435909934057015, "l2_weight_decay": 0.0, "warmup_fraction": 0.00011163971690248991, "min_learning_rate_mult": 4.4968188994318344e-05, "constant_fraction": 0.8899259468945401}, {"learning_rate": 1.3329419215859969e-05, "beta1": 0.8619801902791664, "beta2": 0.9991210536706406, "epsilon": 4.453166993056327e-08, "use_nesterov": false, "adamw_weight_decay": 1.2228351593398876e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.006329720579210683, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2139462421860424}, {"learning_rate": 1.352245442521151e-05, "beta1": 0.9064754555080397, "beta2": 0.9993920206837403, "epsilon": 0.0006070645629568548, "use_nesterov": true, "adamw_weight_decay": 0.00011644584985050526, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.3652491014072189}, {"learning_rate": 0.002138795833222322, "beta1": 0.9954368556405772, "beta2": 0.9846192381423001, "epsilon": 110.11081678434277, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 2.6450478348552967e-05, "warmup_fraction": 0.0008327094961723411, "min_learning_rate_mult": 8.869363558660814e-05, "constant_fraction": 0.4041811368888554}, {"learning_rate": 0.2399857845490895, "beta1": 0.9028233147852677, "beta2": 0.9826217111214133, "epsilon": 0.0017425882639459883, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.0453751980354597e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0018140974010233272, "constant_fraction": 0.1616539540662344}, {"learning_rate": 0.00010300082100898636, "beta1": 0.9982994810839314, "beta2": 0.9999424651510742, "epsilon": 263.99651251832825, "use_nesterov": true, "adamw_weight_decay": 1.0000270668347852e-05, "l2_weight_decay": 0.0002496227299064328, "warmup_fraction": 0.0, "min_learning_rate_mult": 1.6216239722877137e-05, "constant_fraction": 0.3409108152700524}, {"learning_rate": 0.0006071111499729708, "beta1": 0.9978292139415897, "beta2": 0.9998437712578124, "epsilon": 9.548826073411876, "use_nesterov": false, "adamw_weight_decay": 8.513728024367128e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0014867476848873095, "constant_fraction": 0.314490694797917}, {"learning_rate": 8.922548151347963e-05, "beta1": 0.9962787381597007, "beta2": 0.9807438280252605, "epsilon": 7.351346456988741e-05, "use_nesterov": false, "adamw_weight_decay": 0.0006815851465429245, "l2_weight_decay": 0.06907050330416553, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.036682088469951864, "constant_fraction": 0.3470408271796336}, {"learning_rate": 0.04266362473165651, "beta1": 0.8857101811328182, "beta2": 0.9996376174878505, "epsilon": 256.6628587063888, "use_nesterov": true, "adamw_weight_decay": 0.003134406638711066, "l2_weight_decay": 1.2185427427666246e-05, "warmup_fraction": 9.952094279247026e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.02821314558307486}, {"learning_rate": 0.06409490040546671, "beta1": 0.730941654400499, "beta2": 0.87540839317285, "epsilon": 1.2587299956669988e-06, "use_nesterov": false, "adamw_weight_decay": 0.04204943879173707, "l2_weight_decay": 0.0009250637539330359, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.17057867738053611, "constant_fraction": 0.53541873344036}, {"learning_rate": 0.42688713784047105, "beta1": 0.9986197125545375, "beta2": 0.9992127747691136, "epsilon": 1.0925608116995007, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.08597985026927779, "warmup_fraction": 0.00013434406799819984, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5689046342814874}, {"learning_rate": 0.00015974934324843496, "beta1": 0.985687655356826, "beta2": 0.9643578137084248, "epsilon": 7.532671100715907, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.021607043535989686, "warmup_fraction": 0.0007840154408063339, "min_learning_rate_mult": 5.551172569866984e-05, "constant_fraction": 0.8986961353535586}, {"learning_rate": 0.0005567620060275389, "beta1": 0.9940318656707496, "beta2": 0.9994528139405701, "epsilon": 1.822692250511652e-08, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 3.8342941788477865e-05, "warmup_fraction": 0.013326725557393919, "min_learning_rate_mult": 0.02317149417930859, "constant_fraction": 0.6035034076657411}, {"learning_rate": 1.589416052937753e-05, "beta1": 0.9855857613698726, "beta2": 0.9870173364478605, "epsilon": 9.255484331036625, "use_nesterov": false, "adamw_weight_decay": 0.0006200690072394709, "l2_weight_decay": 0.0013598110314059814, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0034512789566061974, "constant_fraction": 0.15181779044798793}, {"learning_rate": 0.011007458436958086, "beta1": 0.9441849537244239, "beta2": 0.9857721546887958, "epsilon": 2628.993096278863, "use_nesterov": false, "adamw_weight_decay": 0.000556039851798913, "l2_weight_decay": 0.0006089127850131019, "warmup_fraction": 0.00020755982394506748, "min_learning_rate_mult": 0.0008353227153256618, "constant_fraction": 0.8355415486436083}, {"learning_rate": 0.06843196916951902, "beta1": 0.9964923827851797, "beta2": 0.8725780088584474, "epsilon": 8.501460881792569e-07, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.001826663115897076, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0003075919525396029, "constant_fraction": 0.8932269057406426}, {"learning_rate": 0.0010868257083839232, "beta1": 0.9635217867382794, "beta2": 0.9300556006263305, "epsilon": 5.414554467127426, "use_nesterov": true, "adamw_weight_decay": 0.017415845783576644, "l2_weight_decay": 0.006208302493833865, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.09017378866275738}, {"learning_rate": 0.00020841846099653972, "beta1": 0.9746519349115311, "beta2": 0.9999855237987584, "epsilon": 2.7223915406376777, "use_nesterov": false, "adamw_weight_decay": 0.02108475976295528, "l2_weight_decay": 0.0, "warmup_fraction": 0.0004880208308312825, "min_learning_rate_mult": 0.011993756462448869, "constant_fraction": 0.7081918510735364}, {"learning_rate": 0.00026719613653264796, "beta1": 0.6542527218423633, "beta2": 0.9958476433742125, "epsilon": 4182.633004231385, "use_nesterov": true, "adamw_weight_decay": 1.7524576927664273e-05, "l2_weight_decay": 1.3116899577813986e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.3852505827805017}, {"learning_rate": 0.0009014165068353689, "beta1": 0.8351673129642802, "beta2": 0.9964329058374228, "epsilon": 0.07193334658925629, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 4.09497947933838e-05, "warmup_fraction": 2.1605487469111003e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8221339836425658}, {"learning_rate": 0.03838437769761072, "beta1": 0.9623877680701158, "beta2": 0.9976848885505908, "epsilon": 1.3943187972742694, "use_nesterov": false, "adamw_weight_decay": 4.808046365525927e-05, "l2_weight_decay": 0.007648572521030508, "warmup_fraction": 0.023531020673288557, "min_learning_rate_mult": 0.002482211913454252, "constant_fraction": 0.09340410414027112}, {"learning_rate": 0.0018310597758847307, "beta1": 0.9463045735656658, "beta2": 0.974103950854208, "epsilon": 406.83549840328226, "use_nesterov": false, "adamw_weight_decay": 0.003607323495504147, "l2_weight_decay": 0.0, "warmup_fraction": 0.0002941576308834853, "min_learning_rate_mult": 0.0011275664438969773, "constant_fraction": 0.1347183836160647}, {"learning_rate": 0.0004292931680133512, "beta1": 0.981492503451861, "beta2": 0.9981384152074669, "epsilon": 3.42971998374097e-06, "use_nesterov": true, "adamw_weight_decay": 0.03200491456352602, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 6.960325228963801e-05, "constant_fraction": 0.7818989614202054}, {"learning_rate": 0.0001275542789861206, "beta1": 0.8009456028147846, "beta2": 0.4226819719098467, "epsilon": 0.00034298405280589286, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.014549248602609465, "warmup_fraction": 9.416210756726392e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8444692886148875}, {"learning_rate": 0.2141493298187379, "beta1": 0.9815466031371648, "beta2": 0.6762709573902203, "epsilon": 1.1372661697685784e-05, "use_nesterov": false, "adamw_weight_decay": 0.01743568455230432, "l2_weight_decay": 0.0, "warmup_fraction": 0.08113417903677544, "min_learning_rate_mult": 0.03696052478579316, "constant_fraction": 0.89998056148648}, {"learning_rate": 7.837491216614881e-05, "beta1": 0.9846332944594632, "beta2": 0.9850495320148129, "epsilon": 9.21484677465573e-08, "use_nesterov": false, "adamw_weight_decay": 0.00022020942768883337, "l2_weight_decay": 0.0077899233370320705, "warmup_fraction": 0.014186374886964644, "min_learning_rate_mult": 0.00015071874403512208, "constant_fraction": 0.3830379523652887}, {"learning_rate": 6.286463573710029e-05, "beta1": 0.9347088837512233, "beta2": 0.9999389624123984, "epsilon": 1.1957058640532836e-07, "use_nesterov": false, "adamw_weight_decay": 1.5228434431254436e-05, "l2_weight_decay": 0.025964139730566445, "warmup_fraction": 0.06980429898672831, "min_learning_rate_mult": 0.01096314236230983, "constant_fraction": 0.20566535100186456}, {"learning_rate": 0.0188565717226975, "beta1": 0.9699834937520305, "beta2": 0.7268418436832087, "epsilon": 92.87745541510577, "use_nesterov": true, "adamw_weight_decay": 2.9835241879067023e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8064789164945345}, {"learning_rate": 0.1640557154897957, "beta1": 0.9943951562401887, "beta2": 0.8170993494191316, "epsilon": 549.0212676034376, "use_nesterov": false, "adamw_weight_decay": 0.00018425638891859524, "l2_weight_decay": 0.0, "warmup_fraction": 0.004180892065913894, "min_learning_rate_mult": 0.0, "constant_fraction": 0.3787110870754006}, {"learning_rate": 1.3714073056514315e-05, "beta1": 0.8887304614483846, "beta2": 0.20549256168047603, "epsilon": 1.3423349985589102e-08, "use_nesterov": false, "adamw_weight_decay": 0.014217883926007159, "l2_weight_decay": 1.207979916260035e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.20879926594376064}, {"learning_rate": 0.0002438059057599606, "beta1": 0.9759513228744442, "beta2": 0.9994811378842076, "epsilon": 5.549992169296717, "use_nesterov": true, "adamw_weight_decay": 0.0006053986226095007, "l2_weight_decay": 0.0, "warmup_fraction": 0.0008039678181514361, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5274828714083104}, {"learning_rate": 0.01229252580827133, "beta1": 0.9905606305020153, "beta2": 0.7477998117102128, "epsilon": 0.006374875003484812, "use_nesterov": true, "adamw_weight_decay": 5.8425716080259796e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.00523832428555378, "min_learning_rate_mult": 0.5085922210737696, "constant_fraction": 0.5112159955127821}, {"learning_rate": 1.060559293510721e-05, "beta1": 0.8147863649860121, "beta2": 0.5633785270463161, "epsilon": 2.3680132685503816e-06, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.06298327199483783, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.6511187844524452, "constant_fraction": 0.13565424988114738}, {"learning_rate": 0.001265308744923699, "beta1": 0.9984329434572348, "beta2": 0.6882873685855204, "epsilon": 1.4911771251036992e-08, "use_nesterov": true, "adamw_weight_decay": 0.024448014314732352, "l2_weight_decay": 5.458224255135949e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 9.107901905458084e-05, "constant_fraction": 0.4905865308340728}, {"learning_rate": 0.4494634240745159, "beta1": 0.9989939988672184, "beta2": 0.999952610669329, "epsilon": 1290.028599597863, "use_nesterov": true, "adamw_weight_decay": 0.0002706936259105551, "l2_weight_decay": 0.01203473831925615, "warmup_fraction": 0.0836870235925519, "min_learning_rate_mult": 1.7547428173637906e-05, "constant_fraction": 0.9775163618607078}, {"learning_rate": 0.054338069986544335, "beta1": 0.961316050137838, "beta2": 0.999845835861978, "epsilon": 4.082006773642775, "use_nesterov": false, "adamw_weight_decay": 2.7536864056937692e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.3078036430548621}, {"learning_rate": 0.000189412800434368, "beta1": 0.9820894539520201, "beta2": 0.9932278636405862, "epsilon": 0.0004961225910502752, "use_nesterov": false, "adamw_weight_decay": 0.0004049521600189918, "l2_weight_decay": 0.055371156790829, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.00013504948412104605, "constant_fraction": 0.9904455879735135}, {"learning_rate": 0.021276538650750697, "beta1": 0.9914156788408683, "beta2": 0.9992754122900774, "epsilon": 490.1366470608099, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.09471522924952229, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.10149731426715947, "constant_fraction": 0.7604221322906649}, {"learning_rate": 0.0005084212380356813, "beta1": 0.7343296277237374, "beta2": 0.9995504995153809, "epsilon": 185.97811326251977, "use_nesterov": false, "adamw_weight_decay": 0.014143079142615294, "l2_weight_decay": 0.0, "warmup_fraction": 0.009810381725808566, "min_learning_rate_mult": 0.011588771118171625, "constant_fraction": 0.6344328596036437}, {"learning_rate": 0.006833489732879659, "beta1": 0.8250563393578071, "beta2": 0.9999581911129557, "epsilon": 0.426677018638597, "use_nesterov": true, "adamw_weight_decay": 0.04729329658614482, "l2_weight_decay": 0.0, "warmup_fraction": 4.48721127039906e-05, "min_learning_rate_mult": 0.00023889991949726085, "constant_fraction": 0.3155378215975557}, {"learning_rate": 0.004672080494458792, "beta1": 0.9951692398104693, "beta2": 0.9999866031170666, "epsilon": 0.0006364148138411633, "use_nesterov": false, "adamw_weight_decay": 2.081970926401394e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0008151948793410112, "min_learning_rate_mult": 0.10092081606357775, "constant_fraction": 0.5829961050787303}, {"learning_rate": 0.36762828763574384, "beta1": 0.9689995966793754, "beta2": 0.9936230220006511, "epsilon": 3.0662693462866235, "use_nesterov": false, "adamw_weight_decay": 0.0019517958954248188, "l2_weight_decay": 0.022217964452361183, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.08001615631255128, "constant_fraction": 0.13343874127911848}, {"learning_rate": 0.06373246201181457, "beta1": 0.11601287174255848, "beta2": 0.9998263518360175, "epsilon": 0.002486874650756026, "use_nesterov": true, "adamw_weight_decay": 0.0017902396805127103, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.023068243472714123, "constant_fraction": 0.764351478873437}, {"learning_rate": 0.00018594089746958292, "beta1": 0.9837901724582166, "beta2": 0.9937117960395404, "epsilon": 0.4352754301020101, "use_nesterov": true, "adamw_weight_decay": 1.596490445598246e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.00033463686312915525, "min_learning_rate_mult": 0.0, "constant_fraction": 0.4812290455641287}, {"learning_rate": 0.3899798980395588, "beta1": 0.4124710201633499, "beta2": 0.9999652103445403, "epsilon": 1.1952024608860046e-07, "use_nesterov": true, "adamw_weight_decay": 3.2149053494561164e-05, "l2_weight_decay": 1.1197536854115965e-05, "warmup_fraction": 0.000523064001677042, "min_learning_rate_mult": 0.07011725604498015, "constant_fraction": 0.8673540506855577}, {"learning_rate": 1.0874176242965358e-05, "beta1": 0.995297202123257, "beta2": 0.963525753572908, "epsilon": 269.2948455478641, "use_nesterov": false, "adamw_weight_decay": 0.014226528577608762, "l2_weight_decay": 0.0, "warmup_fraction": 3.6521529668847565e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7317015415560723}, {"learning_rate": 0.0008150312235890308, "beta1": 0.9934775282849007, "beta2": 0.9998070607965452, "epsilon": 9.353736269300486, "use_nesterov": false, "adamw_weight_decay": 0.026245180989948252, "l2_weight_decay": 0.0, "warmup_fraction": 0.0013372282470021223, "min_learning_rate_mult": 0.0, "constant_fraction": 0.14934027795962324}, {"learning_rate": 0.30530720156454677, "beta1": 0.9478693175947703, "beta2": 0.9999866256329795, "epsilon": 0.0034563296864741568, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 9.756274027254559e-05, "warmup_fraction": 0.00019283275892975388, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8234521863097528}, {"learning_rate": 4.2579318309278065e-05, "beta1": 0.6799876069295989, "beta2": 0.9998964176644798, "epsilon": 1418.1854397908235, "use_nesterov": false, "adamw_weight_decay": 2.5937378244153805e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.47089046912404586}, {"learning_rate": 1.4152196134383385e-05, "beta1": 0.9966182314829194, "beta2": 0.9999463685059137, "epsilon": 0.00283042534635409, "use_nesterov": true, "adamw_weight_decay": 0.048726333093074385, "l2_weight_decay": 0.0025097662507584054, "warmup_fraction": 0.009066051218919563, "min_learning_rate_mult": 0.00077204282886209, "constant_fraction": 0.153033086788677}, {"learning_rate": 0.5266653804162006, "beta1": 0.9903068846887942, "beta2": 0.8832576057083934, "epsilon": 0.028711644455143383, "use_nesterov": true, "adamw_weight_decay": 1.3064897784927625e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.000892592061231595, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6420708911553392}, {"learning_rate": 0.40231612834830355, "beta1": 0.9911476867450913, "beta2": 0.9999488495348781, "epsilon": 0.017958832870815882, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.08648235291783132, "warmup_fraction": 4.980323555107475e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.22494868766944742}, {"learning_rate": 0.01389248506050092, "beta1": 0.9986165275889155, "beta2": 0.7626642629787579, "epsilon": 21.849291451901717, "use_nesterov": true, "adamw_weight_decay": 1.8157769148531326e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.11090082417975489, "constant_fraction": 0.5794964656319875}, {"learning_rate": 0.009546779105228774, "beta1": 0.9390659255439757, "beta2": 0.9984774419039188, "epsilon": 0.9213553242321647, "use_nesterov": false, "adamw_weight_decay": 3.2347915016466006e-05, "l2_weight_decay": 0.00972311402960836, "warmup_fraction": 0.014195826128596269, "min_learning_rate_mult": 2.4629553095453458e-05, "constant_fraction": 0.5675440072339806}, {"learning_rate": 2.021509342033358e-05, "beta1": 0.9986991895734055, "beta2": 0.9999806862849991, "epsilon": 1.0089143534041531e-08, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 8.458981921567617e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.432407703197931}, {"learning_rate": 1.184034772486334e-05, "beta1": 0.9192696675614204, "beta2": 0.1041417296032836, "epsilon": 2484.6483506712198, "use_nesterov": false, "adamw_weight_decay": 1.4975930803782868e-05, "l2_weight_decay": 0.000167492352800462, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.14408933366397425}, {"learning_rate": 1.25062301659427e-05, "beta1": 0.889640976911185, "beta2": 0.9997104441202677, "epsilon": 7.141797620684109, "use_nesterov": false, "adamw_weight_decay": 0.006984643910203526, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.04558457470556743}, {"learning_rate": 4.405323376896904e-05, "beta1": 0.965556793132629, "beta2": 0.9999759295787167, "epsilon": 0.0005463406511701247, "use_nesterov": true, "adamw_weight_decay": 0.011741506919218329, "l2_weight_decay": 0.004674301534645338, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7579739580537421}, {"learning_rate": 2.6216241639510902e-05, "beta1": 0.9948665467475017, "beta2": 0.9681942064132645, "epsilon": 7.137790139550873e-07, "use_nesterov": true, "adamw_weight_decay": 0.00013059533867719914, "l2_weight_decay": 0.0, "warmup_fraction": 0.007242617031202112, "min_learning_rate_mult": 0.003032434236952092, "constant_fraction": 0.1690190116490895}, {"learning_rate": 0.00046639881805850416, "beta1": 0.25228361904895147, "beta2": 0.9075675399065339, "epsilon": 0.008415982413435252, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.007751905871925067, "warmup_fraction": 0.06363354603838955, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7106993279144725}, {"learning_rate": 0.020893302386384732, "beta1": 0.8422755725867572, "beta2": 0.9940049466907808, "epsilon": 5363.516781353384, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.019037370893546852, "warmup_fraction": 0.08130591353500671, "min_learning_rate_mult": 0.5538412677708302, "constant_fraction": 0.14561123778988616}, {"learning_rate": 0.007209119194148017, "beta1": 0.987079547356025, "beta2": 0.999923989079075, "epsilon": 583.4968517255953, "use_nesterov": false, "adamw_weight_decay": 3.3160125948078106e-05, "l2_weight_decay": 0.0, "warmup_fraction": 9.410894504691244e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7102286006265354}, {"learning_rate": 0.0003067901383701882, "beta1": 0.9624055947251599, "beta2": 0.9916082341174591, "epsilon": 20.365279945524268, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.06317267882739748, "warmup_fraction": 0.00025549519348324896, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5102729071735923}, {"learning_rate": 0.603957574788857, "beta1": 0.9943960087553219, "beta2": 0.9971816292913542, "epsilon": 0.002738703331651808, "use_nesterov": false, "adamw_weight_decay": 0.0011869942250665993, "l2_weight_decay": 0.0, "warmup_fraction": 0.00021063780848077406, "min_learning_rate_mult": 0.0, "constant_fraction": 0.791996691654991}, {"learning_rate": 0.02207382446306518, "beta1": 0.8235031018044886, "beta2": 0.9995226229167097, "epsilon": 1457.3130054874289, "use_nesterov": false, "adamw_weight_decay": 0.0023283418041562818, "l2_weight_decay": 5.959127114427876e-05, "warmup_fraction": 0.010539853982853778, "min_learning_rate_mult": 0.0, "constant_fraction": 0.67580799277504}, {"learning_rate": 4.63676261107208e-05, "beta1": 0.921417415947552, "beta2": 0.9999637964705755, "epsilon": 2.9895307598028926e-06, "use_nesterov": false, "adamw_weight_decay": 0.06869736593938719, "l2_weight_decay": 5.1576353229369036e-05, "warmup_fraction": 0.07907046736337467, "min_learning_rate_mult": 0.0006308211612495086, "constant_fraction": 0.6970383737530566}, {"learning_rate": 0.04155455982998317, "beta1": 0.15556195591509658, "beta2": 0.9998561899521403, "epsilon": 7.50668493527111e-08, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.3833235956119421e-05, "warmup_fraction": 0.07535135882285379, "min_learning_rate_mult": 2.6640277139748944e-05, "constant_fraction": 0.17021521414375196}, {"learning_rate": 5.863771431690182e-05, "beta1": 0.9885806089635897, "beta2": 0.9998495272343861, "epsilon": 446.8646800095124, "use_nesterov": false, "adamw_weight_decay": 0.030283528117329123, "l2_weight_decay": 0.04374708004172411, "warmup_fraction": 8.281790522357027e-05, "min_learning_rate_mult": 5.854107779914016e-05, "constant_fraction": 0.9427871467552511}, {"learning_rate": 0.0039395725116096935, "beta1": 0.9987850154480281, "beta2": 0.7602822485082381, "epsilon": 9.633385235542134e-05, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0066217632026900446, "warmup_fraction": 0.021274067353005712, "min_learning_rate_mult": 0.5371046713478559, "constant_fraction": 0.059228855849393414}, {"learning_rate": 0.0006364451375330139, "beta1": 0.3448264450754942, "beta2": 0.9996669700808964, "epsilon": 0.79659208791673, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 8.133388379785051e-05, "warmup_fraction": 0.006023839495121105, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2851052533990961}, {"learning_rate": 0.00013805905623123302, "beta1": 0.956590135262842, "beta2": 0.9608426649075996, "epsilon": 0.09865639595439137, "use_nesterov": true, "adamw_weight_decay": 0.0002815525601559158, "l2_weight_decay": 2.6424476165480282e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5452976822855985}, {"learning_rate": 0.0011586278616340436, "beta1": 0.5054653156102714, "beta2": 0.5457262142223325, "epsilon": 9.841781944567288e-07, "use_nesterov": true, "adamw_weight_decay": 0.022213469134042416, "l2_weight_decay": 0.07688551648360523, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.00029854757438760375, "constant_fraction": 0.986632648616124}, {"learning_rate": 0.0020963416879690175, "beta1": 0.9959659725986822, "beta2": 0.9998626215747998, "epsilon": 0.005588103494131963, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.002263845597105555, "warmup_fraction": 0.001885451827272342, "min_learning_rate_mult": 8.060802778116394e-05, "constant_fraction": 0.6821327609236659}, {"learning_rate": 0.0004672662348252391, "beta1": 0.9985144359763971, "beta2": 0.9997412048944214, "epsilon": 29.17259989897731, "use_nesterov": false, "adamw_weight_decay": 5.294607877407497e-05, "l2_weight_decay": 0.007400738357602378, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0843088110429322, "constant_fraction": 0.24756092119343798}, {"learning_rate": 3.9488492140069486e-05, "beta1": 0.8249699657533984, "beta2": 0.9765580090095107, "epsilon": 3.6436293086671606e-05, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.2818211481588985e-05, "warmup_fraction": 1.045892227684837e-05, "min_learning_rate_mult": 0.00015785176629550118, "constant_fraction": 0.7784246919111298}, {"learning_rate": 0.033477123492965416, "beta1": 0.9982968603449904, "beta2": 0.9654503294628618, "epsilon": 1.1645386980000489e-07, "use_nesterov": false, "adamw_weight_decay": 2.099402082043828e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.27727789141568004}, {"learning_rate": 0.0007510387560396383, "beta1": 0.9944056521213595, "beta2": 0.8998350253478027, "epsilon": 0.35545086568601314, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.030507348301533576, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0002804630850262158, "constant_fraction": 0.5246421383730397}, {"learning_rate": 4.8324489307218373e-05, "beta1": 0.9966376576825812, "beta2": 0.9484018355770584, "epsilon": 0.0009642465723261072, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0010568015759676683, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.786431286121525}, {"learning_rate": 0.04772404539025245, "beta1": 0.9276486548109566, "beta2": 0.9379006934017615, "epsilon": 4.104772332699177, "use_nesterov": false, "adamw_weight_decay": 0.05513317583039557, "l2_weight_decay": 0.00019784368090819442, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.00015308357448407637, "constant_fraction": 0.17719312937135512}, {"learning_rate": 0.009476508675297382, "beta1": 0.9979796939294373, "beta2": 0.9822562638919098, "epsilon": 2.8743330155167137e-05, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 8.148401248203633e-05, "warmup_fraction": 0.00928497282180669, "min_learning_rate_mult": 3.177535595466813e-05, "constant_fraction": 0.3603752547239839}, {"learning_rate": 0.0007518511496504919, "beta1": 0.7327327489349946, "beta2": 0.9999826207059404, "epsilon": 0.0004644636310892702, "use_nesterov": true, "adamw_weight_decay": 0.027414913865639524, "l2_weight_decay": 0.012503405818664402, "warmup_fraction": 0.0007062946248660243, "min_learning_rate_mult": 0.13286552039742372, "constant_fraction": 0.5567198057692586}, {"learning_rate": 0.0007893261250456867, "beta1": 0.997730979183447, "beta2": 0.5834176434489868, "epsilon": 785.0739297147468, "use_nesterov": false, "adamw_weight_decay": 0.08069073915322057, "l2_weight_decay": 0.0005809183955369164, "warmup_fraction": 0.0010662277745386323, "min_learning_rate_mult": 5.7269740318136686e-05, "constant_fraction": 0.6510879418173074}, {"learning_rate": 1.7673030903971946e-05, "beta1": 0.8671700541206522, "beta2": 0.9950304902372428, "epsilon": 1.3840248334793421, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00040825545373555667, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.00012194764714425885, "constant_fraction": 0.7976159050354001}, {"learning_rate": 0.010532242735402196, "beta1": 0.9988651056670108, "beta2": 0.9935864244022374, "epsilon": 216.62646781541392, "use_nesterov": false, "adamw_weight_decay": 0.00010521436400908398, "l2_weight_decay": 0.0, "warmup_fraction": 1.960383491731179e-05, "min_learning_rate_mult": 0.24024470591381006, "constant_fraction": 0.2867015637542021}, {"learning_rate": 0.0003650848236935273, "beta1": 0.7332712970795763, "beta2": 0.9998599199456142, "epsilon": 13.905563207637448, "use_nesterov": true, "adamw_weight_decay": 0.033155459471669736, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 1.2792198919186758e-05, "constant_fraction": 0.35990719375912283}, {"learning_rate": 0.3445877797163586, "beta1": 0.03693210275071712, "beta2": 0.9999299577509797, "epsilon": 2.6936244389046022, "use_nesterov": true, "adamw_weight_decay": 0.000502137054334771, "l2_weight_decay": 0.015685010197243866, "warmup_fraction": 0.0291294813569809, "min_learning_rate_mult": 3.354020132001228e-05, "constant_fraction": 0.21654177530840868}, {"learning_rate": 0.0002956897195407636, "beta1": 0.9884816410265932, "beta2": 0.9998610735349684, "epsilon": 0.0004428941890070358, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.038500914471248766, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.001341225245166915, "constant_fraction": 0.3946550615956623}, {"learning_rate": 0.4197357309903209, "beta1": 0.6655942011278572, "beta2": 0.9451400572547408, "epsilon": 0.002877968259799662, "use_nesterov": false, "adamw_weight_decay": 7.12540655601354e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.00025776516300993175, "min_learning_rate_mult": 0.0, "constant_fraction": 0.32770906828225843}, {"learning_rate": 0.4350463129207092, "beta1": 0.99818603790124, "beta2": 0.9999314808118732, "epsilon": 1.664303291758152e-08, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.006814290801559205, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.0803142085201316}, {"learning_rate": 0.09196732535581638, "beta1": 0.9986300567303751, "beta2": 0.913080614051367, "epsilon": 0.5253047408983885, "use_nesterov": true, "adamw_weight_decay": 0.0002555961782160762, "l2_weight_decay": 0.0, "warmup_fraction": 0.06071959338607732, "min_learning_rate_mult": 0.32406397351867855, "constant_fraction": 0.7686450308303509}, {"learning_rate": 0.6846825035237112, "beta1": 0.9815130814308093, "beta2": 0.9997380890711164, "epsilon": 4.815332613638297e-05, "use_nesterov": false, "adamw_weight_decay": 0.0005015069982022111, "l2_weight_decay": 0.009107983349898758, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.00027100815587290626, "constant_fraction": 0.0450162939370935}, {"learning_rate": 0.00045170519714504497, "beta1": 0.9199940600534906, "beta2": 0.9999510905376473, "epsilon": 544.6926061412172, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.09747395584370665, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.46118899671005376}, {"learning_rate": 0.00033921699999105696, "beta1": 0.981617886867597, "beta2": 0.996102946070808, "epsilon": 3.189766637483991e-05, "use_nesterov": true, "adamw_weight_decay": 0.0219366731184835, "l2_weight_decay": 0.0, "warmup_fraction": 0.0013803316086331797, "min_learning_rate_mult": 5.3821150006661706e-05, "constant_fraction": 0.15610320076040296}, {"learning_rate": 0.06470187954797603, "beta1": 0.8659813461523769, "beta2": 0.9997771875470722, "epsilon": 0.023689810740724567, "use_nesterov": false, "adamw_weight_decay": 4.974250408850275e-05, "l2_weight_decay": 0.05974586749297802, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.2588937788532451, "constant_fraction": 0.6454064466972701}, {"learning_rate": 0.009387131692737817, "beta1": 0.9879430475150661, "beta2": 0.9994854114695282, "epsilon": 9.143729588834755e-06, "use_nesterov": false, "adamw_weight_decay": 0.00032963956170756973, "l2_weight_decay": 0.0008343251970123713, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.953897976212088}, {"learning_rate": 1.3116156971741279e-05, "beta1": 0.9534562451171389, "beta2": 0.9345834011587649, "epsilon": 0.008051320430072569, "use_nesterov": true, "adamw_weight_decay": 0.00011880733852391383, "l2_weight_decay": 0.00123452164581974, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.18032727463826378, "constant_fraction": 0.3474688948270638}, {"learning_rate": 0.10280994002102928, "beta1": 0.9985607739615094, "beta2": 0.9998074360969298, "epsilon": 0.0960848306334011, "use_nesterov": false, "adamw_weight_decay": 0.00035547988168817805, "l2_weight_decay": 0.00036796347630174404, "warmup_fraction": 0.0005814716295699507, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6516969276001274}, {"learning_rate": 0.6293658805146909, "beta1": 0.9031922945358268, "beta2": 0.09500926123812015, "epsilon": 3.9331921145597817, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.020139876446695848, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.46373013329663004}, {"learning_rate": 0.02496195507419319, "beta1": 0.9385449562450521, "beta2": 0.999969146885598, "epsilon": 1.6122592652939378e-05, "use_nesterov": false, "adamw_weight_decay": 4.5541451796058596e-05, "l2_weight_decay": 2.0726803880130476e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 5.5449559124324236e-05, "constant_fraction": 0.8527583447562942}, {"learning_rate": 0.10426358139809778, "beta1": 0.8948466056688149, "beta2": 0.9987494301806874, "epsilon": 0.004799111204357653, "use_nesterov": true, "adamw_weight_decay": 0.011148078459186583, "l2_weight_decay": 0.0005379772141803957, "warmup_fraction": 1.1062152263511432e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.4407939113021252}, {"learning_rate": 0.03683182067179663, "beta1": 0.5134768401365318, "beta2": 0.9999488669618855, "epsilon": 93.94348746613565, "use_nesterov": false, "adamw_weight_decay": 0.0019943637456238243, "l2_weight_decay": 0.0008318927937176873, "warmup_fraction": 0.0, "min_learning_rate_mult": 1.6222342403477406e-05, "constant_fraction": 0.16968826576712104}, {"learning_rate": 0.0021816741296147284, "beta1": 0.538097502866929, "beta2": 0.9999232492541739, "epsilon": 0.00014076259299889392, "use_nesterov": true, "adamw_weight_decay": 0.004338976382641385, "l2_weight_decay": 0.06887275781568977, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.00064012404223635, "constant_fraction": 0.3449063030956443}, {"learning_rate": 8.548693653126442e-05, "beta1": 0.9799513594284013, "beta2": 0.06480855793979279, "epsilon": 1.3247271953091976e-08, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.020263308911585082, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7273814701775079}, {"learning_rate": 0.1094960824205915, "beta1": 0.9934043185056707, "beta2": 0.7717157715255192, "epsilon": 1.9079804738063808e-07, "use_nesterov": false, "adamw_weight_decay": 0.0007726187343186974, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.029879811114961508, "constant_fraction": 0.1758716062038116}, {"learning_rate": 0.000158927906870825, "beta1": 0.38719969114284947, "beta2": 0.9999753010273262, "epsilon": 0.0016550536121546272, "use_nesterov": false, "adamw_weight_decay": 0.04107725437183138, "l2_weight_decay": 0.0, "warmup_fraction": 0.00023204176706851615, "min_learning_rate_mult": 0.0, "constant_fraction": 0.4030693659677471}, {"learning_rate": 3.0456230307900685e-05, "beta1": 0.7803960193832415, "beta2": 0.9991847135477996, "epsilon": 5.186787532717669e-06, "use_nesterov": true, "adamw_weight_decay": 0.0007944213767764528, "l2_weight_decay": 0.00019110809020004508, "warmup_fraction": 0.002217549767076495, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9203538584759758}, {"learning_rate": 6.571399661090159e-05, "beta1": 0.9370844368684272, "beta2": 0.9999211945238292, "epsilon": 63.66609575163081, "use_nesterov": false, "adamw_weight_decay": 0.00234998591768928, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.34922120412862223}, {"learning_rate": 0.0007100916551864691, "beta1": 0.9788480405164591, "beta2": 0.99598104484119, "epsilon": 9.168505768805669e-06, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0038570814507831765, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.900698285648556}, {"learning_rate": 0.0016280520607478439, "beta1": 0.9975251460709949, "beta2": 0.6694724163266934, "epsilon": 0.24344681606000076, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.03966099831547882, "warmup_fraction": 0.00043346828176460455, "min_learning_rate_mult": 0.0, "constant_fraction": 0.03591076707615015}, {"learning_rate": 5.077377197005549e-05, "beta1": 0.29719438930212905, "beta2": 0.9998062531003717, "epsilon": 0.09049059689380999, "use_nesterov": false, "adamw_weight_decay": 0.007282136266641733, "l2_weight_decay": 0.050484574400847505, "warmup_fraction": 0.004684716135266319, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8141345119355167}, {"learning_rate": 0.12672910832134762, "beta1": 0.9873769633925897, "beta2": 0.999924915983335, "epsilon": 0.008991294275254282, "use_nesterov": false, "adamw_weight_decay": 0.00010408568662221012, "l2_weight_decay": 1.9334356424371505e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.693744475016895}, {"learning_rate": 0.0009107745687775015, "beta1": 0.9964370560398735, "beta2": 0.9676871796883768, "epsilon": 5.111020234497499e-06, "use_nesterov": false, "adamw_weight_decay": 1.1695597222859751e-05, "l2_weight_decay": 0.0, "warmup_fraction": 5.279083780426277e-05, "min_learning_rate_mult": 2.308803987473592e-05, "constant_fraction": 0.6539104624998993}, {"learning_rate": 0.040351647838250265, "beta1": 0.8345198901068949, "beta2": 0.9997886960970056, "epsilon": 0.3248388282703156, "use_nesterov": false, "adamw_weight_decay": 2.3022294875185868e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.003307891872288581, "min_learning_rate_mult": 0.028001013655250644, "constant_fraction": 0.5516482620857124}, {"learning_rate": 1.4057113969411143e-05, "beta1": 0.9839461952321388, "beta2": 0.998556685988452, "epsilon": 0.0008463226980392223, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 3.739831037068702e-05, "warmup_fraction": 0.0026898818692514615, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6317153049120576}, {"learning_rate": 0.00031613667984779916, "beta1": 0.740408965911068, "beta2": 0.9994504672509785, "epsilon": 1.6503755650741728e-05, "use_nesterov": false, "adamw_weight_decay": 0.0037458551783390655, "l2_weight_decay": 4.05109631330213e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5735873434457}, {"learning_rate": 0.00018033450085523626, "beta1": 0.9358718602611392, "beta2": 0.9992108921130886, "epsilon": 0.0015857554316772292, "use_nesterov": true, "adamw_weight_decay": 0.0004904777715359292, "l2_weight_decay": 0.0, "warmup_fraction": 0.013852380609389106, "min_learning_rate_mult": 0.016124120433267695, "constant_fraction": 0.2579218193903321}, {"learning_rate": 1.1712424989978123e-05, "beta1": 0.9911261421916882, "beta2": 0.999553555971121, "epsilon": 73.01288302395929, "use_nesterov": false, "adamw_weight_decay": 7.264074995384757e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0006727008582405905, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7105765382600822}, {"learning_rate": 0.0004704143040197769, "beta1": 0.9960235107088271, "beta2": 0.9919116124449499, "epsilon": 9.010535280192964e-07, "use_nesterov": false, "adamw_weight_decay": 0.00038734679722454956, "l2_weight_decay": 0.0, "warmup_fraction": 6.188262454977853e-05, "min_learning_rate_mult": 0.030098597665744138, "constant_fraction": 0.21564392002857768}, {"learning_rate": 3.727519660960793e-05, "beta1": 0.99106571625772, "beta2": 0.9999375334703435, "epsilon": 1.9038079926641455e-07, "use_nesterov": false, "adamw_weight_decay": 0.008872915110676848, "l2_weight_decay": 4.741712087918342e-05, "warmup_fraction": 0.0009423388303161492, "min_learning_rate_mult": 0.007995772611396028, "constant_fraction": 0.5128914520252109}, {"learning_rate": 0.0002742673830243505, "beta1": 0.47529951454593333, "beta2": 0.9875764785850712, "epsilon": 2.6409010240396515, "use_nesterov": false, "adamw_weight_decay": 0.007370495639122479, "l2_weight_decay": 0.00014689178925522862, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0024140357529990712, "constant_fraction": 0.9025858787813633}, {"learning_rate": 0.0010177639366304107, "beta1": 0.9960640032951603, "beta2": 0.1443849992557351, "epsilon": 76.85072220037573, "use_nesterov": false, "adamw_weight_decay": 1.6096277445841644e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7041866193300704}, {"learning_rate": 0.014919131896289423, "beta1": 0.3542105488159132, "beta2": 0.9944296537638837, "epsilon": 1.1150751050364467e-05, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.053041450500738205, "warmup_fraction": 0.005249838788602547, "min_learning_rate_mult": 0.0, "constant_fraction": 0.24903613989826612}, {"learning_rate": 0.00012470023075193863, "beta1": 0.885978212874667, "beta2": 0.9191281527411389, "epsilon": 0.00035881569696566445, "use_nesterov": false, "adamw_weight_decay": 0.06022225228963992, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.05791453358293299, "constant_fraction": 0.6371889666686572}, {"learning_rate": 0.03030737225452729, "beta1": 0.9927549896535346, "beta2": 0.970970406756382, "epsilon": 32.26783217959045, "use_nesterov": true, "adamw_weight_decay": 0.00022295194056142908, "l2_weight_decay": 0.02109448260578154, "warmup_fraction": 0.0011934133209867033, "min_learning_rate_mult": 0.0, "constant_fraction": 0.4097280428848996}, {"learning_rate": 0.01378633986149472, "beta1": 0.007165274718660797, "beta2": 0.9969535631087246, "epsilon": 1.8518624773043798e-06, "use_nesterov": false, "adamw_weight_decay": 9.271096622111532e-05, "l2_weight_decay": 1.8216224999907716e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2567645072840362}, {"learning_rate": 0.4203893063155203, "beta1": 0.742310235871922, "beta2": 0.9988931253502447, "epsilon": 2.631061055463697e-06, "use_nesterov": false, "adamw_weight_decay": 3.881779860527879e-05, "l2_weight_decay": 0.0001153061509746906, "warmup_fraction": 0.021700108891906246, "min_learning_rate_mult": 0.00017769101415634233, "constant_fraction": 0.9346943523685003}, {"learning_rate": 3.23639061271451e-05, "beta1": 0.9981354282741419, "beta2": 0.9998044258442167, "epsilon": 180.1290345542626, "use_nesterov": false, "adamw_weight_decay": 5.143862132581542e-05, "l2_weight_decay": 0.0004366913391382327, "warmup_fraction": 1.8615689202400476e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.47740054991536063}, {"learning_rate": 0.0034423409594305275, "beta1": 0.9742248493556263, "beta2": 0.9996640172554077, "epsilon": 0.038292682647321226, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0039054646571177404, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9429208791792338}, {"learning_rate": 0.0010005008860847497, "beta1": 0.998404721543398, "beta2": 0.9984024561901961, "epsilon": 0.26556696022648446, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.478291941568316e-05, "warmup_fraction": 0.00012131850152993604, "min_learning_rate_mult": 1.0343432779914942e-05, "constant_fraction": 0.35665105851295753}, {"learning_rate": 0.0036943506082533573, "beta1": 0.9979921269014872, "beta2": 0.7559209318922886, "epsilon": 0.06355874280966113, "use_nesterov": false, "adamw_weight_decay": 4.505835170340311e-05, "l2_weight_decay": 5.182581840623091e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9097098341866764}, {"learning_rate": 3.861310834952191e-05, "beta1": 0.8451058018346859, "beta2": 0.30539027076605796, "epsilon": 6.449589950823159e-07, "use_nesterov": false, "adamw_weight_decay": 0.0005112548047797068, "l2_weight_decay": 0.007782900525588754, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.022112354736518156, "constant_fraction": 0.0008974199746317746}, {"learning_rate": 0.029242719419940826, "beta1": 0.9965475501393084, "beta2": 0.9535869258197351, "epsilon": 4.125564261155923, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0787242699093877, "warmup_fraction": 1.3493801666408733e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.023527288882095654}, {"learning_rate": 0.25893647738006126, "beta1": 0.9980510674854047, "beta2": 0.9969331978013775, "epsilon": 24.008189124392384, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00016620021920024972, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.0537596494758209}, {"learning_rate": 0.030984746821539313, "beta1": 0.9732691731499022, "beta2": 0.8727663347072004, "epsilon": 3321.937285674731, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.009166711331190664, "warmup_fraction": 0.015231279602472276, "min_learning_rate_mult": 2.147111223799045e-05, "constant_fraction": 0.4725434069394958}, {"learning_rate": 0.002614439631189982, "beta1": 0.9966688509425065, "beta2": 0.9711167876578635, "epsilon": 0.0012556301470839516, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.015273673945692722, "warmup_fraction": 1.0318508569244972e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5197436652945662}, {"learning_rate": 0.004173141342241978, "beta1": 0.15225818759506982, "beta2": 0.9999773610028536, "epsilon": 6.449024595770022e-07, "use_nesterov": false, "adamw_weight_decay": 0.0007333972279720616, "l2_weight_decay": 0.0022493089904007985, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0008340996263145734, "constant_fraction": 0.21751876535768688}, {"learning_rate": 1.225162228936724e-05, "beta1": 0.7530858519408269, "beta2": 0.9985807861577429, "epsilon": 0.9836870693336871, "use_nesterov": true, "adamw_weight_decay": 0.012928385177991384, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.30533801303639285}, {"learning_rate": 0.012340261091198446, "beta1": 0.59972768512894, "beta2": 0.9982415668634773, "epsilon": 0.0007808568060057955, "use_nesterov": true, "adamw_weight_decay": 0.0030062048151027693, "l2_weight_decay": 0.0965567311513644, "warmup_fraction": 0.0, "min_learning_rate_mult": 2.00869576356408e-05, "constant_fraction": 0.5806014601411803}, {"learning_rate": 5.6587527937417116e-05, "beta1": 0.2981256786496944, "beta2": 0.9999692042720865, "epsilon": 7.836039800443278e-06, "use_nesterov": true, "adamw_weight_decay": 0.00024843001494089667, "l2_weight_decay": 4.8677356072899385e-05, "warmup_fraction": 0.09224633556215142, "min_learning_rate_mult": 1.4364310270513588e-05, "constant_fraction": 0.9916313986526822}, {"learning_rate": 0.00018491845640834597, "beta1": 0.9908206443055559, "beta2": 0.9984932404964363, "epsilon": 1.1465032793256036e-06, "use_nesterov": true, "adamw_weight_decay": 0.09423248031391741, "l2_weight_decay": 0.003982433053376072, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0013963249312392663, "constant_fraction": 0.33219315488078094}, {"learning_rate": 0.12082762398441066, "beta1": 0.982334901459857, "beta2": 0.9953737603644169, "epsilon": 8246.912322977381, "use_nesterov": true, "adamw_weight_decay": 0.0071217128862174975, "l2_weight_decay": 0.003990914334722918, "warmup_fraction": 6.589364808870654e-05, "min_learning_rate_mult": 5.862731954905831e-05, "constant_fraction": 0.6079366176237859}, {"learning_rate": 0.20943537694626066, "beta1": 0.9767326740363232, "beta2": 0.99995699640723, "epsilon": 0.000184926211931001, "use_nesterov": true, "adamw_weight_decay": 0.00878068841494916, "l2_weight_decay": 0.04877532517617478, "warmup_fraction": 0.030327174261315128, "min_learning_rate_mult": 0.0055075759674869515, "constant_fraction": 0.3698013972963039}, {"learning_rate": 0.004252381821222831, "beta1": 0.9989357053454114, "beta2": 0.9999662287643754, "epsilon": 4.8132276107599325e-06, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0310489592721225, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9656774533916646}, {"learning_rate": 0.023112107490732926, "beta1": 0.9896127501983443, "beta2": 0.9995563618923916, "epsilon": 6.2326546530202155e-06, "use_nesterov": false, "adamw_weight_decay": 0.0010980579455833895, "l2_weight_decay": 0.024600617464436328, "warmup_fraction": 0.005670414593758597, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7807329474484354}, {"learning_rate": 0.00014577589059617247, "beta1": 0.9908158531515636, "beta2": 0.9997152090422533, "epsilon": 1.811190737829945e-07, "use_nesterov": false, "adamw_weight_decay": 9.838918374840231e-05, "l2_weight_decay": 0.004855570335019566, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.027102665621271383, "constant_fraction": 0.5784793905059852}, {"learning_rate": 2.2538459124046832e-05, "beta1": 0.7339034994795854, "beta2": 0.9895588758373679, "epsilon": 6683.103642142991, "use_nesterov": true, "adamw_weight_decay": 0.0005146518222153101, "l2_weight_decay": 0.0, "warmup_fraction": 0.00026266879454751906, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2472419783432771}, {"learning_rate": 8.10601505706309e-05, "beta1": 0.9875832491646499, "beta2": 0.41670866828583464, "epsilon": 1103.085587823014, "use_nesterov": false, "adamw_weight_decay": 0.0016716370122003142, "l2_weight_decay": 0.005185347589097483, "warmup_fraction": 8.020466644851671e-05, "min_learning_rate_mult": 0.06851692657265905, "constant_fraction": 0.7267818718212152}, {"learning_rate": 0.007827053540861112, "beta1": 0.9968968038135512, "beta2": 0.9937457436872839, "epsilon": 0.013048470588679096, "use_nesterov": true, "adamw_weight_decay": 1.3363383180020288e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.00015805359073745248, "min_learning_rate_mult": 0.0038115796354242994, "constant_fraction": 0.18335984752230738}, {"learning_rate": 0.00025419442415596427, "beta1": 0.9453583759994368, "beta2": 0.9945973432611446, "epsilon": 7.91562012483202e-08, "use_nesterov": true, "adamw_weight_decay": 8.2772591054731e-05, "l2_weight_decay": 8.044266484723826e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7454884980284596}, {"learning_rate": 3.2907567467777516e-05, "beta1": 0.9327069914408006, "beta2": 0.23614226123706994, "epsilon": 6.682206678548767e-08, "use_nesterov": false, "adamw_weight_decay": 0.0832880850354105, "l2_weight_decay": 0.0, "warmup_fraction": 0.0711162949783224, "min_learning_rate_mult": 0.02285208861990805, "constant_fraction": 0.0633957292181423}, {"learning_rate": 0.2354575581581307, "beta1": 0.9976449467708934, "beta2": 0.9992443442988054, "epsilon": 0.029244709229888474, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00015512803284613378, "warmup_fraction": 0.0001281921071503123, "min_learning_rate_mult": 8.949856556868889e-05, "constant_fraction": 0.5780673739839867}, {"learning_rate": 0.003306588062066658, "beta1": 0.9966799133707692, "beta2": 0.9998800686806081, "epsilon": 0.0007658636109215232, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.5669359815420567e-05, "warmup_fraction": 2.934472846017415e-05, "min_learning_rate_mult": 7.559782371014121e-05, "constant_fraction": 0.04376728845472311}, {"learning_rate": 0.9442256561401599, "beta1": 0.9969726153134648, "beta2": 0.9999845836479596, "epsilon": 355.7177784270181, "use_nesterov": true, "adamw_weight_decay": 0.02073514522277812, "l2_weight_decay": 0.0, "warmup_fraction": 0.0062266179731912735, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9325905535599291}, {"learning_rate": 0.0001687049325260243, "beta1": 0.9989317718976907, "beta2": 0.08731676680621592, "epsilon": 2.8626351696140824, "use_nesterov": true, "adamw_weight_decay": 1.2984371707245199e-05, "l2_weight_decay": 0.00013652420030476107, "warmup_fraction": 0.0008307613513227547, "min_learning_rate_mult": 0.0, "constant_fraction": 0.4968823761479596}, {"learning_rate": 0.00031865611892236225, "beta1": 0.9979620877322157, "beta2": 0.9920152508383006, "epsilon": 0.0004282811140596039, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.719230050171332e-05, "warmup_fraction": 0.07197307626357473, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5080891944766445}, {"learning_rate": 0.007991063766112673, "beta1": 0.6174452691617334, "beta2": 0.28557560141396354, "epsilon": 1.591508588064111e-07, "use_nesterov": true, "adamw_weight_decay": 0.00014635300305529777, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6291893460928102}, {"learning_rate": 0.013474029314809581, "beta1": 0.9489469988445013, "beta2": 0.8367777966433554, "epsilon": 1.9849748168017654e-05, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.025708358843792706, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6035146192986995}, {"learning_rate": 0.04926098391376417, "beta1": 0.9907774258055363, "beta2": 0.9999883530870705, "epsilon": 1.2976943002501198e-08, "use_nesterov": true, "adamw_weight_decay": 0.04856596267802332, "l2_weight_decay": 2.321778306458518e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 1.1889683121493425e-05, "constant_fraction": 0.03929057418610371}, {"learning_rate": 0.0015158325893116329, "beta1": 0.997616727364371, "beta2": 0.9915818102486413, "epsilon": 0.08862103557036335, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.012775217385457636, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6636566120302735}, {"learning_rate": 0.007438855966684839, "beta1": 0.9864452989616559, "beta2": 0.9998842921375253, "epsilon": 220.80075025167156, "use_nesterov": true, "adamw_weight_decay": 0.001700015879879932, "l2_weight_decay": 4.049527887642964e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.6602090774387226, "constant_fraction": 0.13757135958283917}, {"learning_rate": 0.04055482093872615, "beta1": 0.9989452047334931, "beta2": 0.8915237377524452, "epsilon": 843.0530518594481, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0002832730229571768, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.009630807593138311, "constant_fraction": 0.22963484596668238}, {"learning_rate": 0.27580719258377573, "beta1": 0.1601096146674984, "beta2": 0.9955927876282971, "epsilon": 1.2040240349442507e-08, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 8.792755484681537e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.000504464102416102, "constant_fraction": 0.8576321109546532}, {"learning_rate": 8.771515705867686e-05, "beta1": 0.6729293058426025, "beta2": 0.963080453170629, "epsilon": 1.633452591833786e-06, "use_nesterov": false, "adamw_weight_decay": 0.011663049847520812, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.45740147078917237}, {"learning_rate": 0.005262934030728578, "beta1": 0.9961063755194902, "beta2": 0.9999664781993363, "epsilon": 0.7921441193595735, "use_nesterov": true, "adamw_weight_decay": 0.0025784963205354823, "l2_weight_decay": 0.0033648677857019936, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.65540159848107}, {"learning_rate": 0.2189405692668492, "beta1": 0.7302872655450994, "beta2": 0.9999404322001497, "epsilon": 2.007651510779769e-07, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 4.8810059866793416e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9781912815725895}, {"learning_rate": 0.04736590121355246, "beta1": 0.9958530947406898, "beta2": 0.9981660598577702, "epsilon": 0.00022504913383006807, "use_nesterov": false, "adamw_weight_decay": 0.01717301721973146, "l2_weight_decay": 0.04997629643512036, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7597433498111122}, {"learning_rate": 0.0002613245464045561, "beta1": 0.8972293129366111, "beta2": 0.9999888140562291, "epsilon": 0.006722686035246396, "use_nesterov": false, "adamw_weight_decay": 0.07054757650426198, "l2_weight_decay": 0.008024497771312337, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.06760835721746605}, {"learning_rate": 0.0001499493162228961, "beta1": 0.9960389678096053, "beta2": 0.6629987228896134, "epsilon": 7.697514399699104e-05, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 7.201418663635424e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.1488291164052555, "constant_fraction": 0.9644041902513999}, {"learning_rate": 0.019096138823377323, "beta1": 0.9853282994944979, "beta2": 0.7485886463665029, "epsilon": 7.104942602246239e-08, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 2.238236440158732e-05, "warmup_fraction": 8.991905370356906e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7460619430405605}, {"learning_rate": 0.8806037306470896, "beta1": 0.7211523757993374, "beta2": 0.9704505311013979, "epsilon": 3264.168150818, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0022633229400333766, "warmup_fraction": 0.0021289599481998816, "min_learning_rate_mult": 0.0, "constant_fraction": 0.23682057020829872}, {"learning_rate": 2.5318622699329045e-05, "beta1": 0.9399310674627551, "beta2": 0.999021581780636, "epsilon": 7.347671871747592e-08, "use_nesterov": false, "adamw_weight_decay": 0.00010675004527857507, "l2_weight_decay": 0.0, "warmup_fraction": 0.0023510573843976493, "min_learning_rate_mult": 2.9088847738320534e-05, "constant_fraction": 0.21089572096435183}, {"learning_rate": 0.7305057252756293, "beta1": 0.9969496642250399, "beta2": 0.9571224869546019, "epsilon": 0.0026359004192917563, "use_nesterov": false, "adamw_weight_decay": 0.0019401533906236292, "l2_weight_decay": 0.0, "warmup_fraction": 0.011754155201412925, "min_learning_rate_mult": 0.0065553499020277305, "constant_fraction": 0.1595961959580403}, {"learning_rate": 0.08145892169960409, "beta1": 0.7573833214850814, "beta2": 0.9406583451026908, "epsilon": 8789.90403769743, "use_nesterov": false, "adamw_weight_decay": 2.5765042160256384e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.03690224653346281, "constant_fraction": 0.6259545073136924}, {"learning_rate": 3.3102802469346536e-05, "beta1": 0.9935750348140298, "beta2": 0.9476936332337033, "epsilon": 5.724506952784915, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.06603378073515666, "warmup_fraction": 0.04568554346405363, "min_learning_rate_mult": 7.928352328602887e-05, "constant_fraction": 0.5753269119318466}, {"learning_rate": 0.02036033236638413, "beta1": 0.9727119631728401, "beta2": 0.6949812989756862, "epsilon": 0.00012794690504819477, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.02077733307796528, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.003223073675380069, "constant_fraction": 0.5203581778999119}, {"learning_rate": 0.14635004091767215, "beta1": 0.581721422435503, "beta2": 0.9252593948163483, "epsilon": 3.4404531017964e-08, "use_nesterov": true, "adamw_weight_decay": 0.02619080763763329, "l2_weight_decay": 0.00932125105794004, "warmup_fraction": 0.0026738543006775565, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9666322610360774}, {"learning_rate": 0.03667968597780235, "beta1": 0.43935705796487323, "beta2": 0.9380522151135371, "epsilon": 1544.1665938387598, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.042728178297941365, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8041941950044975}, {"learning_rate": 5.342063590504414e-05, "beta1": 0.9920423474130847, "beta2": 0.9984286858630714, "epsilon": 5.209183049686998, "use_nesterov": true, "adamw_weight_decay": 0.014237722184501679, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 1.4593378033521584e-05, "constant_fraction": 0.6692671125909134}, {"learning_rate": 0.000773915544506432, "beta1": 0.9165090289610535, "beta2": 0.44161730395571996, "epsilon": 0.24782924709432716, "use_nesterov": false, "adamw_weight_decay": 0.003148444106410766, "l2_weight_decay": 0.0, "warmup_fraction": 0.023671708409230566, "min_learning_rate_mult": 0.030020799530874498, "constant_fraction": 0.7326529038720573}, {"learning_rate": 0.27272115197975716, "beta1": 0.8872541973904136, "beta2": 0.5532387759298165, "epsilon": 1.1810709092110015e-05, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 5.636402896962392e-05, "warmup_fraction": 0.015839783386003264, "min_learning_rate_mult": 5.2145918221678694e-05, "constant_fraction": 0.23336689252854959}, {"learning_rate": 0.22852671924688786, "beta1": 0.989934678111452, "beta2": 0.9997791278761167, "epsilon": 1.0124273515055669e-07, "use_nesterov": true, "adamw_weight_decay": 4.389748608450401e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.4152456537818151}, {"learning_rate": 0.0032123801067651817, "beta1": 0.6787593992121808, "beta2": 0.9973542166531956, "epsilon": 5.034089262271543e-07, "use_nesterov": true, "adamw_weight_decay": 0.0013002551130271267, "l2_weight_decay": 0.007955045467903198, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2444264958248663}, {"learning_rate": 0.17289960410237915, "beta1": 0.9738078454690391, "beta2": 0.9989391809526078, "epsilon": 4.791944626349936e-05, "use_nesterov": false, "adamw_weight_decay": 0.018279552279659366, "l2_weight_decay": 0.0, "warmup_fraction": 3.2443477464685005e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.665739514045241}, {"learning_rate": 2.2870539298751296e-05, "beta1": 0.9989675150219064, "beta2": 0.9983541710100042, "epsilon": 0.0003450462571503383, "use_nesterov": true, "adamw_weight_decay": 2.410420145332847e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.007252359836352474, "min_learning_rate_mult": 0.00327876447586618, "constant_fraction": 0.36305274559513645}, {"learning_rate": 0.0006882779174080016, "beta1": 0.9928206530413884, "beta2": 0.9179363592434172, "epsilon": 560.9947864586674, "use_nesterov": false, "adamw_weight_decay": 0.011909734107784977, "l2_weight_decay": 0.0, "warmup_fraction": 1.1446096757437698e-05, "min_learning_rate_mult": 3.23820639125488e-05, "constant_fraction": 0.9207263346568542}, {"learning_rate": 0.21182612663110229, "beta1": 0.9715594554618353, "beta2": 0.9924346793975231, "epsilon": 0.030430156950474394, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 2.3436323190595665e-05, "warmup_fraction": 0.0017764365926607607, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9580691716980478}, {"learning_rate": 0.0002153602080182142, "beta1": 0.9559266118434399, "beta2": 0.9999702475579275, "epsilon": 4.849213882257559e-06, "use_nesterov": true, "adamw_weight_decay": 0.002796034065952558, "l2_weight_decay": 0.0004618725299694008, "warmup_fraction": 0.018552058250428143, "min_learning_rate_mult": 0.19414902913429738, "constant_fraction": 0.9303310694172523}, {"learning_rate": 0.10820090235705782, "beta1": 0.9983596402656534, "beta2": 0.9999545326709565, "epsilon": 0.00013836654362957832, "use_nesterov": true, "adamw_weight_decay": 0.00039320504406250146, "l2_weight_decay": 0.0, "warmup_fraction": 0.04081973007438349, "min_learning_rate_mult": 0.03843536764131974, "constant_fraction": 0.5792605854043755}, {"learning_rate": 0.0009851946550481238, "beta1": 0.9957084952044023, "beta2": 0.8564208893207437, "epsilon": 0.16455517258435065, "use_nesterov": true, "adamw_weight_decay": 0.006692059300723375, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0002822714973995203, "constant_fraction": 0.6974963858169121}, {"learning_rate": 1.1199585695916074e-05, "beta1": 0.9937170199932047, "beta2": 0.9998917079128593, "epsilon": 1.6155480005886254, "use_nesterov": false, "adamw_weight_decay": 0.008603269241781316, "l2_weight_decay": 0.00013463624272474375, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.22692519283102186}, {"learning_rate": 5.912336814318337e-05, "beta1": 0.9959261072271186, "beta2": 0.9555429687813177, "epsilon": 47.312113503926945, "use_nesterov": true, "adamw_weight_decay": 3.0096516677043937e-05, "l2_weight_decay": 6.470133611341221e-05, "warmup_fraction": 0.005362219571246192, "min_learning_rate_mult": 0.32458632133862314, "constant_fraction": 0.28789821358208556}, {"learning_rate": 3.9565924964235506e-05, "beta1": 0.8466975211810862, "beta2": 0.8442168110727711, "epsilon": 29.111415465151957, "use_nesterov": true, "adamw_weight_decay": 0.026996178525812688, "l2_weight_decay": 0.007642517942785971, "warmup_fraction": 0.00019673639183691668, "min_learning_rate_mult": 4.7915570255163814e-05, "constant_fraction": 0.5129958252895315}, {"learning_rate": 0.3456679753585363, "beta1": 0.8692022932939022, "beta2": 0.9999786857299233, "epsilon": 7376.590586522489, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 3.527248077053418e-05, "warmup_fraction": 0.05666050796524618, "min_learning_rate_mult": 0.07755887754542057, "constant_fraction": 0.4516196469942132}, {"learning_rate": 0.0038603703917783846, "beta1": 0.9978296169939204, "beta2": 0.9941977049323454, "epsilon": 0.00420515265027739, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 9.35031838483916e-05, "warmup_fraction": 0.06908861129545497, "min_learning_rate_mult": 0.0002006899333628445, "constant_fraction": 0.8497041897771871}, {"learning_rate": 1.035569515629211e-05, "beta1": 0.9543482129636763, "beta2": 0.9865577197724403, "epsilon": 0.019442705626754302, "use_nesterov": true, "adamw_weight_decay": 0.0002990933182897978, "l2_weight_decay": 0.0009247603200742442, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.3093124357264545}, {"learning_rate": 2.0714964301016298e-05, "beta1": 0.9987406162678083, "beta2": 0.9998494426911645, "epsilon": 0.003734126869178425, "use_nesterov": true, "adamw_weight_decay": 0.0037719700293782805, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.9698267284073828, "constant_fraction": 0.9107624835668564}, {"learning_rate": 0.0178677698408671, "beta1": 0.9840429575747197, "beta2": 0.8258375107921742, "epsilon": 1346.474375823492, "use_nesterov": false, "adamw_weight_decay": 0.007525731583085676, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 1.701199977806229e-05, "constant_fraction": 0.21823021599474102}, {"learning_rate": 0.4544861132683541, "beta1": 0.9845684966017203, "beta2": 0.9998648276235115, "epsilon": 0.23448281522061085, "use_nesterov": true, "adamw_weight_decay": 0.0019673062383920026, "l2_weight_decay": 0.008391953607875124, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9606156655122932}, {"learning_rate": 0.00020683802885505955, "beta1": 0.9483155647615255, "beta2": 0.9996606579804698, "epsilon": 0.05437339192456122, "use_nesterov": true, "adamw_weight_decay": 0.0005021580135244213, "l2_weight_decay": 0.0, "warmup_fraction": 0.0022725099442446883, "min_learning_rate_mult": 0.012877967051154472, "constant_fraction": 0.846699743737637}, {"learning_rate": 0.11049714589513275, "beta1": 0.987005355490576, "beta2": 0.7017548811664536, "epsilon": 0.4549089929884415, "use_nesterov": true, "adamw_weight_decay": 0.00026300995583349994, "l2_weight_decay": 0.00011561208827063153, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.06169929730895218}, {"learning_rate": 6.466571621881881e-05, "beta1": 0.8571591868542644, "beta2": 0.9999076895298786, "epsilon": 12.238007590940537, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.004517625931065415, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.48436488593282656, "constant_fraction": 0.4668064297314706}, {"learning_rate": 0.001116975530704319, "beta1": 0.303160182782368, "beta2": 0.995405824174155, "epsilon": 6.906231592288291e-08, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.010489702977094591, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.4723279966072589}, {"learning_rate": 2.189909400692018e-05, "beta1": 0.9805537985895719, "beta2": 0.9993601643081036, "epsilon": 1.346786293958208, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 3.127965396886237e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.510404398823175}, {"learning_rate": 0.0007100281034220097, "beta1": 0.7818789937123002, "beta2": 0.4841305215375937, "epsilon": 1.5497609666002596e-08, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.002936280457066981, "warmup_fraction": 0.045652136025270906, "min_learning_rate_mult": 0.01120733760941568, "constant_fraction": 0.5348854785268254}, {"learning_rate": 1.3120137219354836e-05, "beta1": 0.4584013159967699, "beta2": 0.9999717691537616, "epsilon": 274.34070492199936, "use_nesterov": true, "adamw_weight_decay": 0.0005505649019509298, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7021063557686066}, {"learning_rate": 0.0018017293484922582, "beta1": 0.9976609462245145, "beta2": 0.9999594803002878, "epsilon": 0.0003717514588902638, "use_nesterov": true, "adamw_weight_decay": 0.0006949938715366734, "l2_weight_decay": 0.05834572115012243, "warmup_fraction": 9.786455018477199e-05, "min_learning_rate_mult": 0.0002107406203528016, "constant_fraction": 0.5737569858113282}, {"learning_rate": 0.26349191281683987, "beta1": 0.9475395251132315, "beta2": 0.9998838694521939, "epsilon": 0.0053834115075678205, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0018639442933087685, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.47980155028873217}, {"learning_rate": 0.04798350212355469, "beta1": 0.6107029673022384, "beta2": 0.9926721898292065, "epsilon": 8.563795614556501e-08, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 5.949247033576634e-05, "warmup_fraction": 0.013664305712291129, "min_learning_rate_mult": 0.027467845836107396, "constant_fraction": 0.7378797715509732}, {"learning_rate": 0.0022172085294571457, "beta1": 0.9969880945414312, "beta2": 0.9988668119928872, "epsilon": 3.5544834316267164, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00041093311920537863, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.3968573042165918}, {"learning_rate": 0.06045049636580456, "beta1": 0.997373117711885, "beta2": 0.9999638786229028, "epsilon": 0.033926631937115266, "use_nesterov": true, "adamw_weight_decay": 0.0005604584328620976, "l2_weight_decay": 0.014294181897064892, "warmup_fraction": 0.040979882461700944, "min_learning_rate_mult": 3.164450854952688e-05, "constant_fraction": 0.7034642340090173}, {"learning_rate": 0.3861936886502016, "beta1": 0.9246529266275967, "beta2": 0.9998457067483714, "epsilon": 0.11530708268361033, "use_nesterov": false, "adamw_weight_decay": 0.00018710032010974895, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9104254801343205}, {"learning_rate": 2.604646559541433e-05, "beta1": 0.9969294005470222, "beta2": 0.9999855398316685, "epsilon": 2.9549496137444904e-06, "use_nesterov": true, "adamw_weight_decay": 0.010645858560091759, "l2_weight_decay": 0.001466933225540056, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.00037173506909848663, "constant_fraction": 0.9852108299482001}, {"learning_rate": 0.00010446819674607716, "beta1": 0.8436590179746497, "beta2": 0.9941911643679692, "epsilon": 1755.1822605967413, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0005413478056673828, "warmup_fraction": 5.419161223611909e-05, "min_learning_rate_mult": 0.0013519229371689971, "constant_fraction": 0.1697968309472876}, {"learning_rate": 0.05968293197450993, "beta1": 0.9859680788700922, "beta2": 0.9999437192409284, "epsilon": 0.0001345080622887975, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 4.5209476784816625e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.13980633197382009, "constant_fraction": 0.18714557533258236}, {"learning_rate": 1.3761645026523434e-05, "beta1": 0.976246509655504, "beta2": 0.9999794951245253, "epsilon": 2.6924907703658607e-08, "use_nesterov": false, "adamw_weight_decay": 0.003942910434788243, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2858887999362074}, {"learning_rate": 0.5675930701222627, "beta1": 0.9984850709933599, "beta2": 0.9319986165848171, "epsilon": 0.6809538986016084, "use_nesterov": false, "adamw_weight_decay": 2.4284093476906046e-05, "l2_weight_decay": 0.03409044136712912, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.05314345800137985, "constant_fraction": 0.8306441975158237}, {"learning_rate": 0.6044761193427397, "beta1": 0.9978249780553394, "beta2": 0.9929984201969044, "epsilon": 1803.8448633091316, "use_nesterov": true, "adamw_weight_decay": 0.00043343682334562154, "l2_weight_decay": 0.0, "warmup_fraction": 2.672249246759294e-05, "min_learning_rate_mult": 0.8780669761994667, "constant_fraction": 0.4664274088379764}, {"learning_rate": 2.4750220023048834e-05, "beta1": 0.9896903094660097, "beta2": 0.3309458743704793, "epsilon": 5633.896939032489, "use_nesterov": false, "adamw_weight_decay": 0.0008909881174268151, "l2_weight_decay": 0.0022664985058304028, "warmup_fraction": 0.001466658038087361, "min_learning_rate_mult": 5.393390376217215e-05, "constant_fraction": 0.6713928454038179}, {"learning_rate": 0.37961556273097696, "beta1": 0.9962229435338128, "beta2": 0.8836171183399347, "epsilon": 3.8917682523735204e-08, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0030603885405222505, "warmup_fraction": 0.03455386001779087, "min_learning_rate_mult": 0.0, "constant_fraction": 0.668527976626565}, {"learning_rate": 0.10715243582705548, "beta1": 0.9806882178661133, "beta2": 0.9773712821618639, "epsilon": 0.0024329452767763698, "use_nesterov": true, "adamw_weight_decay": 0.0046002058943820645, "l2_weight_decay": 0.0, "warmup_fraction": 2.193141651710674e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.706796012492727}, {"learning_rate": 0.0002879645555822931, "beta1": 0.991352255304677, "beta2": 0.9996485865215379, "epsilon": 0.07604551896873818, "use_nesterov": false, "adamw_weight_decay": 0.0022118275145232365, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.04491347005186357, "constant_fraction": 0.7434889190657546}, {"learning_rate": 6.0384865305126824e-05, "beta1": 0.7829468486882, "beta2": 0.7284284735445979, "epsilon": 173.59746082096348, "use_nesterov": true, "adamw_weight_decay": 2.113995289269148e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0011483360206013162, "constant_fraction": 0.01714239444564547}, {"learning_rate": 4.178698196713881e-05, "beta1": 0.9937464598347113, "beta2": 0.999548639340075, "epsilon": 1.861679161217417e-07, "use_nesterov": false, "adamw_weight_decay": 7.94490300092056e-05, "l2_weight_decay": 0.001483676606571213, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0133072871946436, "constant_fraction": 0.14677744042362495}, {"learning_rate": 0.0001516998641494683, "beta1": 0.9259632315430333, "beta2": 0.7530600981016036, "epsilon": 3.473091381650328e-05, "use_nesterov": true, "adamw_weight_decay": 0.09781685896702463, "l2_weight_decay": 0.0011765470413444144, "warmup_fraction": 0.0, "min_learning_rate_mult": 4.4720412374314755e-05, "constant_fraction": 0.49350684058832683}, {"learning_rate": 0.8289326019207967, "beta1": 0.6859014917213138, "beta2": 0.9981193056832182, "epsilon": 0.00033734359484823283, "use_nesterov": true, "adamw_weight_decay": 4.142752871526671e-05, "l2_weight_decay": 0.001152250068230366, "warmup_fraction": 0.0005090494048740251, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6444470956890431}, {"learning_rate": 0.006290372759174715, "beta1": 0.9282212680343543, "beta2": 0.9899041427207379, "epsilon": 4326.904304796197, "use_nesterov": true, "adamw_weight_decay": 3.519653288813463e-05, "l2_weight_decay": 9.358998683349749e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0908150062554143, "constant_fraction": 0.9305517493431275}, {"learning_rate": 0.36795520904774043, "beta1": 0.6844473069553776, "beta2": 0.9991041265174682, "epsilon": 3.8256608699169866e-05, "use_nesterov": false, "adamw_weight_decay": 0.0009207463106340986, "l2_weight_decay": 0.0, "warmup_fraction": 0.01542776946199365, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5076372762625115}, {"learning_rate": 0.0066280667255352145, "beta1": 0.9829112878265135, "beta2": 0.9642958900372445, "epsilon": 0.012267161065815858, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.005488872697554227, "warmup_fraction": 5.8162735163525586e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8966386423945562}, {"learning_rate": 0.0071699960467921636, "beta1": 0.9532142536127078, "beta2": 0.5826480349134552, "epsilon": 49.64743571670105, "use_nesterov": false, "adamw_weight_decay": 0.023073912887363567, "l2_weight_decay": 0.0012542881191687383, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.00018731935269687762, "constant_fraction": 0.982469029522464}, {"learning_rate": 0.00018424596712179292, "beta1": 0.9436451527373279, "beta2": 0.9995663097575452, "epsilon": 1231.9799835447088, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 2.764264308003711e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.00048324792709895974, "constant_fraction": 0.11728066029885631}, {"learning_rate": 0.019710918331496033, "beta1": 0.9905445516016177, "beta2": 0.9977390942778436, "epsilon": 0.854845760122629, "use_nesterov": true, "adamw_weight_decay": 0.0006546699559252979, "l2_weight_decay": 0.0016799493891019013, "warmup_fraction": 0.05261681597836509, "min_learning_rate_mult": 0.5209457428329014, "constant_fraction": 0.6329952257498542}, {"learning_rate": 1.614688994367264e-05, "beta1": 0.5351903188391663, "beta2": 0.7284472974036125, "epsilon": 1614.7836800631892, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0007796843906643197, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5139477565142905}, {"learning_rate": 2.9648186174515388e-05, "beta1": 0.8666351109237997, "beta2": 0.9999805494902607, "epsilon": 0.016918946039181933, "use_nesterov": true, "adamw_weight_decay": 0.000397544687786519, "l2_weight_decay": 1.9637970951066396e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8314237860158111}, {"learning_rate": 0.0026771774284591707, "beta1": 0.9870681919883374, "beta2": 0.999949940352679, "epsilon": 256.2663747375169, "use_nesterov": true, "adamw_weight_decay": 9.189331274804064e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.00019030379186959524, "min_learning_rate_mult": 0.0, "constant_fraction": 0.23068770744042633}, {"learning_rate": 0.42533429454785343, "beta1": 0.9826919940164012, "beta2": 0.9999396745101942, "epsilon": 9.974329069412377e-08, "use_nesterov": false, "adamw_weight_decay": 0.006405534731719381, "l2_weight_decay": 0.09850728588028144, "warmup_fraction": 0.05192958775986463, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8835249352414272}, {"learning_rate": 0.0004284957672347059, "beta1": 0.9970962295764056, "beta2": 0.9964945089590497, "epsilon": 6.709008673301412, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 2.0367073299479743e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 9.81666144628278e-05, "constant_fraction": 0.03894769150788391}, {"learning_rate": 0.0004098001884668106, "beta1": 0.9955058489135423, "beta2": 0.9996904231154874, "epsilon": 4.0018282307411496e-08, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.5379621503905997e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 5.327085731160047e-05, "constant_fraction": 0.9674053077933659}, {"learning_rate": 1.3973387277718537e-05, "beta1": 0.9731924712774872, "beta2": 0.24341968630961563, "epsilon": 3.728394675357938, "use_nesterov": false, "adamw_weight_decay": 1.0929611507117251e-05, "l2_weight_decay": 7.440736679193559e-05, "warmup_fraction": 0.006275250211555397, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5947459079853987}, {"learning_rate": 0.6920967248626889, "beta1": 0.9848160249132055, "beta2": 0.9999601028139705, "epsilon": 0.008756066441567614, "use_nesterov": true, "adamw_weight_decay": 0.0928950937722487, "l2_weight_decay": 0.028680212275047096, "warmup_fraction": 0.031005140907675432, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9945553021611092}, {"learning_rate": 1.2626597082503364e-05, "beta1": 0.9673833806867478, "beta2": 0.9997558193144148, "epsilon": 0.5351697109388497, "use_nesterov": false, "adamw_weight_decay": 0.05385586273991676, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.2444874536319943}, {"learning_rate": 0.1947395313434653, "beta1": 0.9989780317850779, "beta2": 0.9999793257000292, "epsilon": 5.015246055385651e-07, "use_nesterov": true, "adamw_weight_decay": 0.0004878440758461413, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.40404352341285643}, {"learning_rate": 0.005945447944336607, "beta1": 0.10092276828994029, "beta2": 0.8918774079292681, "epsilon": 2.398734449458218e-07, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.050039710965606755, "warmup_fraction": 0.014454830432148201, "min_learning_rate_mult": 0.002790377635216, "constant_fraction": 0.670172458035294}, {"learning_rate": 8.338222439945072e-05, "beta1": 0.9877118562341449, "beta2": 0.9999878936034525, "epsilon": 321.51958495101394, "use_nesterov": false, "adamw_weight_decay": 0.020540143466759354, "l2_weight_decay": 0.000632003091120172, "warmup_fraction": 0.0005338817481256062, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8056890753686978}, {"learning_rate": 0.3974795793238859, "beta1": 0.9873453893110566, "beta2": 0.9999171924772728, "epsilon": 496.37429366573167, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0020561255459234777, "warmup_fraction": 0.0, "min_learning_rate_mult": 2.2626061539482938e-05, "constant_fraction": 0.715070491695452}, {"learning_rate": 0.18967822715413699, "beta1": 0.9859115763776624, "beta2": 0.0590714714111823, "epsilon": 15.10651052070765, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.4454424015687246e-05, "warmup_fraction": 0.00015952875340536043, "min_learning_rate_mult": 0.41692475359198744, "constant_fraction": 0.07896638085638752}, {"learning_rate": 0.010934907614006069, "beta1": 0.9679057997168892, "beta2": 0.9992628850226172, "epsilon": 0.7717437630029971, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0002609147393233507, "warmup_fraction": 6.764571326990585e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.342204818642053}, {"learning_rate": 0.36065727013853827, "beta1": 0.997018958119722, "beta2": 0.9765264891291133, "epsilon": 0.0003229819455720008, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.05613354591560181, "warmup_fraction": 0.0002958406070750656, "min_learning_rate_mult": 0.0007446476079048411, "constant_fraction": 0.8870195761822142}, {"learning_rate": 0.001153118322493084, "beta1": 0.8947735648204569, "beta2": 0.9999781960226166, "epsilon": 1.727572832047309e-07, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.011487986869190631, "warmup_fraction": 0.0013724198828846705, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5268787064042881}, {"learning_rate": 0.0016302236684954201, "beta1": 0.08221785954738459, "beta2": 0.9998910435421448, "epsilon": 452.42672308715765, "use_nesterov": false, "adamw_weight_decay": 0.08682310741943486, "l2_weight_decay": 0.0, "warmup_fraction": 0.0017028392657147287, "min_learning_rate_mult": 0.0, "constant_fraction": 0.25991465028224214}, {"learning_rate": 3.325791989423312e-05, "beta1": 0.9822091547331289, "beta2": 0.9947088933366675, "epsilon": 0.15022407084939093, "use_nesterov": false, "adamw_weight_decay": 1.3027088121739744e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.013749866548099881, "constant_fraction": 0.5513091838942841}, {"learning_rate": 0.00010631216413207391, "beta1": 0.9897416428252404, "beta2": 0.9999763615480425, "epsilon": 8.651426853928369, "use_nesterov": true, "adamw_weight_decay": 1.2954999887496763e-05, "l2_weight_decay": 0.0, "warmup_fraction": 2.122570743959026e-05, "min_learning_rate_mult": 0.023735771867648758, "constant_fraction": 0.3238496976486639}, {"learning_rate": 0.6648263208409538, "beta1": 0.03042370654803661, "beta2": 0.9764569238857974, "epsilon": 7.694110370515433e-07, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.07146104218017899, "warmup_fraction": 0.019991151402374688, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7112876569148775}, {"learning_rate": 1.172826403413707e-05, "beta1": 0.9984523880782935, "beta2": 0.9986910773523497, "epsilon": 2.6378065902122654e-05, "use_nesterov": false, "adamw_weight_decay": 0.0007550806613464561, "l2_weight_decay": 0.00035417921091531314, "warmup_fraction": 7.843483914542406e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.0029452890597918557}, {"learning_rate": 0.0001550173377393823, "beta1": 0.3580102983436487, "beta2": 0.8415688875276255, "epsilon": 0.013029164173069346, "use_nesterov": false, "adamw_weight_decay": 0.02401936282924632, "l2_weight_decay": 0.0, "warmup_fraction": 0.0004887312430563556, "min_learning_rate_mult": 0.8898615650442372, "constant_fraction": 0.23053439839972123}, {"learning_rate": 0.0007676758313697541, "beta1": 0.9508285505866256, "beta2": 0.9979606251451427, "epsilon": 1688.8157194064129, "use_nesterov": true, "adamw_weight_decay": 0.04703869046796081, "l2_weight_decay": 0.0022685945067434216, "warmup_fraction": 1.4268301068569592e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.48596246834512913}, {"learning_rate": 0.034086427084911115, "beta1": 0.9978946920875866, "beta2": 0.7270943214907382, "epsilon": 115.39652310482742, "use_nesterov": true, "adamw_weight_decay": 0.000455150119763976, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.370444823592606}, {"learning_rate": 0.00010200260143413255, "beta1": 0.9982784818004977, "beta2": 0.999977172154093, "epsilon": 1.0787609986690546e-05, "use_nesterov": false, "adamw_weight_decay": 0.05873438143482576, "l2_weight_decay": 0.003049678089968478, "warmup_fraction": 0.0012456489940732307, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5650389111550139}, {"learning_rate": 0.0006430513808021332, "beta1": 0.9927064276564994, "beta2": 0.9966149254517576, "epsilon": 0.20692666905637108, "use_nesterov": true, "adamw_weight_decay": 0.0048368853151643425, "l2_weight_decay": 0.0011564194996496599, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.003945064656250411, "constant_fraction": 0.05774240902381966}, {"learning_rate": 1.469341542044686e-05, "beta1": 0.9958579870855334, "beta2": 0.7271777677952485, "epsilon": 0.03135557623951734, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.007510275064508937, "warmup_fraction": 0.0008845535835318449, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8518588214207904}, {"learning_rate": 0.0025215841795343634, "beta1": 0.8996098741788451, "beta2": 0.9988947817950795, "epsilon": 209.23473417932092, "use_nesterov": false, "adamw_weight_decay": 0.045927958834528985, "l2_weight_decay": 0.0003863138149898099, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.2671200569932331, "constant_fraction": 0.7369638808695693}, {"learning_rate": 0.0022211283805878023, "beta1": 0.21470496559026642, "beta2": 0.9999860302344948, "epsilon": 141.36695378322437, "use_nesterov": true, "adamw_weight_decay": 0.018484169984221494, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.4529379087027535}, {"learning_rate": 0.01150949215409132, "beta1": 0.9906582589992178, "beta2": 0.9997778466943826, "epsilon": 0.09572951403610948, "use_nesterov": false, "adamw_weight_decay": 0.006029617912925349, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.003689345576950886, "constant_fraction": 0.19397384886326619}, {"learning_rate": 0.9451490384274867, "beta1": 0.9881261038634691, "beta2": 0.848217866850911, "epsilon": 0.00017898588804176135, "use_nesterov": true, "adamw_weight_decay": 1.3654260094894735e-05, "l2_weight_decay": 0.00017085744810181548, "warmup_fraction": 0.00011617792415404825, "min_learning_rate_mult": 0.0009251689516724963, "constant_fraction": 0.26250871819597876}, {"learning_rate": 0.004504371383545856, "beta1": 0.9985502429728336, "beta2": 0.9995318926504502, "epsilon": 0.015349391857104266, "use_nesterov": false, "adamw_weight_decay": 0.008774415965779362, "l2_weight_decay": 0.00015911551492444443, "warmup_fraction": 0.00487441642257809, "min_learning_rate_mult": 3.495982421724854e-05, "constant_fraction": 0.050432809700613146}, {"learning_rate": 0.46047016329462737, "beta1": 0.9950879503508385, "beta2": 0.8857267365086876, "epsilon": 2.005249509872115e-06, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.029722028584636212, "warmup_fraction": 7.863891381105295e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9214173377034355}, {"learning_rate": 1.784179219055176e-05, "beta1": 0.9539882899909359, "beta2": 0.9386920898925802, "epsilon": 0.2058813868506664, "use_nesterov": false, "adamw_weight_decay": 0.00018837147092523392, "l2_weight_decay": 0.0026486950627138788, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.44393828757367493}, {"learning_rate": 0.053924945547046875, "beta1": 0.9786525803099853, "beta2": 0.9999581501489969, "epsilon": 2210.4833121972288, "use_nesterov": true, "adamw_weight_decay": 0.009966519881057425, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0008525822672751425, "constant_fraction": 0.4821758154699711}, {"learning_rate": 3.139165600764007e-05, "beta1": 0.5375124531129745, "beta2": 0.9998452610988602, "epsilon": 3191.34239738279, "use_nesterov": false, "adamw_weight_decay": 0.022048270277081103, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.5309112969145681}, {"learning_rate": 0.00030222439237913474, "beta1": 0.9982576500630973, "beta2": 0.999963679670735, "epsilon": 22.983243706370747, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.1582134163599743e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7512533742892734}, {"learning_rate": 0.0002617059219615687, "beta1": 0.9970351217156647, "beta2": 0.2992625418322842, "epsilon": 0.021568692751336542, "use_nesterov": false, "adamw_weight_decay": 0.09045861001963942, "l2_weight_decay": 3.9144213539744565e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0827674113833982, "constant_fraction": 0.41025124558207904}, {"learning_rate": 0.0071046849059717716, "beta1": 0.9360442032175592, "beta2": 0.99998277845792, "epsilon": 262.2342450373285, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.05543885092704575, "warmup_fraction": 0.02496080969471613, "min_learning_rate_mult": 9.914764275695334e-05, "constant_fraction": 0.5687078667611464}, {"learning_rate": 0.0050162043260204275, "beta1": 0.21155647193531368, "beta2": 0.9999580272232039, "epsilon": 1883.2964489605135, "use_nesterov": false, "adamw_weight_decay": 1.622326846140025e-05, "l2_weight_decay": 0.0002673746285923772, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9434032378828878}, {"learning_rate": 0.13731615006335557, "beta1": 0.995380632539126, "beta2": 0.9999727206576899, "epsilon": 3.7526396011503675e-08, "use_nesterov": true, "adamw_weight_decay": 0.0013339657442176052, "l2_weight_decay": 6.790724433622241e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 1.0570023768035117e-05, "constant_fraction": 0.12755470079358178}, {"learning_rate": 0.009740704522524507, "beta1": 0.9988819832672182, "beta2": 0.9748313359631158, "epsilon": 3.0578869014564116, "use_nesterov": true, "adamw_weight_decay": 1.2191167192289218e-05, "l2_weight_decay": 0.0, "warmup_fraction": 9.492472434892115e-05, "min_learning_rate_mult": 1.8728202381429917e-05, "constant_fraction": 0.8825328247637165}, {"learning_rate": 0.028703697312903734, "beta1": 0.7624707395347554, "beta2": 0.6155529009727438, "epsilon": 0.025772657722100533, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0477221333110431, "warmup_fraction": 1.2671735766965743e-05, "min_learning_rate_mult": 0.0649657082976759, "constant_fraction": 0.4723685361948817}, {"learning_rate": 2.0712223524723224e-05, "beta1": 0.9836874270688376, "beta2": 0.995845501327273, "epsilon": 6.674719192912879e-05, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 5.080615891452274e-05, "warmup_fraction": 0.00022840308659971206, "min_learning_rate_mult": 0.283918035211839, "constant_fraction": 0.2562844308550636}, {"learning_rate": 0.00025507799213796075, "beta1": 0.9698405035635674, "beta2": 0.9999603359906739, "epsilon": 1.3468427233967094e-06, "use_nesterov": true, "adamw_weight_decay": 0.008308670841558409, "l2_weight_decay": 0.0013839142666626269, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.24973686098532344, "constant_fraction": 0.4773642906423754}, {"learning_rate": 1.6663206253925986e-05, "beta1": 0.8784151870675737, "beta2": 0.9999832105663897, "epsilon": 4.1707252081403424e-07, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.0018890509093483414, "warmup_fraction": 0.001015551111958815, "min_learning_rate_mult": 0.43517497751088907, "constant_fraction": 0.2580995926679406}, {"learning_rate": 0.7098098052886483, "beta1": 0.9980864605200949, "beta2": 0.9996278148752721, "epsilon": 0.0022301967623970177, "use_nesterov": false, "adamw_weight_decay": 1.9616003338090292e-05, "l2_weight_decay": 2.9620843065706782e-05, "warmup_fraction": 0.024658046216757754, "min_learning_rate_mult": 0.0, "constant_fraction": 0.36385931568544694}, {"learning_rate": 0.39973376514464876, "beta1": 0.9894128758831623, "beta2": 0.9998806550238931, "epsilon": 0.0027842027574324635, "use_nesterov": false, "adamw_weight_decay": 4.8762721539165315e-05, "l2_weight_decay": 3.82797125217456e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.02001743366669534, "constant_fraction": 0.47137528688096075}, {"learning_rate": 1.5149032505477192e-05, "beta1": 0.9954850948890529, "beta2": 0.9998263810981837, "epsilon": 9.9740617842949, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.028927004580473186, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.8368024876072879}, {"learning_rate": 0.0003103714628616701, "beta1": 0.9941698696528688, "beta2": 0.9939818008492655, "epsilon": 5.893214867316331e-06, "use_nesterov": false, "adamw_weight_decay": 0.05290915537411519, "l2_weight_decay": 0.0, "warmup_fraction": 0.0029335407440786144, "min_learning_rate_mult": 0.04583641437398137, "constant_fraction": 0.08350070494170692}, {"learning_rate": 0.5376946368118306, "beta1": 0.9764537769265424, "beta2": 0.9925926568647955, "epsilon": 0.00010111994504574597, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.004263927534760446, "warmup_fraction": 0.0022013282110630453, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6733529982884875}, {"learning_rate": 0.35875700771319824, "beta1": 0.9965339833020718, "beta2": 0.9925202653326151, "epsilon": 256.57034098469273, "use_nesterov": true, "adamw_weight_decay": 4.8555690134201324e-05, "l2_weight_decay": 2.1853831865519467e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.43547087571364046, "constant_fraction": 0.5929043583786645}, {"learning_rate": 0.00814205451791106, "beta1": 0.7774032808880488, "beta2": 0.6781654979175764, "epsilon": 8.496140046476211e-07, "use_nesterov": true, "adamw_weight_decay": 0.00017904611031791638, "l2_weight_decay": 0.014508497982771783, "warmup_fraction": 0.012929685363404301, "min_learning_rate_mult": 0.0, "constant_fraction": 0.29733211443421914}, {"learning_rate": 0.5203823804022731, "beta1": 0.8728519105556127, "beta2": 0.9999539550454947, "epsilon": 1.8445755786922437e-05, "use_nesterov": true, "adamw_weight_decay": 1.9435514404385542e-05, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.3291699103849296}, {"learning_rate": 0.5123992596755811, "beta1": 0.8117448617171268, "beta2": 0.9997435261036823, "epsilon": 3.182853352501608e-07, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00024054300356032794, "warmup_fraction": 0.0001728780295546935, "min_learning_rate_mult": 0.0, "constant_fraction": 0.03455944138877165}, {"learning_rate": 0.059304887691567276, "beta1": 0.9858190717673821, "beta2": 0.9956941272943237, "epsilon": 6137.888562642667, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 8.383863892653884e-05, "warmup_fraction": 0.00010533104801166922, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6417958373571204}, {"learning_rate": 0.025900379156207732, "beta1": 0.9261666551775474, "beta2": 0.5751836750150353, "epsilon": 7.951846645010479e-07, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00010932310098948478, "warmup_fraction": 4.1167220338643836e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9359407197975855}, {"learning_rate": 5.7878512084161096e-05, "beta1": 0.3807494559987086, "beta2": 0.9536291710072585, "epsilon": 0.00017225747195400866, "use_nesterov": true, "adamw_weight_decay": 0.0001813345827282743, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.38193681466268603}, {"learning_rate": 0.0036458282460504502, "beta1": 0.8152743244096224, "beta2": 0.9975406157170589, "epsilon": 3304.841031061812, "use_nesterov": false, "adamw_weight_decay": 0.0019198818490159147, "l2_weight_decay": 0.0, "warmup_fraction": 4.81045064477937e-05, "min_learning_rate_mult": 1.798464059822004e-05, "constant_fraction": 0.49297841223466443}, {"learning_rate": 2.498341388711816e-05, "beta1": 0.1747199921178204, "beta2": 0.9976977727666799, "epsilon": 0.09503648173107014, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00012556807763673518, "warmup_fraction": 0.03147734632670128, "min_learning_rate_mult": 0.0, "constant_fraction": 0.47225804925934844}, {"learning_rate": 0.0009441170205749714, "beta1": 0.6389397141974174, "beta2": 0.9966060886845735, "epsilon": 223.19347158854313, "use_nesterov": false, "adamw_weight_decay": 0.00041586994291315166, "l2_weight_decay": 0.0, "warmup_fraction": 0.006339086875275695, "min_learning_rate_mult": 0.0003633272118501893, "constant_fraction": 0.8196461298521129}, {"learning_rate": 7.037802633403875e-05, "beta1": 0.8001406843129946, "beta2": 0.9990955732279245, "epsilon": 2.7339749935075892e-08, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.002896989940560927, "warmup_fraction": 0.0027993066937506065, "min_learning_rate_mult": 0.0, "constant_fraction": 0.014083030712480848}, {"learning_rate": 3.151048320621296e-05, "beta1": 0.9959948488038226, "beta2": 0.9999765678803548, "epsilon": 79.24930775161653, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 2.5748873884240814e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.06815921153988524}, {"learning_rate": 0.006189816734156733, "beta1": 0.961113906991941, "beta2": 0.9999831609316767, "epsilon": 0.0011746901377543443, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.006409288682999275, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.9057878274796242}, {"learning_rate": 0.011475663715970313, "beta1": 0.9630430399942695, "beta2": 0.7710483289939327, "epsilon": 0.00031127674903142226, "use_nesterov": true, "adamw_weight_decay": 0.0002894715034634389, "l2_weight_decay": 3.980537427700214e-05, "warmup_fraction": 1.1095609361100388e-05, "min_learning_rate_mult": 0.006792573422971852, "constant_fraction": 0.9613574607624596}, {"learning_rate": 1.007223428077266e-05, "beta1": 0.9812929155436025, "beta2": 0.8315099477449481, "epsilon": 3.9777199990724355e-05, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 7.714371859652528e-05, "warmup_fraction": 0.006388519196287457, "min_learning_rate_mult": 0.031998897889218995, "constant_fraction": 0.27007822704211903}, {"learning_rate": 0.000561419244274309, "beta1": 0.6233547619701225, "beta2": 0.09607872303927179, "epsilon": 2.6179821900753176e-05, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 1.9704226190606497e-05, "warmup_fraction": 2.7297453517801838e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.6603782755826375}, {"learning_rate": 2.966517987553695e-05, "beta1": 0.8954544472938413, "beta2": 0.9999725288243176, "epsilon": 35.49557701556594, "use_nesterov": false, "adamw_weight_decay": 0.00016659651179855365, "l2_weight_decay": 0.010879393410056509, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.898425030252562}, {"learning_rate": 0.01235827698441609, "beta1": 0.4654417961777704, "beta2": 0.9999794260887395, "epsilon": 2066.6341665564255, "use_nesterov": true, "adamw_weight_decay": 0.0009679031605556754, "l2_weight_decay": 2.621529749599642e-05, "warmup_fraction": 0.03132215761223891, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7383621812362607}, {"learning_rate": 0.018989555327585735, "beta1": 0.6733756007009797, "beta2": 0.655099025142671, "epsilon": 0.002123810953582213, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 2.7079876560676115e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.22085304757018515, "constant_fraction": 0.4625424282890648}, {"learning_rate": 0.16734935171769283, "beta1": 0.9770720891642894, "beta2": 0.9996399157812367, "epsilon": 0.0003030072913885408, "use_nesterov": true, "adamw_weight_decay": 0.008177627328464155, "l2_weight_decay": 0.0, "warmup_fraction": 5.741483815130939e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.17671282495522211}, {"learning_rate": 2.2667221840699326e-05, "beta1": 0.9830910332575035, "beta2": 0.9994415514555506, "epsilon": 2.5559136479060126e-05, "use_nesterov": true, "adamw_weight_decay": 0.00875989335516939, "l2_weight_decay": 0.0, "warmup_fraction": 6.003238280516637e-05, "min_learning_rate_mult": 0.10725731664555398, "constant_fraction": 0.4127007351289401}, {"learning_rate": 4.610134299685991e-05, "beta1": 0.9851307887002553, "beta2": 0.9995782863313453, "epsilon": 0.012104550840156575, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.005043211955673438, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.334629005930106}, {"learning_rate": 0.08984844915071208, "beta1": 0.9979314561958956, "beta2": 0.9680267026326267, "epsilon": 2.3893770508512544, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.005785713332132993, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.20059182834894418}, {"learning_rate": 0.14163314778518063, "beta1": 0.9938952824863734, "beta2": 0.9999427411834982, "epsilon": 1.8605367131660794e-08, "use_nesterov": true, "adamw_weight_decay": 0.022037852626738567, "l2_weight_decay": 2.8248194250066893e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.01112057856571258}, {"learning_rate": 1.3034690612627948e-05, "beta1": 0.9949191043810265, "beta2": 0.9999824334666251, "epsilon": 0.004554619483739033, "use_nesterov": false, "adamw_weight_decay": 0.00024375825730490802, "l2_weight_decay": 0.0007778433115634134, "warmup_fraction": 0.0015990592556832843, "min_learning_rate_mult": 0.0001266591038695846, "constant_fraction": 0.2739476969115662}, {"learning_rate": 0.00022441836073018023, "beta1": 0.9952934513677794, "beta2": 0.9876238445676461, "epsilon": 5.919752389428743, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.00014942573546403818, "warmup_fraction": 0.038905017610602666, "min_learning_rate_mult": 0.05173444543342982, "constant_fraction": 0.38064708511045764}, {"learning_rate": 4.480217415653187e-05, "beta1": 0.8963333020795372, "beta2": 0.9935355995059724, "epsilon": 30.46255470669872, "use_nesterov": true, "adamw_weight_decay": 0.001215026170330586, "l2_weight_decay": 0.0, "warmup_fraction": 0.0, "min_learning_rate_mult": 2.212348403041992e-05, "constant_fraction": 0.6358817387316945}, {"learning_rate": 0.22503399310014138, "beta1": 0.9381199791083934, "beta2": 0.7633483689205961, "epsilon": 0.0024027044483422143, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 2.8497012811811337e-05, "warmup_fraction": 0.0005334493012778141, "min_learning_rate_mult": 0.0, "constant_fraction": 0.31758614672494534}, {"learning_rate": 1.4995429482589337e-05, "beta1": 0.8985384508063559, "beta2": 0.05093679080605307, "epsilon": 0.00015987694103884205, "use_nesterov": true, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.003278463878672844, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.004048888758028188, "constant_fraction": 0.2658559516688288}, {"learning_rate": 0.00014343938834426452, "beta1": 0.998705295977521, "beta2": 0.5248205951655771, "epsilon": 2.3963869367604934e-06, "use_nesterov": false, "adamw_weight_decay": 0.00011290206356046102, "l2_weight_decay": 0.0001762891848176236, "warmup_fraction": 0.058518173483950525, "min_learning_rate_mult": 0.020946807243365496, "constant_fraction": 0.3728708904107253}, {"learning_rate": 0.00013200687153944085, "beta1": 0.9973006490864917, "beta2": 0.989733025568773, "epsilon": 0.0060412446071534875, "use_nesterov": false, "adamw_weight_decay": 0.0002984473517507429, "l2_weight_decay": 4.081100818576508e-05, "warmup_fraction": 0.0, "min_learning_rate_mult": 9.57109313658189e-05, "constant_fraction": 0.4061364330469718}, {"learning_rate": 7.261906155480829e-05, "beta1": 0.7681814950653347, "beta2": 0.9999148290151134, "epsilon": 383.6605051990431, "use_nesterov": true, "adamw_weight_decay": 2.2926113742156803e-05, "l2_weight_decay": 0.0035910388279376732, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.007417626512364598, "constant_fraction": 0.37168524035785355}, {"learning_rate": 1.3048478265558753e-05, "beta1": 0.9387416081847262, "beta2": 0.9998736024635289, "epsilon": 1.7419761666476377, "use_nesterov": false, "adamw_weight_decay": 1.58456579671453e-05, "l2_weight_decay": 0.004273886929475364, "warmup_fraction": 1.5335728516361086e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.18228351903539042}, {"learning_rate": 7.852848580332433e-05, "beta1": 0.049024862404724145, "beta2": 0.9959878122060496, "epsilon": 2.2305075752547055e-05, "use_nesterov": true, "adamw_weight_decay": 0.0010016118134872948, "l2_weight_decay": 0.01073541661782933, "warmup_fraction": 1.600459785622812e-05, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7776699229827798}, {"learning_rate": 0.0002143145160620116, "beta1": 0.9935837551458588, "beta2": 0.999924301738625, "epsilon": 1.0223177949601507, "use_nesterov": true, "adamw_weight_decay": 8.077729526935568e-05, "l2_weight_decay": 0.0034230276302542363, "warmup_fraction": 0.0009021106551741756, "min_learning_rate_mult": 8.431046330484348e-05, "constant_fraction": 0.38011830427750615}, {"learning_rate": 0.045960193876507405, "beta1": 0.6216049881662518, "beta2": 0.22112706197867593, "epsilon": 472.20798777675, "use_nesterov": false, "adamw_weight_decay": 0.0, "l2_weight_decay": 0.004752640328136857, "warmup_fraction": 0.0, "min_learning_rate_mult": 0.0, "constant_fraction": 0.23045303180494148}, {"learning_rate": 0.04570368188261027, "beta1": 0.9834256932004822, "beta2": 0.9997816861609249, "epsilon": 6.684891091418533e-06, "use_nesterov": true, "adamw_weight_decay": 0.0004377371683928401, "l2_weight_decay": 0.0, "warmup_fraction": 0.0005525487323201233, "min_learning_rate_mult": 0.0, "constant_fraction": 0.7937974108202099}]