{"step": 1, "z/secs/update0": 36.77715162996901, "global_schedule": 0.0, "l2_grads": 0.3841651976108551, "l2_params": 212.34991455078125, "l2_updates": 0.0, "training_loss": 6.907755374908447, "uptime": 1019.7492486139527, "examples_seen": 1024.0, "progress": 8.970460274316676e-06, "epoch": 0.0008073449468011716}
{"step": 2, "global_schedule": 9.999999747378752e-05, "l2_grads": 0.37830421328544617, "l2_params": 212.34991455078125, "l2_updates": 4.514469765126705e-05, "training_loss": 6.9077558517456055, "uptime": 1021.0140698869945, "examples_seen": 2048.0, "progress": 1.794092054863335e-05, "epoch": 0.0016146898936023433}
{"step": 50, "global_schedule": 0.004900000058114529, "l2_grads": 0.3751427233219147, "l2_params": 212.34854125976562, "l2_updates": 0.011526807211339474, "training_loss": 6.907618999481201, "uptime": 1037.1863562499639, "examples_seen": 51200.0, "progress": 0.00044852301371583374, "epoch": 0.04036724734005858, "img/sec/core": 189.95458842691212, "core_hours_Tesla V100-SXM2-32GB": 0.07187682827986364, "core_hours": 0.07187682827986364}
{"step": 100, "global_schedule": 0.00989999994635582, "l2_grads": 0.4069517254829407, "l2_params": 212.34634399414062, "l2_updates": 0.02609073929488659, "training_loss": 6.904102325439453, "uptime": 1054.015289840987, "examples_seen": 102400.0, "progress": 0.0008970460274316675, "epoch": 0.08073449468011716, "img/sec/core": 190.14870922700345, "core_hours_Tesla V100-SXM2-32GB": 0.14667208868441067, "core_hours": 0.14667208868441067}
{"step": 150, "global_schedule": 0.01489999983459711, "l2_grads": 0.5133287310600281, "l2_params": 212.34576416015625, "l2_updates": 0.034448958933353424, "training_loss": 6.8940324783325195, "uptime": 1070.8714729379863, "examples_seen": 153600.0, "progress": 0.0013455690411475012, "epoch": 0.12110174202017573, "img/sec/core": 189.84131707549238, "core_hours_Tesla V100-SXM2-32GB": 0.22158845800440757, "core_hours": 0.22158845800440757}
{"step": 200, "global_schedule": 0.019899999722838402, "l2_grads": 0.46512937545776367, "l2_params": 212.35238647460938, "l2_updates": 0.041199058294296265, "training_loss": 6.883983612060547, "uptime": 1087.7153575840057, "examples_seen": 204800.0, "progress": 0.001794092054863335, "epoch": 0.16146898936023432, "img/sec/core": 189.97992845766893, "core_hours_Tesla V100-SXM2-32GB": 0.2964501675422717, "core_hours": 0.2964501675422717}
{"step": 250, "global_schedule": 0.024899998679757118, "l2_grads": 0.5569857358932495, "l2_params": 212.35763549804688, "l2_updates": 0.053473588079214096, "training_loss": 6.864233016967773, "uptime": 1104.5703630030039, "examples_seen": 256000.0, "progress": 0.0022426150685791687, "epoch": 0.2018362367002929, "img/sec/core": 189.85458149975477, "core_hours_Tesla V100-SXM2-32GB": 0.37136130273781925, "core_hours": 0.37136130273781925}
{"step": 301, "global_schedule": 0.029899999499320984, "l2_grads": 0.4773981273174286, "l2_params": 212.35842895507812, "l2_updates": 0.0573589913547039, "training_loss": 6.850568771362305, "uptime": 1121.4049053349881, "examples_seen": 307200.0, "progress": 0.0026911380822950024, "epoch": 0.24220348404035147, "img/sec/core": 190.08535764707185, "core_hours_Tesla V100-SXM2-32GB": 0.44618149087997155, "core_hours": 0.44618149087997155}
{"step": 350, "global_schedule": 0.0348999984562397, "l2_grads": 0.5207629203796387, "l2_params": 212.3541259765625, "l2_updates": 0.05447281524538994, "training_loss": 6.850642204284668, "uptime": 1138.2173919829656, "examples_seen": 358400.0, "progress": 0.003139661096010836, "epoch": 0.28257073138041006, "img/sec/core": 190.33472364927962, "core_hours_Tesla V100-SXM2-32GB": 0.5209036537598715, "core_hours": 0.5209036537598715}
{"step": 400, "global_schedule": 0.03989999741315842, "l2_grads": 0.7153612375259399, "l2_params": 212.3491668701172, "l2_updates": 0.07603023946285248, "training_loss": 6.801314830780029, "uptime": 1155.047138164984, "examples_seen": 409600.0, "progress": 0.00358818410972667, "epoch": 0.32293797872046864, "img/sec/core": 190.13952827280355, "core_hours_Tesla V100-SXM2-32GB": 0.5957025256799534, "core_hours": 0.5957025256799534}
{"step": 450, "global_schedule": 0.04490000009536743, "l2_grads": 0.47869959473609924, "l2_params": 212.341796875, "l2_updates": 0.06940924376249313, "training_loss": 6.810227394104004, "uptime": 1171.8867806809722, "examples_seen": 460800.0, "progress": 0.004036707123442504, "epoch": 0.36330522606052723, "img/sec/core": 190.0277869296702, "core_hours_Tesla V100-SXM2-32GB": 0.6705453813065672, "core_hours": 0.6705453813065672}
{"step": 500, "global_schedule": 0.04989999905228615, "l2_grads": 0.7584530711174011, "l2_params": 212.33615112304688, "l2_updates": 0.08718153834342957, "training_loss": 6.847325325012207, "uptime": 1188.7373644469772, "examples_seen": 512000.0, "progress": 0.004485230137158337, "epoch": 0.4036724734005858, "img/sec/core": 189.9044000158499, "core_hours_Tesla V100-SXM2-32GB": 0.7454368647110338, "core_hours": 0.7454368647110338}
{"step": 550, "global_schedule": 0.054899998009204865, "l2_grads": 0.697869598865509, "l2_params": 212.32810974121094, "l2_updates": 0.07738034427165985, "training_loss": 6.7430644035339355, "uptime": 1205.5626577329822, "examples_seen": 563200.0, "progress": 0.004933753150874172, "epoch": 0.44403972074064435, "img/sec/core": 190.1898496272692, "core_hours_Tesla V100-SXM2-32GB": 0.8202159459821673, "core_hours": 0.8202159459821673}
{"step": 600, "global_schedule": 0.05989999696612358, "l2_grads": 0.6585062146186829, "l2_params": 212.3126678466797, "l2_updates": 0.09547639638185501, "training_loss": 6.7133073806762695, "uptime": 1222.4116548749735, "examples_seen": 614400.0, "progress": 0.005382276164590005, "epoch": 0.48440696808070294, "img/sec/core": 189.92228279420388, "core_hours_Tesla V100-SXM2-32GB": 0.8951003777243507, "core_hours": 0.8951003777243507}
{"step": 650, "global_schedule": 0.0648999959230423, "l2_grads": 0.6562597751617432, "l2_params": 212.29798889160156, "l2_updates": 0.0915643721818924, "training_loss": 6.7676873207092285, "uptime": 1239.2510208970052, "examples_seen": 665600.0, "progress": 0.005830799178305839, "epoch": 0.5247742154207615, "img/sec/core": 190.03090709075897, "core_hours_Tesla V100-SXM2-32GB": 0.9699420044889363, "core_hours": 0.9699420044889363}
{"step": 700, "global_schedule": 0.06989999860525131, "l2_grads": 0.7616183161735535, "l2_params": 212.2822265625, "l2_updates": 0.10633880645036697, "training_loss": 6.66453218460083, "uptime": 1256.092698302993, "examples_seen": 716800.0, "progress": 0.006279322192021672, "epoch": 0.5651414627608201, "img/sec/core": 190.0048268863217, "core_hours_Tesla V100-SXM2-32GB": 1.0447939040711047, "core_hours": 1.0447939040711047}
{"step": 750, "global_schedule": 0.07490000128746033, "l2_grads": 0.8987081050872803, "l2_params": 212.26513671875, "l2_updates": 0.10668856650590897, "training_loss": 6.802181243896484, "uptime": 1272.941616800963, "examples_seen": 768000.0, "progress": 0.0067278452057375066, "epoch": 0.6055087101008787, "img/sec/core": 189.92316927555737, "core_hours_Tesla V100-SXM2-32GB": 1.119677986284304, "core_hours": 1.119677986284304}
{"step": 800, "global_schedule": 0.07989999651908875, "l2_grads": 0.8435737490653992, "l2_params": 212.250732421875, "l2_updates": 0.11747224628925323, "training_loss": 6.59929084777832, "uptime": 1289.8002230949933, "examples_seen": 819200.0, "progress": 0.00717636821945334, "epoch": 0.6458759574409373, "img/sec/core": 189.81402994938725, "core_hours_Tesla V100-SXM2-32GB": 1.1946051253688832, "core_hours": 1.1946051253688832}
{"step": 850, "global_schedule": 0.08489999920129776, "l2_grads": 0.9886293411254883, "l2_params": 212.23809814453125, "l2_updates": 0.11077166348695755, "training_loss": 6.598448753356934, "uptime": 1306.6200603540055, "examples_seen": 870400.0, "progress": 0.007624891233169174, "epoch": 0.6862432047809959, "img/sec/core": 190.25154350321677, "core_hours_Tesla V100-SXM2-32GB": 1.26935995763116, "core_hours": 1.26935995763116}
{"step": 900, "global_schedule": 0.08989999443292618, "l2_grads": 0.9542977213859558, "l2_params": 212.21762084960938, "l2_updates": 0.13020677864551544, "training_loss": 6.575689315795898, "uptime": 1323.466796321969, "examples_seen": 921600.0, "progress": 0.008073414246885008, "epoch": 0.7266104521210545, "img/sec/core": 189.94777422079076, "core_hours_Tesla V100-SXM2-32GB": 1.3442343397109977, "core_hours": 1.3442343397109977}
{"step": 950, "global_schedule": 0.09489999711513519, "l2_grads": 1.2547295093536377, "l2_params": 212.19290161132812, "l2_updates": 0.1354880928993225, "training_loss": 6.5643768310546875, "uptime": 1340.3151283169864, "examples_seen": 972800.0, "progress": 0.008521937260600842, "epoch": 0.766977699461113, "img/sec/core": 189.92978064216396, "core_hours_Tesla V100-SXM2-32GB": 1.419115815244408, "core_hours": 1.419115815244408}
{"step": 1000, "global_schedule": 0.09989999979734421, "l2_grads": 0.8950121402740479, "l2_params": 212.16995239257812, "l2_updates": 0.1344139724969864, "training_loss": 6.585766792297363, "uptime": 1357.1581117429887, "examples_seen": 1024000.0, "progress": 0.008970460274316675, "epoch": 0.8073449468011716, "img/sec/core": 189.99009374193272, "core_hours_Tesla V100-SXM2-32GB": 1.493973519359974, "core_hours": 1.493973519359974}
{"step": 1050, "global_schedule": 0.10489999502897263, "l2_grads": 0.947873055934906, "l2_params": 212.1444091796875, "l2_updates": 0.14903365075588226, "training_loss": 6.566429138183594, "uptime": 1374.58809968899, "examples_seen": 1075200.0, "progress": 0.009418983288032508, "epoch": 0.8477121941412302, "img/sec/core": 189.58498152935255, "core_hours_Tesla V100-SXM2-32GB": 1.5689911821911422, "core_hours": 1.5689911821911422}
{"step": 1100, "global_schedule": 0.10989999771118164, "l2_grads": 0.9693641066551208, "l2_params": 212.1219024658203, "l2_updates": 0.1348665952682495, "training_loss": 6.745870590209961, "uptime": 1391.4422742089955, "examples_seen": 1126400.0, "progress": 0.009867506301748343, "epoch": 0.8880794414812887, "img/sec/core": 189.86394119757585, "core_hours_Tesla V100-SXM2-32GB": 1.6438986245022775, "core_hours": 1.6438986245022775}
{"step": 1150, "global_schedule": 0.11490000039339066, "l2_grads": 0.9891306757926941, "l2_params": 212.08949279785156, "l2_updates": 0.14987768232822418, "training_loss": 6.43770694732666, "uptime": 1408.323534132971, "examples_seen": 1177600.0, "progress": 0.010316029315464176, "epoch": 0.9284466888213473, "img/sec/core": 189.55931099995863, "core_hours_Tesla V100-SXM2-32GB": 1.718926446386613, "core_hours": 1.718926446386613}
{"step": 1200, "global_schedule": 0.11989999562501907, "l2_grads": 1.576832890510559, "l2_params": 212.0582275390625, "l2_updates": 0.1437428742647171, "training_loss": 6.454758644104004, "uptime": 1425.2029171949835, "examples_seen": 1228800.0, "progress": 0.01076455232918001, "epoch": 0.9688139361614059, "img/sec/core": 189.58038858669462, "core_hours_Tesla V100-SXM2-32GB": 1.7939459266622242, "core_hours": 1.7939459266622242}
{"step": 1250, "global_schedule": 0.12489999830722809, "l2_grads": 1.185943841934204, "l2_params": 212.03353881835938, "l2_updates": 0.1629931777715683, "training_loss": 6.427267074584961, "uptime": 1442.0500463770004, "examples_seen": 1280000.0, "progress": 0.011213075342895845, "epoch": 1.0091811835014646, "img/sec/core": 189.94334081653284, "core_hours_Tesla V100-SXM2-32GB": 1.868822056360077, "core_hours": 1.868822056360077}
{"step": 1300, "global_schedule": 0.1298999935388565, "l2_grads": 1.0551913976669312, "l2_params": 211.9925994873047, "l2_updates": 0.16375231742858887, "training_loss": 6.417257308959961, "uptime": 1458.9097816129797, "examples_seen": 1331200.0, "progress": 0.011661598356611678, "epoch": 1.049548430841523, "img/sec/core": 189.80131984345036, "core_hours_Tesla V100-SXM2-32GB": 1.9437542129644296, "core_hours": 1.9437542129644296}
{"step": 1350, "global_schedule": 0.13490000367164612, "l2_grads": 1.9589065313339233, "l2_params": 211.9485321044922, "l2_updates": 0.14758896827697754, "training_loss": 6.674082279205322, "uptime": 1475.7715092719882, "examples_seen": 1382400.0, "progress": 0.012110121370327511, "epoch": 1.0899156781815817, "img/sec/core": 189.77889245473511, "core_hours_Tesla V100-SXM2-32GB": 2.018695224782245, "core_hours": 2.018695224782245}
{"step": 1400, "global_schedule": 0.13989999890327454, "l2_grads": 1.265500545501709, "l2_params": 211.89678955078125, "l2_updates": 0.1686880737543106, "training_loss": 6.339283466339111, "uptime": 1492.6287859959994, "examples_seen": 1433600.0, "progress": 0.012558644384043345, "epoch": 1.1302829255216402, "img/sec/core": 189.82900099409196, "core_hours_Tesla V100-SXM2-32GB": 2.0936164546667393, "core_hours": 2.0936164546667393}
{"step": 1450, "global_schedule": 0.14489999413490295, "l2_grads": 0.9331415295600891, "l2_params": 211.85028076171875, "l2_updates": 0.16482453048229218, "training_loss": 6.5578999519348145, "uptime": 1509.5087641909486, "examples_seen": 1484800.0, "progress": 0.01300716739775918, "epoch": 1.170650172861699, "img/sec/core": 189.57370460096303, "core_hours_Tesla V100-SXM2-32GB": 2.1686385799776247, "core_hours": 2.1686385799776247}
{"step": 1500, "global_schedule": 0.14989998936653137, "l2_grads": 1.5567680597305298, "l2_params": 211.80557250976562, "l2_updates": 0.16479498147964478, "training_loss": 6.318841934204102, "uptime": 1526.3698696109932, "examples_seen": 1536000.0, "progress": 0.013455690411475013, "epoch": 1.2110174202017574, "img/sec/core": 189.78589601817052, "core_hours_Tesla V100-SXM2-32GB": 2.243576826288934, "core_hours": 2.243576826288934}
{"step": 1550, "global_schedule": 0.15489999949932098, "l2_grads": 1.0738747119903564, "l2_params": 211.76063537597656, "l2_updates": 0.17487972974777222, "training_loss": 6.457380294799805, "uptime": 1543.2519255639636, "examples_seen": 1587200.0, "progress": 0.013904213425190846, "epoch": 1.2513846675418159, "img/sec/core": 189.55037282866954, "core_hours_Tesla V100-SXM2-32GB": 2.3186081860799135, "core_hours": 2.3186081860799135}
{"step": 1600, "global_schedule": 0.1598999947309494, "l2_grads": 1.091365933418274, "l2_params": 211.72296142578125, "l2_updates": 0.20142149925231934, "training_loss": 6.33799934387207, "uptime": 1560.1327250379836, "examples_seen": 1638400.0, "progress": 0.01435273643890668, "epoch": 1.2917519148818746, "img/sec/core": 189.5644815238094, "core_hours_Tesla V100-SXM2-32GB": 2.3936339615200026, "core_hours": 2.3936339615200026}
{"step": 1651, "global_schedule": 0.16489998996257782, "l2_grads": 0.9972646832466125, "l2_params": 211.66734313964844, "l2_updates": 0.18598413467407227, "training_loss": 6.535104751586914, "uptime": 1577.0191678279662, "examples_seen": 1689600.0, "progress": 0.014801259452622515, "epoch": 1.332119162221933, "img/sec/core": 189.50113056956675, "core_hours_Tesla V100-SXM2-32GB": 2.4686848183643693, "core_hours": 2.4686848183643693}
{"step": 1700, "global_schedule": 0.16990000009536743, "l2_grads": 0.9286719560623169, "l2_params": 211.6153106689453, "l2_updates": 0.18683476746082306, "training_loss": 6.681849956512451, "uptime": 1593.8757753829705, "examples_seen": 1740800.0, "progress": 0.015249782466338348, "epoch": 1.3724864095619917, "img/sec/core": 189.83653677397268, "core_hours_Tesla V100-SXM2-32GB": 2.5436030741643885, "core_hours": 2.5436030741643885}
{"step": 1750, "global_schedule": 0.17489999532699585, "l2_grads": 0.7875488996505737, "l2_params": 211.55044555664062, "l2_updates": 0.168821319937706, "training_loss": 6.533246994018555, "uptime": 1610.7488157549524, "examples_seen": 1792000.0, "progress": 0.015698305480054183, "epoch": 1.4128536569020502, "img/sec/core": 189.65165313737268, "core_hours_Tesla V100-SXM2-32GB": 2.6185943647065306, "core_hours": 2.6185943647065306}
{"step": 1800, "global_schedule": 0.17989999055862427, "l2_grads": 1.10337495803833, "l2_params": 211.48440551757812, "l2_updates": 0.2199375182390213, "training_loss": 6.261199951171875, "uptime": 1627.5939044649713, "examples_seen": 1843200.0, "progress": 0.016146828493770016, "epoch": 1.453220904242109, "img/sec/core": 189.96634895111868, "core_hours_Tesla V100-SXM2-32GB": 2.6934614256399474, "core_hours": 2.6934614256399474}
{"step": 1850, "global_schedule": 0.18490000069141388, "l2_grads": 0.8725283741950989, "l2_params": 211.43760681152344, "l2_updates": 0.21331867575645447, "training_loss": 6.374260902404785, "uptime": 1644.4734152199817, "examples_seen": 1894400.0, "progress": 0.01659535150748585, "epoch": 1.4935881515821674, "img/sec/core": 189.57895441668123, "core_hours_Tesla V100-SXM2-32GB": 2.768481473439994, "core_hours": 2.768481473439994}
{"step": 1900, "global_schedule": 0.1898999959230423, "l2_grads": 1.1577177047729492, "l2_params": 211.3816375732422, "l2_updates": 0.2454456239938736, "training_loss": 6.264530658721924, "uptime": 1661.3491060379893, "examples_seen": 1945600.0, "progress": 0.017043874521201683, "epoch": 1.533955398922226, "img/sec/core": 189.62186701034906, "core_hours_Tesla V100-SXM2-32GB": 2.84348454374225, "core_hours": 2.84348454374225}
{"step": 1950, "global_schedule": 0.19489999115467072, "l2_grads": 0.9730181694030762, "l2_params": 211.33087158203125, "l2_updates": 0.20053783059120178, "training_loss": 6.683507919311523, "uptime": 1678.2239180390025, "examples_seen": 1996800.0, "progress": 0.017492397534917516, "epoch": 1.5743226462622846, "img/sec/core": 189.6317422563206, "core_hours_Tesla V100-SXM2-32GB": 2.9184837081911974, "core_hours": 2.9184837081911974}
{"step": 2000, "global_schedule": 0.19990000128746033, "l2_grads": 1.3647950887680054, "l2_params": 211.2782440185547, "l2_updates": 0.24189884960651398, "training_loss": 6.190445899963379, "uptime": 1695.0806546759559, "examples_seen": 2048000.0, "progress": 0.01794092054863335, "epoch": 1.6146898936023433, "img/sec/core": 189.83508308393112, "core_hours_Tesla V100-SXM2-32GB": 2.993402537688768, "core_hours": 2.993402537688768}
{"step": 2050, "global_schedule": 0.20489999651908875, "l2_grads": 1.2686421871185303, "l2_params": 211.2200469970703, "l2_updates": 0.22831912338733673, "training_loss": 6.195512294769287, "uptime": 1712.5055237699999, "examples_seen": 2099200.0, "progress": 0.018389443562349183, "epoch": 1.6550571409424017, "img/sec/core": 189.56311351129517, "core_hours_Tesla V100-SXM2-32GB": 3.06842885456436, "core_hours": 3.06842885456436}
{"step": 2100, "global_schedule": 0.20989999175071716, "l2_grads": 1.0674551725387573, "l2_params": 211.16543579101562, "l2_updates": 0.24717561900615692, "training_loss": 6.693784713745117, "uptime": 1729.364800426003, "examples_seen": 2150400.0, "progress": 0.018837966576065016, "epoch": 1.6954243882824604, "img/sec/core": 189.80648252548565, "core_hours_Tesla V100-SXM2-32GB": 3.143358973035485, "core_hours": 3.143358973035485}
{"step": 2150, "global_schedule": 0.21490000188350677, "l2_grads": 1.0857622623443604, "l2_params": 211.11610412597656, "l2_updates": 0.23398788273334503, "training_loss": 6.3076934814453125, "uptime": 1746.2343293639715, "examples_seen": 2201600.0, "progress": 0.019286489589780853, "epoch": 1.735791635622519, "img/sec/core": 189.6911295962584, "core_hours_Tesla V100-SXM2-32GB": 3.2183346572042337, "core_hours": 3.2183346572042337}
{"step": 2200, "global_schedule": 0.2198999971151352, "l2_grads": 1.4360867738723755, "l2_params": 211.0568084716797, "l2_updates": 0.2499805986881256, "training_loss": 6.147745132446289, "uptime": 1763.1030209210003, "examples_seen": 2252800.0, "progress": 0.019735012603496686, "epoch": 1.7761588829625774, "img/sec/core": 189.70054607860996, "core_hours_Tesla V100-SXM2-32GB": 3.2933066196799174, "core_hours": 3.2933066196799174}
{"step": 2250, "global_schedule": 0.2248999923467636, "l2_grads": 1.2710508108139038, "l2_params": 211.016845703125, "l2_updates": 0.2524035573005676, "training_loss": 6.219675540924072, "uptime": 1779.9674811050063, "examples_seen": 2304000.0, "progress": 0.02018353561721252, "epoch": 1.816526130302636, "img/sec/core": 189.74814284508363, "core_hours_Tesla V100-SXM2-32GB": 3.3682597760532778, "core_hours": 3.3682597760532778}
{"step": 2300, "global_schedule": 0.22989998757839203, "l2_grads": 1.0430461168289185, "l2_params": 210.96722412109375, "l2_updates": 0.2839798629283905, "training_loss": 6.138179302215576, "uptime": 1796.8524792219978, "examples_seen": 2355200.0, "progress": 0.020632058630928353, "epoch": 1.8568933776426946, "img/sec/core": 189.5173442027109, "core_hours_Tesla V100-SXM2-32GB": 3.4433042121287953, "core_hours": 3.4433042121287953}
{"step": 2350, "global_schedule": 0.23489999771118164, "l2_grads": 1.4234975576400757, "l2_params": 210.92947387695312, "l2_updates": 0.2560364603996277, "training_loss": 6.106334686279297, "uptime": 1813.7294145749765, "examples_seen": 2406400.0, "progress": 0.021080581644644186, "epoch": 1.8972606249827533, "img/sec/core": 189.60788395952486, "core_hours_Tesla V100-SXM2-32GB": 3.5183128136975896, "core_hours": 3.5183128136975896}
{"step": 2400, "global_schedule": 0.23989999294281006, "l2_grads": 1.1771776676177979, "l2_params": 210.89678955078125, "l2_updates": 0.29244306683540344, "training_loss": 6.72015905380249, "uptime": 1830.5940418419777, "examples_seen": 2457600.0, "progress": 0.02152910465836002, "epoch": 1.9376278723228118, "img/sec/core": 189.7462629524816, "core_hours_Tesla V100-SXM2-32GB": 3.59326671266204, "core_hours": 3.59326671266204}
{"step": 2450, "global_schedule": 0.24489998817443848, "l2_grads": 1.4805049896240234, "l2_params": 210.84963989257812, "l2_updates": 0.2797256410121918, "training_loss": 6.0125274658203125, "uptime": 1847.4619450699538, "examples_seen": 2508800.0, "progress": 0.021977627672075853, "epoch": 1.9779951196628704, "img/sec/core": 189.70941181905042, "core_hours_Tesla V100-SXM2-32GB": 3.668235171453044, "core_hours": 3.668235171453044}
{"step": 2500, "global_schedule": 0.2498999983072281, "l2_grads": 1.0897737741470337, "l2_params": 210.78736877441406, "l2_updates": 0.27848103642463684, "training_loss": 6.470258712768555, "uptime": 1864.3409112839727, "examples_seen": 2560000.0, "progress": 0.02242615068579169, "epoch": 2.018362367002929, "img/sec/core": 189.5850705206241, "core_hours_Tesla V100-SXM2-32GB": 3.743252799070906, "core_hours": 3.743252799070906, "minival/prec@1": 0.04534811114580081, "minival/loss": 5.719629302606931, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.9427635720348917, "real/prec@1": 0.05156179943207293, "real/loss": 7.100046166592384, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.18998681899393, "train/prec@1": 0.0475354173984311, "train/loss": 5.701164915555814, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.7658189730136655, "v2/prec@1": 0.0348, "v2/loss": 5.89902158203125, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3455623739864677, "val/prec@1": 0.0447, "val/loss": 5.744050029296875, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.297316540032625}
{"step": 2550, "global_schedule": 0.2549000084400177, "l2_grads": 1.2661840915679932, "l2_params": 210.7340545654297, "l2_updates": 0.2910936772823334, "training_loss": 6.660520553588867, "uptime": 1917.7800747689907, "examples_seen": 2611200.0, "progress": 0.022874673699507523, "epoch": 2.0587296143429876, "img/sec/core": 189.39714586194583, "core_hours_Tesla V100-SXM2-32GB": 3.818344861084285, "core_hours": 3.818344861084285}
{"step": 2600, "global_schedule": 0.2599000036716461, "l2_grads": 1.112388253211975, "l2_params": 210.7017059326172, "l2_updates": 0.3142172694206238, "training_loss": 5.970408916473389, "uptime": 1934.6383743829792, "examples_seen": 2662400.0, "progress": 0.023323196713223356, "epoch": 2.099096861683046, "img/sec/core": 189.81748297703402, "core_hours_Tesla V100-SXM2-32GB": 3.8932706371464563, "core_hours": 3.8932706371464563}
{"step": 2650, "global_schedule": 0.26489999890327454, "l2_grads": 1.1196500062942505, "l2_params": 210.68026733398438, "l2_updates": 0.3213540017604828, "training_loss": 6.041751384735107, "uptime": 1951.5111796849524, "examples_seen": 2713600.0, "progress": 0.02377171972693919, "epoch": 2.1394641090231046, "img/sec/core": 189.654295342683, "core_hours_Tesla V100-SXM2-32GB": 3.968260882933003, "core_hours": 3.968260882933003}
{"step": 2700, "global_schedule": 0.26989999413490295, "l2_grads": 1.2827777862548828, "l2_params": 210.6323699951172, "l2_updates": 0.2775523364543915, "training_loss": 6.2525739669799805, "uptime": 1968.3550305859535, "examples_seen": 2764800.0, "progress": 0.024220242740655023, "epoch": 2.1798313563631635, "img/sec/core": 189.98030906399228, "core_hours_Tesla V100-SXM2-32GB": 4.043122442493009, "core_hours": 4.043122442493009}
{"step": 2750, "global_schedule": 0.27489998936653137, "l2_grads": 1.2286916971206665, "l2_params": 210.6066436767578, "l2_updates": 0.31539103388786316, "training_loss": 6.371133804321289, "uptime": 1985.2245832799817, "examples_seen": 2816000.0, "progress": 0.024668765754370856, "epoch": 2.220198603703222, "img/sec/core": 189.69086246920986, "core_hours_Tesla V100-SXM2-32GB": 4.118098232244245, "core_hours": 4.118098232244245}
{"step": 2800, "global_schedule": 0.2798999845981598, "l2_grads": 1.2482737302780151, "l2_params": 210.56948852539062, "l2_updates": 0.32022595405578613, "training_loss": 5.996687889099121, "uptime": 2002.0919529589592, "examples_seen": 2867200.0, "progress": 0.02511728876808669, "epoch": 2.2605658510432804, "img/sec/core": 189.71541271122487, "core_hours_Tesla V100-SXM2-32GB": 4.193064319706367, "core_hours": 4.193064319706367}
{"step": 2850, "global_schedule": 0.2848999798297882, "l2_grads": 1.3390990495681763, "l2_params": 210.5488739013672, "l2_updates": 0.3144247233867645, "training_loss": 6.124295234680176, "uptime": 2018.97138833598, "examples_seen": 2918400.0, "progress": 0.025565811781802523, "epoch": 2.300933098383339, "img/sec/core": 189.5798010137461, "core_hours_Tesla V100-SXM2-32GB": 4.2680840324931255, "core_hours": 4.2680840324931255}
{"step": 2900, "global_schedule": 0.289900004863739, "l2_grads": 1.4471417665481567, "l2_params": 210.54039001464844, "l2_updates": 0.3001730740070343, "training_loss": 6.522437572479248, "uptime": 2035.8488446959527, "examples_seen": 2969600.0, "progress": 0.02601433479551836, "epoch": 2.341300345723398, "img/sec/core": 189.6020307650894, "core_hours_Tesla V100-SXM2-32GB": 4.3430949496485605, "core_hours": 4.3430949496485605}
{"step": 2950, "global_schedule": 0.29490000009536743, "l2_grads": 1.0076826810836792, "l2_params": 210.52354431152344, "l2_updates": 0.35627037286758423, "training_loss": 6.214904308319092, "uptime": 2052.7316626639804, "examples_seen": 3020800.0, "progress": 0.026462857809234193, "epoch": 2.3816675930634563, "img/sec/core": 189.54181737077863, "core_hours_Tesla V100-SXM2-32GB": 4.418129696173128, "core_hours": 4.418129696173128}
{"step": 3000, "global_schedule": 0.29989999532699585, "l2_grads": 1.211171269416809, "l2_params": 210.50698852539062, "l2_updates": 0.3555494546890259, "training_loss": 5.930032730102539, "uptime": 2069.574805716984, "examples_seen": 3072000.0, "progress": 0.026911380822950026, "epoch": 2.422034840403515, "img/sec/core": 189.98829315466472, "core_hours_Tesla V100-SXM2-32GB": 4.492988109742033, "core_hours": 4.492988109742033}
{"step": 3050, "global_schedule": 0.30489999055862427, "l2_grads": 1.3994032144546509, "l2_params": 210.50621032714844, "l2_updates": 0.3482573628425598, "training_loss": 6.345682144165039, "uptime": 2087.242051298963, "examples_seen": 3123200.0, "progress": 0.02735990383666586, "epoch": 2.4624020877435733, "img/sec/core": 189.5793412800794, "core_hours_Tesla V100-SXM2-32GB": 4.568008004453086, "core_hours": 4.568008004453086}
{"step": 3100, "global_schedule": 0.3098999857902527, "l2_grads": 1.145997405052185, "l2_params": 210.49526977539062, "l2_updates": 0.34622037410736084, "training_loss": 5.976232051849365, "uptime": 2104.109938077978, "examples_seen": 3174400.0, "progress": 0.027808426850381693, "epoch": 2.5027693350836318, "img/sec/core": 189.70959681689735, "core_hours_Tesla V100-SXM2-32GB": 4.642976390137595, "core_hours": 4.642976390137595}
{"step": 3150, "global_schedule": 0.3148999810218811, "l2_grads": 1.1112520694732666, "l2_params": 210.51194763183594, "l2_updates": 0.38637858629226685, "training_loss": 5.869185924530029, "uptime": 2120.987306439958, "examples_seen": 3225600.0, "progress": 0.028256949864097526, "epoch": 2.5431365824236907, "img/sec/core": 189.60301934326864, "core_hours_Tesla V100-SXM2-32GB": 4.717986916190841, "core_hours": 4.717986916190841}
{"step": 3200, "global_schedule": 0.3199000060558319, "l2_grads": 1.3811664581298828, "l2_params": 210.49996948242188, "l2_updates": 0.3628596365451813, "training_loss": 5.87326192855835, "uptime": 2137.851776029973, "examples_seen": 3276800.0, "progress": 0.02870547287781336, "epoch": 2.583503829763749, "img/sec/core": 189.7480370147352, "core_hours_Tesla V100-SXM2-32GB": 4.792940114368685, "core_hours": 4.792940114368685}
{"step": 3250, "global_schedule": 0.3249000012874603, "l2_grads": 1.3017022609710693, "l2_params": 210.53106689453125, "l2_updates": 0.34679847955703735, "training_loss": 6.612641334533691, "uptime": 2154.7350705769495, "examples_seen": 3328000.0, "progress": 0.029153995891529193, "epoch": 2.6238710771038076, "img/sec/core": 189.53646701455128, "core_hours_Tesla V100-SXM2-32GB": 4.867976979021915, "core_hours": 4.867976979021915}
{"step": 3300, "global_schedule": 0.32989999651908875, "l2_grads": 1.2983148097991943, "l2_params": 210.533935546875, "l2_updates": 0.3903762698173523, "training_loss": 5.972095966339111, "uptime": 2171.615745435003, "examples_seen": 3379200.0, "progress": 0.02960251890524503, "epoch": 2.664238324443866, "img/sec/core": 189.56588092053067, "core_hours_Tesla V100-SXM2-32GB": 4.943002200613264, "core_hours": 4.943002200613264}
{"step": 3350, "global_schedule": 0.33489999175071716, "l2_grads": 1.4048622846603394, "l2_params": 210.55276489257812, "l2_updates": 0.35953113436698914, "training_loss": 6.300963878631592, "uptime": 2188.5061879049754, "examples_seen": 3430400.0, "progress": 0.030051041918960863, "epoch": 2.704605571783925, "img/sec/core": 189.45625644141396, "core_hours_Tesla V100-SXM2-32GB": 5.01807083381314, "core_hours": 5.01807083381314}
{"step": 3401, "global_schedule": 0.3398999869823456, "l2_grads": 0.9841370582580566, "l2_params": 210.59893798828125, "l2_updates": 0.36661213636398315, "training_loss": 6.3623456954956055, "uptime": 2205.3967173869605, "examples_seen": 3481600.0, "progress": 0.030499564932676696, "epoch": 2.7449728191239835, "img/sec/core": 189.4552804524577, "core_hours_Tesla V100-SXM2-32GB": 5.093139853733074, "core_hours": 5.093139853733074}
{"step": 3450, "global_schedule": 0.344899982213974, "l2_grads": 1.2305545806884766, "l2_params": 210.6353759765625, "l2_updates": 0.39278748631477356, "training_loss": 5.969921112060547, "uptime": 2222.259158234985, "examples_seen": 3532800.0, "progress": 0.03094808794639253, "epoch": 2.785340066464042, "img/sec/core": 189.77086584560982, "core_hours_Tesla V100-SXM2-32GB": 5.16808403527985, "core_hours": 5.16808403527985}
{"step": 3500, "global_schedule": 0.3498999774456024, "l2_grads": 1.4215236902236938, "l2_params": 210.650390625, "l2_updates": 0.3586690425872803, "training_loss": 6.365225791931152, "uptime": 2239.1619628399494, "examples_seen": 3584000.0, "progress": 0.031396610960108366, "epoch": 2.8257073138041005, "img/sec/core": 189.31769459490553, "core_hours_Tesla V100-SXM2-32GB": 5.243207611301914, "core_hours": 5.243207611301914}
{"step": 3550, "global_schedule": 0.3549000024795532, "l2_grads": 1.169923186302185, "l2_params": 210.7021484375, "l2_updates": 0.41266506910324097, "training_loss": 5.793849468231201, "uptime": 2256.027776064002, "examples_seen": 3635200.0, "progress": 0.0318451339738242, "epoch": 2.8660745611441594, "img/sec/core": 189.73292052330098, "core_hours_Tesla V100-SXM2-32GB": 5.318166781186592, "core_hours": 5.318166781186592}
{"step": 3600, "global_schedule": 0.35989999771118164, "l2_grads": 1.0210198163986206, "l2_params": 210.74549865722656, "l2_updates": 0.40268781781196594, "training_loss": 6.22429084777832, "uptime": 2272.9100328619825, "examples_seen": 3686400.0, "progress": 0.03229365698754003, "epoch": 2.906441808484218, "img/sec/core": 189.5481177838018, "core_hours_Tesla V100-SXM2-32GB": 5.393199033622062, "core_hours": 5.393199033622062}
{"step": 3650, "global_schedule": 0.36489999294281006, "l2_grads": 1.0282480716705322, "l2_params": 210.7711181640625, "l2_updates": 0.4401716887950897, "training_loss": 5.845099449157715, "uptime": 2289.7753749309923, "examples_seen": 3737600.0, "progress": 0.032742180001255866, "epoch": 2.9468090558242763, "img/sec/core": 189.73822095669368, "core_hours_Tesla V100-SXM2-32GB": 5.468156109484326, "core_hours": 5.468156109484326}
{"step": 3700, "global_schedule": 0.3698999881744385, "l2_grads": 1.2120044231414795, "l2_params": 210.82656860351562, "l2_updates": 0.44731032848358154, "training_loss": 5.694382190704346, "uptime": 2306.6575183399837, "examples_seen": 3788800.0, "progress": 0.0331907030149717, "epoch": 2.987176303164335, "img/sec/core": 189.54939088455356, "core_hours_Tesla V100-SXM2-32GB": 5.543187857968733, "core_hours": 5.543187857968733}
{"step": 3750, "global_schedule": 0.3748999834060669, "l2_grads": 1.3104119300842285, "l2_params": 210.90872192382812, "l2_updates": 0.4125710129737854, "training_loss": 5.652183532714844, "uptime": 2323.527550383995, "examples_seen": 3840000.0, "progress": 0.03363922602868753, "epoch": 3.0275435505043933, "img/sec/core": 189.68547253803197, "core_hours_Tesla V100-SXM2-32GB": 5.618165778164338, "core_hours": 5.618165778164338}
{"step": 3800, "global_schedule": 0.3798999786376953, "l2_grads": 0.8944023251533508, "l2_params": 211.00372314453125, "l2_updates": 0.3971507251262665, "training_loss": 6.149394989013672, "uptime": 2340.40511083795, "examples_seen": 3891200.0, "progress": 0.034087749042403366, "epoch": 3.067910797844452, "img/sec/core": 189.6008613762727, "core_hours_Tesla V100-SXM2-32GB": 5.693177157959694, "core_hours": 5.693177157959694}
{"step": 3850, "global_schedule": 0.3849000036716461, "l2_grads": 1.7115428447723389, "l2_params": 211.10411071777344, "l2_updates": 0.44297629594802856, "training_loss": 5.75006103515625, "uptime": 2357.291265397973, "examples_seen": 3942400.0, "progress": 0.0345362720561192, "epoch": 3.1082780451845107, "img/sec/core": 189.50436516646712, "core_hours_Tesla V100-SXM2-32GB": 5.768226733782018, "core_hours": 5.768226733782018}
{"step": 3900, "global_schedule": 0.38989999890327454, "l2_grads": 1.1209264993667603, "l2_params": 211.21078491210938, "l2_updates": 0.48146766424179077, "training_loss": 5.699551105499268, "uptime": 2374.173010784958, "examples_seen": 3993600.0, "progress": 0.03498479506983503, "epoch": 3.148645292524569, "img/sec/core": 189.55385990284032, "core_hours_Tesla V100-SXM2-32GB": 5.84325671327973, "core_hours": 5.84325671327973}
{"step": 3950, "global_schedule": 0.39489999413490295, "l2_grads": 1.4003711938858032, "l2_params": 211.31483459472656, "l2_updates": 0.43571749329566956, "training_loss": 5.9069695472717285, "uptime": 2391.0712218309636, "examples_seen": 4044800.0, "progress": 0.035433318083550866, "epoch": 3.1890125398646276, "img/sec/core": 189.36915814863232, "core_hours_Tesla V100-SXM2-32GB": 5.9183598734841985, "core_hours": 5.9183598734841985}
{"step": 4000, "global_schedule": 0.39989998936653137, "l2_grads": 1.0448046922683716, "l2_params": 211.38992309570312, "l2_updates": 0.5241608023643494, "training_loss": 5.692379951477051, "uptime": 2407.97535163298, "examples_seen": 4096000.0, "progress": 0.0358818410972667, "epoch": 3.2293797872046865, "img/sec/core": 189.30285305891718, "core_hours_Tesla V100-SXM2-32GB": 5.99348933927094, "core_hours": 5.99348933927094}
{"step": 4050, "global_schedule": 0.4048999845981598, "l2_grads": 0.948795735836029, "l2_params": 211.49301147460938, "l2_updates": 0.4654107093811035, "training_loss": 5.827812194824219, "uptime": 2425.651557873003, "examples_seen": 4147200.0, "progress": 0.03633036411098253, "epoch": 3.269747034544745, "img/sec/core": 189.2963031588471, "core_hours_Tesla V100-SXM2-32GB": 6.068621404635617, "core_hours": 6.068621404635617}
{"step": 4100, "global_schedule": 0.4098999798297882, "l2_grads": 1.2236398458480835, "l2_params": 211.65625, "l2_updates": 0.4833448827266693, "training_loss": 6.344205379486084, "uptime": 2442.5508804940036, "examples_seen": 4198400.0, "progress": 0.036778887124698366, "epoch": 3.3101142818848035, "img/sec/core": 189.3567021451748, "core_hours_Tesla V100-SXM2-32GB": 6.143729505173396, "core_hours": 6.143729505173396}
{"step": 4150, "global_schedule": 0.4148999750614166, "l2_grads": 0.987625002861023, "l2_params": 211.76806640625, "l2_updates": 0.44885918498039246, "training_loss": 6.4401092529296875, "uptime": 2459.4388520539505, "examples_seen": 4249600.0, "progress": 0.0372274101384142, "epoch": 3.350481529224862, "img/sec/core": 189.48397613301424, "core_hours_Tesla V100-SXM2-32GB": 6.218787156550937, "core_hours": 6.218787156550937}
{"step": 4200, "global_schedule": 0.41990000009536743, "l2_grads": 1.3104158639907837, "l2_params": 211.9163818359375, "l2_updates": 0.493966668844223, "training_loss": 5.682477951049805, "uptime": 2476.3197320459876, "examples_seen": 4300800.0, "progress": 0.03767593315213003, "epoch": 3.390848776564921, "img/sec/core": 189.56357734368584, "core_hours_Tesla V100-SXM2-32GB": 6.293813289848881, "core_hours": 6.293813289848881}
{"step": 4250, "global_schedule": 0.42489999532699585, "l2_grads": 1.1391830444335938, "l2_params": 212.0771026611328, "l2_updates": 0.47068706154823303, "training_loss": 6.0124382972717285, "uptime": 2493.2130194409983, "examples_seen": 4352000.0, "progress": 0.03812445616584587, "epoch": 3.4312160239049794, "img/sec/core": 189.4243509374673, "core_hours_Tesla V100-SXM2-32GB": 6.368894567160039, "core_hours": 6.368894567160039}
{"step": 4301, "global_schedule": 0.42989999055862427, "l2_grads": 1.246059536933899, "l2_params": 212.24301147460938, "l2_updates": 0.4913162291049957, "training_loss": 5.844810485839844, "uptime": 2510.106115494971, "examples_seen": 4403200.0, "progress": 0.038572979179561706, "epoch": 3.471583271245038, "img/sec/core": 189.42649646791293, "core_hours_Tesla V100-SXM2-32GB": 6.4439749940665845, "core_hours": 6.4439749940665845}
{"step": 4350, "global_schedule": 0.4348999857902527, "l2_grads": 1.2045936584472656, "l2_params": 212.38865661621094, "l2_updates": 0.484755277633667, "training_loss": 6.61359977722168, "uptime": 2526.983951278962, "examples_seen": 4454400.0, "progress": 0.03902150219327754, "epoch": 3.5119505185850963, "img/sec/core": 189.59776839606798, "core_hours_Tesla V100-SXM2-32GB": 6.51898759755099, "core_hours": 6.51898759755099}
{"step": 4400, "global_schedule": 0.4398999810218811, "l2_grads": 1.3228907585144043, "l2_params": 212.57330322265625, "l2_updates": 0.49538514018058777, "training_loss": 5.654891014099121, "uptime": 2543.8777181589976, "examples_seen": 4505600.0, "progress": 0.03947002520699337, "epoch": 3.552317765925155, "img/sec/core": 189.41897462677042, "core_hours_Tesla V100-SXM2-32GB": 6.594071005906702, "core_hours": 6.594071005906702}
{"step": 4450, "global_schedule": 0.4448999762535095, "l2_grads": 1.3313148021697998, "l2_params": 212.79188537597656, "l2_updates": 0.5030797719955444, "training_loss": 5.556790351867676, "uptime": 2560.767299376952, "examples_seen": 4556800.0, "progress": 0.039918548220709206, "epoch": 3.5926850132652137, "img/sec/core": 189.46591740227714, "core_hours_Tesla V100-SXM2-32GB": 6.669135811319833, "core_hours": 6.669135811319833}
{"step": 4500, "global_schedule": 0.4499000012874603, "l2_grads": 0.9859107136726379, "l2_params": 212.99220275878906, "l2_updates": 0.5017133951187134, "training_loss": 6.230005741119385, "uptime": 2577.658656554995, "examples_seen": 4608000.0, "progress": 0.04036707123442504, "epoch": 3.633052260605272, "img/sec/core": 189.4459969243706, "core_hours_Tesla V100-SXM2-32GB": 6.744208509888915, "core_hours": 6.744208509888915}
{"step": 4550, "global_schedule": 0.45489999651908875, "l2_grads": 1.0122766494750977, "l2_params": 213.14178466796875, "l2_updates": 0.4946054220199585, "training_loss": 6.590252876281738, "uptime": 2594.5477253209683, "examples_seen": 4659200.0, "progress": 0.04081559424814087, "epoch": 3.6734195079453307, "img/sec/core": 189.4716662204084, "core_hours_Tesla V100-SXM2-32GB": 6.819271037737684, "core_hours": 6.819271037737684}
{"step": 4600, "global_schedule": 0.45989999175071716, "l2_grads": 0.8860654234886169, "l2_params": 213.32675170898438, "l2_updates": 0.49675965309143066, "training_loss": 6.424964904785156, "uptime": 2611.4320239039953, "examples_seen": 4710400.0, "progress": 0.041264117261856706, "epoch": 3.713786755285389, "img/sec/core": 189.52519610242, "core_hours_Tesla V100-SXM2-32GB": 6.894312364773359, "core_hours": 6.894312364773359}
{"step": 4650, "global_schedule": 0.4648999869823456, "l2_grads": 1.2942429780960083, "l2_params": 213.48162841796875, "l2_updates": 0.5469762682914734, "training_loss": 5.511626243591309, "uptime": 2628.3331290219794, "examples_seen": 4761600.0, "progress": 0.04171264027557254, "epoch": 3.754154002625448, "img/sec/core": 189.3367313948569, "core_hours_Tesla V100-SXM2-32GB": 6.969428387519955, "core_hours": 6.969428387519955}
{"step": 4700, "global_schedule": 0.469899982213974, "l2_grads": 1.1928801536560059, "l2_params": 213.6596221923828, "l2_updates": 0.5101318359375, "training_loss": 5.5441083908081055, "uptime": 2645.2062277919613, "examples_seen": 4812800.0, "progress": 0.04216116328928837, "epoch": 3.7945212499655065, "img/sec/core": 189.65099675069564, "core_hours_Tesla V100-SXM2-32GB": 7.0444199376087635, "core_hours": 7.0444199376087635}
{"step": 4750, "global_schedule": 0.4748999774456024, "l2_grads": 1.1042042970657349, "l2_params": 213.8351287841797, "l2_updates": 0.5226755142211914, "training_loss": 6.388588905334473, "uptime": 2662.0868174839998, "examples_seen": 4864000.0, "progress": 0.042609686303004206, "epoch": 3.834888497305565, "img/sec/core": 189.56683731903271, "core_hours_Tesla V100-SXM2-32GB": 7.11944478068449, "core_hours": 7.11944478068449}
{"step": 4800, "global_schedule": 0.4799000024795532, "l2_grads": 1.0464507341384888, "l2_params": 214.04397583007812, "l2_updates": 0.6137215495109558, "training_loss": 5.5106611251831055, "uptime": 2678.980169329967, "examples_seen": 4915200.0, "progress": 0.04305820931672004, "epoch": 3.8752557446456235, "img/sec/core": 189.42362825195778, "core_hours_Tesla V100-SXM2-32GB": 7.194526344444344, "core_hours": 7.194526344444344}
{"step": 4850, "global_schedule": 0.48489999771118164, "l2_grads": 1.4433298110961914, "l2_params": 214.28736877441406, "l2_updates": 0.5191740393638611, "training_loss": 5.597702980041504, "uptime": 2695.8777162529877, "examples_seen": 4966400.0, "progress": 0.04350673233043587, "epoch": 3.9156229919856824, "img/sec/core": 189.37660091006398, "core_hours_Tesla V100-SXM2-32GB": 7.269626552991103, "core_hours": 7.269626552991103}
{"step": 4900, "global_schedule": 0.48989999294281006, "l2_grads": 1.1753857135772705, "l2_params": 214.52951049804688, "l2_updates": 0.542466938495636, "training_loss": 5.560588359832764, "uptime": 2712.7568362299935, "examples_seen": 5017600.0, "progress": 0.043955255344151706, "epoch": 3.955990239325741, "img/sec/core": 189.58334346573312, "core_hours_Tesla V100-SXM2-32GB": 7.344644864000018, "core_hours": 7.344644864000018}
{"step": 4950, "global_schedule": 0.4948999881744385, "l2_grads": 1.3481794595718384, "l2_params": 214.7752685546875, "l2_updates": 0.568818211555481, "training_loss": 5.475867748260498, "uptime": 2729.643119077955, "examples_seen": 5068800.0, "progress": 0.04440377835786754, "epoch": 3.9963574866657994, "img/sec/core": 189.50292546984778, "core_hours_Tesla V100-SXM2-32GB": 7.419695009990957, "core_hours": 7.419695009990957}
{"step": 5000, "global_schedule": 0.4998999834060669, "l2_grads": 1.1475614309310913, "l2_params": 215.02455139160156, "l2_updates": 0.5913711190223694, "training_loss": 5.4568562507629395, "uptime": 2746.539496628975, "examples_seen": 5120000.0, "progress": 0.04485230137158338, "epoch": 4.036724734005858, "img/sec/core": 189.3897073699563, "core_hours_Tesla V100-SXM2-32GB": 7.494790021328825, "core_hours": 7.494790021328825, "minival/prec@1": 0.12433655947549173, "minival/loss": 4.772855484146942, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.9527912540361285, "real/prec@1": 0.13342015927578624, "real/loss": 6.040110829012052, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.193446564022452, "train/prec@1": 0.12836123795027904, "train/loss": 4.761832173784467, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.611017799994443, "v2/prec@1": 0.0916, "v2/loss": 5.123782080078125, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3991005350253545, "val/prec@1": 0.11596, "val/loss": 4.835164228515625, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.246361953031737}
{"step": 5050, "global_schedule": 0.5048999786376953, "l2_grads": 1.2337517738342285, "l2_params": 215.32107543945312, "l2_updates": 0.5464857220649719, "training_loss": 5.66121768951416, "uptime": 2800.4242748909746, "examples_seen": 5171200.0, "progress": 0.04530082438529921, "epoch": 4.077091981345917, "img/sec/core": 189.3369509434413, "core_hours_Tesla V100-SXM2-32GB": 7.569905956973477, "core_hours": 7.569905956973477}
{"step": 5100, "global_schedule": 0.5098999738693237, "l2_grads": 1.653253197669983, "l2_params": 215.53150939941406, "l2_updates": 0.5188894867897034, "training_loss": 5.478298187255859, "uptime": 2817.298124076973, "examples_seen": 5222400.0, "progress": 0.045749347399015046, "epoch": 4.117459228685975, "img/sec/core": 189.64256256689023, "core_hours_Tesla V100-SXM2-32GB": 7.644900842244581, "core_hours": 7.644900842244581}
{"step": 5150, "global_schedule": 0.5148999691009521, "l2_grads": 1.1200833320617676, "l2_params": 215.87246704101562, "l2_updates": 0.6066314578056335, "training_loss": 5.469752311706543, "uptime": 2834.1725046520005, "examples_seen": 5273600.0, "progress": 0.04619787041273088, "epoch": 4.157826476026034, "img/sec/core": 189.63659055644, "core_hours_Tesla V100-SXM2-32GB": 7.719898089244704, "core_hours": 7.719898089244704}
{"step": 5200, "global_schedule": 0.5198999643325806, "l2_grads": 1.1364288330078125, "l2_params": 216.17308044433594, "l2_updates": 0.5622920989990234, "training_loss": 5.528487205505371, "uptime": 2851.0421534209745, "examples_seen": 5324800.0, "progress": 0.04664639342644671, "epoch": 4.198193723366092, "img/sec/core": 189.68978215393048, "core_hours_Tesla V100-SXM2-32GB": 7.794874305995699, "core_hours": 7.794874305995699}
{"step": 5250, "global_schedule": 0.524899959564209, "l2_grads": 1.153244972229004, "l2_params": 216.41964721679688, "l2_updates": 0.6171825528144836, "training_loss": 5.390334129333496, "uptime": 2867.922684628982, "examples_seen": 5376000.0, "progress": 0.047094916440162546, "epoch": 4.238560970706151, "img/sec/core": 189.5674940894052, "core_hours_Tesla V100-SXM2-32GB": 7.8698988891424, "core_hours": 7.8698988891424}
{"step": 5300, "global_schedule": 0.5299000144004822, "l2_grads": 1.1533887386322021, "l2_params": 216.7255401611328, "l2_updates": 0.6175206303596497, "training_loss": 5.495122909545898, "uptime": 2884.7983405039995, "examples_seen": 5427200.0, "progress": 0.04754343945387838, "epoch": 4.278928218046209, "img/sec/core": 189.6222596442759, "core_hours_Tesla V100-SXM2-32GB": 7.944901804142476, "core_hours": 7.944901804142476}
{"step": 5350, "global_schedule": 0.5349000096321106, "l2_grads": 0.8924332857131958, "l2_params": 217.01702880859375, "l2_updates": 0.57454514503479, "training_loss": 6.3219313621521, "uptime": 2901.6784388399683, "examples_seen": 5478400.0, "progress": 0.04799196246759421, "epoch": 4.319295465386268, "img/sec/core": 189.57235534471448, "core_hours_Tesla V100-SXM2-32GB": 8.01992446341345, "core_hours": 8.01992446341345}
{"step": 5400, "global_schedule": 0.539900004863739, "l2_grads": 0.9639424681663513, "l2_params": 217.24937438964844, "l2_updates": 0.5475191473960876, "training_loss": 6.242027759552002, "uptime": 2918.5371240079985, "examples_seen": 5529600.0, "progress": 0.048440485481310046, "epoch": 4.359662712726327, "img/sec/core": 189.81314189722738, "core_hours_Tesla V100-SXM2-32GB": 8.094851953049139, "core_hours": 8.094851953049139}
{"step": 5450, "global_schedule": 0.5449000000953674, "l2_grads": 1.7482584714889526, "l2_params": 217.54782104492188, "l2_updates": 0.580420196056366, "training_loss": 5.250315189361572, "uptime": 2935.4269086809945, "examples_seen": 5580800.0, "progress": 0.04888900849502588, "epoch": 4.4000299600663855, "img/sec/core": 189.46363508803464, "core_hours_Tesla V100-SXM2-32GB": 8.169917662706899, "core_hours": 8.169917662706899}
{"step": 5500, "global_schedule": 0.5498999953269958, "l2_grads": 1.5073314905166626, "l2_params": 217.88136291503906, "l2_updates": 0.5943872928619385, "training_loss": 6.552088260650635, "uptime": 2952.278867257992, "examples_seen": 5632000.0, "progress": 0.04933753150874171, "epoch": 4.440397207406444, "img/sec/core": 189.88890729698102, "core_hours_Tesla V100-SXM2-32GB": 8.244815256382442, "core_hours": 8.244815256382442}
{"step": 5550, "global_schedule": 0.5548999905586243, "l2_grads": 1.2427135705947876, "l2_params": 218.21815490722656, "l2_updates": 0.5661004781723022, "training_loss": 5.369213104248047, "uptime": 2969.1709928439814, "examples_seen": 5683200.0, "progress": 0.049786054522457546, "epoch": 4.480764454746502, "img/sec/core": 189.4373791924742, "core_hours_Tesla V100-SXM2-32GB": 8.319891370097952, "core_hours": 8.319891370097952}
{"step": 5600, "global_schedule": 0.5598999857902527, "l2_grads": 1.0718646049499512, "l2_params": 218.54539489746094, "l2_updates": 0.6315741539001465, "training_loss": 5.263959884643555, "uptime": 2986.050178491976, "examples_seen": 5734400.0, "progress": 0.05023457753617338, "epoch": 4.521131702086561, "img/sec/core": 189.58260586346245, "core_hours_Tesla V100-SXM2-32GB": 8.394909972977928, "core_hours": 8.394909972977928}
{"step": 5650, "global_schedule": 0.5648999810218811, "l2_grads": 0.8978228569030762, "l2_params": 218.84335327148438, "l2_updates": 0.6125076413154602, "training_loss": 6.435113906860352, "uptime": 3002.9257229499635, "examples_seen": 5785600.0, "progress": 0.05068310054988921, "epoch": 4.561498949426619, "img/sec/core": 189.62351158308246, "core_hours_Tesla V100-SXM2-32GB": 8.469912392791205, "core_hours": 8.469912392791205}
{"step": 5700, "global_schedule": 0.5698999762535095, "l2_grads": 1.1172205209732056, "l2_params": 219.20457458496094, "l2_updates": 0.6671862006187439, "training_loss": 5.276125907897949, "uptime": 3019.798049439967, "examples_seen": 5836800.0, "progress": 0.051131623563605046, "epoch": 4.601866196766678, "img/sec/core": 189.6596774544347, "core_hours_Tesla V100-SXM2-32GB": 8.544900510524554, "core_hours": 8.544900510524554}
{"step": 5750, "global_schedule": 0.5748999714851379, "l2_grads": 1.3672508001327515, "l2_params": 219.5732879638672, "l2_updates": 0.6277287006378174, "training_loss": 5.309223651885986, "uptime": 3036.6790116879856, "examples_seen": 5888000.0, "progress": 0.05158014657732088, "epoch": 4.642233444106736, "img/sec/core": 189.5626536559326, "core_hours_Tesla V100-SXM2-32GB": 8.619927009404638, "core_hours": 8.619927009404638}
{"step": 5800, "global_schedule": 0.5798999667167664, "l2_grads": 1.021497368812561, "l2_params": 219.92430114746094, "l2_updates": 0.6300625205039978, "training_loss": 6.0338826179504395, "uptime": 3053.567015239969, "examples_seen": 5939200.0, "progress": 0.05202866959103672, "epoch": 4.682600691446796, "img/sec/core": 189.48361718127433, "core_hours_Tesla V100-SXM2-32GB": 8.694984802969007, "core_hours": 8.694984802969007}
{"step": 5850, "global_schedule": 0.5848999619483948, "l2_grads": 1.1329532861709595, "l2_params": 220.30003356933594, "l2_updates": 0.651028573513031, "training_loss": 5.261085510253906, "uptime": 3070.4422520269873, "examples_seen": 5990400.0, "progress": 0.05247719260475255, "epoch": 4.722967938786854, "img/sec/core": 189.62696881750827, "core_hours_Tesla V100-SXM2-32GB": 8.769985855355754, "core_hours": 8.769985855355754}
{"step": 5900, "global_schedule": 0.5898999571800232, "l2_grads": 1.0332461595535278, "l2_params": 220.60183715820312, "l2_updates": 0.6827479600906372, "training_loss": 5.564532279968262, "uptime": 3087.32564163598, "examples_seen": 6041600.0, "progress": 0.052925715618468386, "epoch": 4.763335186126913, "img/sec/core": 189.53539982845385, "core_hours_Tesla V100-SXM2-32GB": 8.845023142506834, "core_hours": 8.845023142506834}
{"step": 5950, "global_schedule": 0.5949000120162964, "l2_grads": 1.2299835681915283, "l2_params": 220.9651641845703, "l2_updates": 0.6664475798606873, "training_loss": 5.206035137176514, "uptime": 3104.204896630952, "examples_seen": 6092800.0, "progress": 0.05337423863218422, "epoch": 4.803702433466971, "img/sec/core": 189.58182697951955, "core_hours_Tesla V100-SXM2-32GB": 8.9200420535956, "core_hours": 8.9200420535956}
{"step": 6000, "global_schedule": 0.5999000072479248, "l2_grads": 0.9133805632591248, "l2_params": 221.33517456054688, "l2_updates": 0.6595739126205444, "training_loss": 6.540201187133789, "uptime": 3121.099925074959, "examples_seen": 6144000.0, "progress": 0.05382276164590005, "epoch": 4.84406968080703, "img/sec/core": 189.40483057518, "core_hours_Tesla V100-SXM2-32GB": 8.995131068902298, "core_hours": 8.995131068902298}
{"step": 6050, "global_schedule": 0.6049000024795532, "l2_grads": 1.2125027179718018, "l2_params": 221.69467163085938, "l2_updates": 0.6502617001533508, "training_loss": 5.2891316413879395, "uptime": 3138.4847265119897, "examples_seen": 6195200.0, "progress": 0.054271284659615886, "epoch": 4.884436928147088, "img/sec/core": 189.7217687961696, "core_hours_Tesla V100-SXM2-32GB": 9.070094644840186, "core_hours": 9.070094644840186}
{"step": 6100, "global_schedule": 0.6098999977111816, "l2_grads": 1.0733922719955444, "l2_params": 222.0376434326172, "l2_updates": 0.7055180072784424, "training_loss": 5.4002203941345215, "uptime": 3155.3561269879574, "examples_seen": 6246400.0, "progress": 0.05471980767333172, "epoch": 4.9248041754871466, "img/sec/core": 189.67008723183432, "core_hours_Tesla V100-SXM2-32GB": 9.145078646955598, "core_hours": 9.145078646955598}
{"step": 6150, "global_schedule": 0.6148999929428101, "l2_grads": 1.1212519407272339, "l2_params": 222.42388916015625, "l2_updates": 0.7456761002540588, "training_loss": 5.152811050415039, "uptime": 3172.2389699589694, "examples_seen": 6297600.0, "progress": 0.05516833068704755, "epoch": 4.965171422827205, "img/sec/core": 189.54153666502916, "core_hours_Tesla V100-SXM2-32GB": 9.22011350460454, "core_hours": 9.22011350460454}
{"step": 6200, "global_schedule": 0.6198999881744385, "l2_grads": 1.6294385194778442, "l2_params": 222.83285522460938, "l2_updates": 0.6763316988945007, "training_loss": 5.150721073150635, "uptime": 3189.136284159962, "examples_seen": 6348800.0, "progress": 0.055616853700763386, "epoch": 5.0055386701672635, "img/sec/core": 189.37920914153352, "core_hours_Tesla V100-SXM2-32GB": 9.295212678831174, "core_hours": 9.295212678831174}
{"step": 6250, "global_schedule": 0.6248999834060669, "l2_grads": 1.0941160917282104, "l2_params": 223.21949768066406, "l2_updates": 0.6852265000343323, "training_loss": 5.038415908813477, "uptime": 3205.9857118839864, "examples_seen": 6400000.0, "progress": 0.05606537671447922, "epoch": 5.045905917507323, "img/sec/core": 189.9174293876682, "core_hours_Tesla V100-SXM2-32GB": 9.370099024271282, "core_hours": 9.370099024271282}
{"step": 6300, "global_schedule": 0.6298999786376953, "l2_grads": 1.0390552282333374, "l2_params": 223.61180114746094, "l2_updates": 0.7105417251586914, "training_loss": 5.588413715362549, "uptime": 3222.8840341459727, "examples_seen": 6451200.0, "progress": 0.05651389972819505, "epoch": 5.086273164847381, "img/sec/core": 189.3679118191852, "core_hours_Tesla V100-SXM2-32GB": 9.445202678768998, "core_hours": 9.445202678768998}
{"step": 6350, "global_schedule": 0.6348999738693237, "l2_grads": 1.9650416374206543, "l2_params": 224.05210876464844, "l2_updates": 0.6356248259544373, "training_loss": 5.207459926605225, "uptime": 3239.7867591619724, "examples_seen": 6502400.0, "progress": 0.056962422741910886, "epoch": 5.12664041218744, "img/sec/core": 189.31858602509064, "core_hours_Tesla V100-SXM2-32GB": 9.520325901062332, "core_hours": 9.520325901062332}
{"step": 6400, "global_schedule": 0.6398999691009521, "l2_grads": 1.092612385749817, "l2_params": 224.4020538330078, "l2_updates": 0.6800515055656433, "training_loss": 5.116988182067871, "uptime": 3256.681448636984, "examples_seen": 6553600.0, "progress": 0.05741094575562672, "epoch": 5.167007659527498, "img/sec/core": 189.40863072582832, "core_hours_Tesla V100-SXM2-32GB": 9.595413409840159, "core_hours": 9.595413409840159}
{"step": 6450, "global_schedule": 0.6448999643325806, "l2_grads": 1.9003959894180298, "l2_params": 224.77047729492188, "l2_updates": 0.6700160503387451, "training_loss": 5.129581451416016, "uptime": 3273.5717534349533, "examples_seen": 6604800.0, "progress": 0.05785946876934255, "epoch": 5.207374906867557, "img/sec/core": 189.45780068958456, "core_hours_Tesla V100-SXM2-32GB": 9.670481431164468, "core_hours": 9.670481431164468}
{"step": 6500, "global_schedule": 0.649899959564209, "l2_grads": 1.5935492515563965, "l2_params": 225.24215698242188, "l2_updates": 0.6939482092857361, "training_loss": 5.123081207275391, "uptime": 3290.4554883749806, "examples_seen": 6656000.0, "progress": 0.058307991783058385, "epoch": 5.247742154207615, "img/sec/core": 189.5315231710701, "core_hours_Tesla V100-SXM2-32GB": 9.745520253120144, "core_hours": 9.745520253120144}
{"step": 6550, "global_schedule": 0.6548999547958374, "l2_grads": 1.2292979955673218, "l2_params": 225.66217041015625, "l2_updates": 0.7370054125785828, "training_loss": 5.087565898895264, "uptime": 3307.3567738769925, "examples_seen": 6707200.0, "progress": 0.058756514796774226, "epoch": 5.288109401547674, "img/sec/core": 189.33471064192602, "core_hours_Tesla V100-SXM2-32GB": 9.820637077573531, "core_hours": 9.820637077573531}
{"step": 6600, "global_schedule": 0.6599000096321106, "l2_grads": 1.0911400318145752, "l2_params": 226.0711669921875, "l2_updates": 0.7437885403633118, "training_loss": 5.359241485595703, "uptime": 3324.2516524149687, "examples_seen": 6758400.0, "progress": 0.05920503781049006, "epoch": 5.328476648887732, "img/sec/core": 189.40651113928186, "core_hours_Tesla V100-SXM2-32GB": 9.895725426631204, "core_hours": 9.895725426631204}
{"step": 6650, "global_schedule": 0.664900004863739, "l2_grads": 1.126299500465393, "l2_params": 226.48976135253906, "l2_updates": 0.6869666576385498, "training_loss": 5.706397533416748, "uptime": 3341.127862322959, "examples_seen": 6809600.0, "progress": 0.05965356082420589, "epoch": 5.368843896227791, "img/sec/core": 189.6160344915412, "core_hours_Tesla V100-SXM2-32GB": 9.97073080400005, "core_hours": 9.97073080400005}
{"step": 6700, "global_schedule": 0.6699000000953674, "l2_grads": 1.4421945810317993, "l2_params": 226.96788024902344, "l2_updates": 0.7315662503242493, "training_loss": 5.033751010894775, "uptime": 3358.008210001979, "examples_seen": 6860800.0, "progress": 0.060102083837921726, "epoch": 5.40921114356785, "img/sec/core": 189.5695551328713, "core_hours_Tesla V100-SXM2-32GB": 10.04575457146236, "core_hours": 10.04575457146236}
{"step": 6750, "global_schedule": 0.6748999953269958, "l2_grads": 1.5105304718017578, "l2_params": 227.4319610595703, "l2_updates": 0.7106032967567444, "training_loss": 4.9139790534973145, "uptime": 3374.893465864996, "examples_seen": 6912000.0, "progress": 0.06055060685163756, "epoch": 5.4495783909079085, "img/sec/core": 189.51445130356745, "core_hours_Tesla V100-SXM2-32GB": 10.12080015307577, "core_hours": 10.12080015307577}
{"step": 6800, "global_schedule": 0.6798999905586243, "l2_grads": 1.3777669668197632, "l2_params": 227.89027404785156, "l2_updates": 0.6842074990272522, "training_loss": 5.208654880523682, "uptime": 3391.773211891006, "examples_seen": 6963200.0, "progress": 0.06099912986535339, "epoch": 5.489945638247967, "img/sec/core": 189.57631205286336, "core_hours_Tesla V100-SXM2-32GB": 10.195821246524703, "core_hours": 10.195821246524703}
{"step": 6850, "global_schedule": 0.6848999857902527, "l2_grads": 1.3488177061080933, "l2_params": 228.30738830566406, "l2_updates": 0.7408307790756226, "training_loss": 5.034512519836426, "uptime": 3408.6354310089955, "examples_seen": 7014400.0, "progress": 0.061447652879069226, "epoch": 5.5303128855880255, "img/sec/core": 189.77336124081737, "core_hours_Tesla V100-SXM2-32GB": 10.270764442604655, "core_hours": 10.270764442604655}
{"step": 6900, "global_schedule": 0.6898999810218811, "l2_grads": 1.0675361156463623, "l2_params": 228.7380828857422, "l2_updates": 0.7882079482078552, "training_loss": 5.88060188293457, "uptime": 3425.510494472983, "examples_seen": 7065600.0, "progress": 0.06189617589278506, "epoch": 5.570680132928084, "img/sec/core": 189.62891646772448, "core_hours_Tesla V100-SXM2-32GB": 10.345764724666822, "core_hours": 10.345764724666822}
{"step": 6950, "global_schedule": 0.6948999762535095, "l2_grads": 1.0313470363616943, "l2_params": 229.20001220703125, "l2_updates": 0.7808309197425842, "training_loss": 5.855043411254883, "uptime": 3442.388569995004, "examples_seen": 7116800.0, "progress": 0.06234469890650089, "epoch": 5.611047380268142, "img/sec/core": 189.59507532863287, "core_hours_Tesla V100-SXM2-32GB": 10.420778393653585, "core_hours": 10.420778393653585}
{"step": 7000, "global_schedule": 0.6998999714851379, "l2_grads": 1.480669379234314, "l2_params": 229.62738037109375, "l2_updates": 0.7289791703224182, "training_loss": 4.914257049560547, "uptime": 3459.2760330429883, "examples_seen": 7168000.0, "progress": 0.06279322192021673, "epoch": 5.651414627608201, "img/sec/core": 189.48968183720174, "core_hours_Tesla V100-SXM2-32GB": 10.495833784977956, "core_hours": 10.495833784977956}
{"step": 7050, "global_schedule": 0.7048999667167664, "l2_grads": 1.2882314920425415, "l2_params": 230.11940002441406, "l2_updates": 0.7556297779083252, "training_loss": 4.994602680206299, "uptime": 3477.0040722849662, "examples_seen": 7219200.0, "progress": 0.06324174493393256, "epoch": 5.691781874948259, "img/sec/core": 189.63054359873928, "core_hours_Tesla V100-SXM2-32GB": 10.570833423497778, "core_hours": 10.570833423497778}
{"step": 7100, "global_schedule": 0.7098999619483948, "l2_grads": 1.1455802917480469, "l2_params": 230.5598602294922, "l2_updates": 0.7940431833267212, "training_loss": 4.964804649353027, "uptime": 3493.8634672469925, "examples_seen": 7270400.0, "progress": 0.0636902679476484, "epoch": 5.732149122288319, "img/sec/core": 189.80515061232086, "core_hours_Tesla V100-SXM2-32GB": 10.645764067773449, "core_hours": 10.645764067773449}
{"step": 7150, "global_schedule": 0.7148999571800232, "l2_grads": 1.0616769790649414, "l2_params": 231.1007537841797, "l2_updates": 0.7675542235374451, "training_loss": 6.120277404785156, "uptime": 3510.7410122089786, "examples_seen": 7321600.0, "progress": 0.06413879096136423, "epoch": 5.772516369628377, "img/sec/core": 189.60103541169457, "core_hours_Tesla V100-SXM2-32GB": 10.72077537871561, "core_hours": 10.72077537871561}
{"step": 7200, "global_schedule": 0.7198999524116516, "l2_grads": 1.3926105499267578, "l2_params": 231.61192321777344, "l2_updates": 0.7378065586090088, "training_loss": 4.875516891479492, "uptime": 3527.631029986951, "examples_seen": 7372800.0, "progress": 0.06458731397508007, "epoch": 5.812883616968436, "img/sec/core": 189.46102023488535, "core_hours_Tesla V100-SXM2-32GB": 10.795842124395486, "core_hours": 10.795842124395486}
{"step": 7250, "global_schedule": 0.7249000072479248, "l2_grads": 1.070106029510498, "l2_params": 232.03366088867188, "l2_updates": 0.785541832447052, "training_loss": 5.259341716766357, "uptime": 3544.502201177005, "examples_seen": 7424000.0, "progress": 0.06503583698879589, "epoch": 5.853250864308494, "img/sec/core": 189.67266492360974, "core_hours_Tesla V100-SXM2-32GB": 10.870825107462394, "core_hours": 10.870825107462394}
{"step": 7300, "global_schedule": 0.7299000024795532, "l2_grads": 0.8734434247016907, "l2_params": 232.46141052246094, "l2_updates": 0.8053590655326843, "training_loss": 6.331187725067139, "uptime": 3561.3762761749676, "examples_seen": 7475200.0, "progress": 0.06548436000251173, "epoch": 5.893618111648553, "img/sec/core": 189.6400247353648, "core_hours_Tesla V100-SXM2-32GB": 10.945820996342228, "core_hours": 10.945820996342228}
{"step": 7350, "global_schedule": 0.7348999977111816, "l2_grads": 0.9698489308357239, "l2_params": 232.89248657226562, "l2_updates": 0.7727465629577637, "training_loss": 6.343906402587891, "uptime": 3578.2498381899786, "examples_seen": 7526400.0, "progress": 0.06593288301622756, "epoch": 5.933985358988611, "img/sec/core": 189.64579009181534, "core_hours_Tesla V100-SXM2-32GB": 11.020814605297831, "core_hours": 11.020814605297831}
{"step": 7400, "global_schedule": 0.7398999929428101, "l2_grads": 0.9442388415336609, "l2_params": 233.3817138671875, "l2_updates": 0.7773462533950806, "training_loss": 5.7814106941223145, "uptime": 3595.129945753957, "examples_seen": 7577600.0, "progress": 0.0663814060299434, "epoch": 5.97435260632867, "img/sec/core": 189.57225170938318, "core_hours_Tesla V100-SXM2-32GB": 11.095837305582181, "core_hours": 11.095837305582181}
{"step": 7450, "global_schedule": 0.7448999881744385, "l2_grads": 1.4986647367477417, "l2_params": 233.92352294921875, "l2_updates": 0.7649744153022766, "training_loss": 4.828360557556152, "uptime": 3611.9855908859754, "examples_seen": 7628800.0, "progress": 0.06682992904365923, "epoch": 6.014719853668728, "img/sec/core": 189.8473760533448, "core_hours_Tesla V100-SXM2-32GB": 11.170751283946707, "core_hours": 11.170751283946707}
{"step": 7500, "global_schedule": 0.7498999834060669, "l2_grads": 1.1827143430709839, "l2_params": 234.4937286376953, "l2_updates": 0.8568640947341919, "training_loss": 4.857760906219482, "uptime": 3628.896192290995, "examples_seen": 7680000.0, "progress": 0.06727845205737507, "epoch": 6.0550871010087866, "img/sec/core": 189.23040779910855, "core_hours_Tesla V100-SXM2-32GB": 11.245909512413458, "core_hours": 11.245909512413458, "minival/prec@1": 0.22463315641586012, "minival/loss": 3.9333027325456604, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.915524943964556, "real/prec@1": 0.24060038004142023, "real/loss": 5.085751265692721, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.218566427996848, "train/prec@1": 0.22885688639113297, "train/loss": 3.903361295000273, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.648265764990356, "v2/prec@1": 0.1588, "v2/loss": 4.431121215820313, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3869657600298524, "val/prec@1": 0.20956, "val/loss": 4.019377846679688, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.338950524048414}
{"step": 7550, "global_schedule": 0.7548999786376953, "l2_grads": 1.3205561637878418, "l2_params": 235.03411865234375, "l2_updates": 0.758647084236145, "training_loss": 4.7297844886779785, "uptime": 3682.336809615954, "examples_seen": 7731200.0, "progress": 0.06772697507109089, "epoch": 6.095454348348846, "img/sec/core": 189.00900378736918, "core_hours_Tesla V100-SXM2-32GB": 11.321155780777593, "core_hours": 11.321155780777593}
{"step": 7600, "global_schedule": 0.7598999738693237, "l2_grads": 1.7899597883224487, "l2_params": 235.55963134765625, "l2_updates": 0.7852051258087158, "training_loss": 4.815295219421387, "uptime": 3699.223976402951, "examples_seen": 7782400.0, "progress": 0.06817549808480673, "epoch": 6.135821595688904, "img/sec/core": 189.49300616039133, "core_hours_Tesla V100-SXM2-32GB": 11.39620985538647, "core_hours": 11.39620985538647}
{"step": 7650, "global_schedule": 0.7648999691009521, "l2_grads": 1.268568515777588, "l2_params": 236.12234497070312, "l2_updates": 0.8183668851852417, "training_loss": 4.843252182006836, "uptime": 3716.10629921098, "examples_seen": 7833600.0, "progress": 0.06862402109852256, "epoch": 6.176188843028963, "img/sec/core": 189.54737664879264, "core_hours_Tesla V100-SXM2-32GB": 11.471242401199932, "core_hours": 11.471242401199932}
{"step": 7700, "global_schedule": 0.7698999643325806, "l2_grads": 1.026214838027954, "l2_params": 236.5779266357422, "l2_updates": 0.8291800618171692, "training_loss": 5.407321929931641, "uptime": 3732.9874556809664, "examples_seen": 7884800.0, "progress": 0.0690725441122384, "epoch": 6.216556090369021, "img/sec/core": 189.560472689736, "core_hours_Tesla V100-SXM2-32GB": 11.54626976328876, "core_hours": 11.54626976328876}
{"step": 7750, "global_schedule": 0.774899959564209, "l2_grads": 1.0266205072402954, "l2_params": 237.00335693359375, "l2_updates": 0.8175699710845947, "training_loss": 6.344047546386719, "uptime": 3749.86587347195, "examples_seen": 7936000.0, "progress": 0.06952106712595424, "epoch": 6.25692333770908, "img/sec/core": 189.5912306252658, "core_hours_Tesla V100-SXM2-32GB": 11.62128495347091, "core_hours": 11.62128495347091}
{"step": 7800, "global_schedule": 0.7798999547958374, "l2_grads": 1.406908392906189, "l2_params": 237.536376953125, "l2_updates": 0.7511354684829712, "training_loss": 4.849312782287598, "uptime": 3766.7556259789853, "examples_seen": 7987200.0, "progress": 0.06996959013967007, "epoch": 6.297290585049138, "img/sec/core": 189.46399591510246, "core_hours_Tesla V100-SXM2-32GB": 11.696350520168844, "core_hours": 11.696350520168844}
{"step": 7850, "global_schedule": 0.7849000096321106, "l2_grads": 1.1144192218780518, "l2_params": 238.0439453125, "l2_updates": 0.8904518485069275, "training_loss": 4.896664619445801, "uptime": 3783.6164733759942, "examples_seen": 8038400.0, "progress": 0.0704181131533859, "epoch": 6.337657832389197, "img/sec/core": 189.78880032848616, "core_hours_Tesla V100-SXM2-32GB": 11.771287619711106, "core_hours": 11.771287619711106}
{"step": 7900, "global_schedule": 0.789900004863739, "l2_grads": 1.1321829557418823, "l2_params": 238.63401794433594, "l2_updates": 0.8327786922454834, "training_loss": 4.760506629943848, "uptime": 3800.5009810589836, "examples_seen": 8089600.0, "progress": 0.07086663616710173, "epoch": 6.378025079729255, "img/sec/core": 189.52284899748108, "core_hours_Tesla V100-SXM2-32GB": 11.846329876079949, "core_hours": 11.846329876079949}
{"step": 7950, "global_schedule": 0.7949000000953674, "l2_grads": 0.7423640489578247, "l2_params": 239.26329040527344, "l2_updates": 0.7215197682380676, "training_loss": 6.232558727264404, "uptime": 3817.379772609973, "examples_seen": 8140800.0, "progress": 0.07131515918081757, "epoch": 6.418392327069315, "img/sec/core": 189.58703236147545, "core_hours_Tesla V100-SXM2-32GB": 11.921346727417678, "core_hours": 11.921346727417678}
{"step": 8000, "global_schedule": 0.7998999953269958, "l2_grads": 1.0669212341308594, "l2_params": 239.86180114746094, "l2_updates": 0.8505417704582214, "training_loss": 5.23112678527832, "uptime": 3834.26929846697, "examples_seen": 8192000.0, "progress": 0.0717636821945334, "epoch": 6.458759574409373, "img/sec/core": 189.4665384389246, "core_hours_Tesla V100-SXM2-32GB": 11.996411286782111, "core_hours": 11.996411286782111}
{"step": 8050, "global_schedule": 0.8048999905586243, "l2_grads": 1.3969721794128418, "l2_params": 240.42340087890625, "l2_updates": 0.7301192283630371, "training_loss": 4.893584251403809, "uptime": 3851.6276521919644, "examples_seen": 8243200.0, "progress": 0.07221220520824924, "epoch": 6.499126821749432, "img/sec/core": 189.69351260446845, "core_hours_Tesla V100-SXM2-32GB": 12.071386029075367, "core_hours": 12.071386029075367}
{"step": 8100, "global_schedule": 0.8098999857902527, "l2_grads": 1.1301240921020508, "l2_params": 240.97230529785156, "l2_updates": 0.8963261246681213, "training_loss": 4.757059097290039, "uptime": 3868.5173162400024, "examples_seen": 8294400.0, "progress": 0.07266072822196507, "epoch": 6.53949406908949, "img/sec/core": 189.46498822584564, "core_hours_Tesla V100-SXM2-32GB": 12.1464512026222, "core_hours": 12.1464512026222}
{"step": 8150, "global_schedule": 0.8148999810218811, "l2_grads": 1.08784818649292, "l2_params": 241.63150024414062, "l2_updates": 0.9061465859413147, "training_loss": 5.342029571533203, "uptime": 3885.3899353499874, "examples_seen": 8345600.0, "progress": 0.0731092512356809, "epoch": 6.5798613164295485, "img/sec/core": 189.65638820746506, "core_hours_Tesla V100-SXM2-32GB": 12.221440620888801, "core_hours": 12.221440620888801}
{"step": 8200, "global_schedule": 0.8198999762535095, "l2_grads": 1.135797381401062, "l2_params": 242.23138427734375, "l2_updates": 0.836259126663208, "training_loss": 4.794388771057129, "uptime": 3902.2806297619827, "examples_seen": 8396800.0, "progress": 0.07355777424939673, "epoch": 6.620228563769607, "img/sec/core": 189.45343050712225, "core_hours_Tesla V100-SXM2-32GB": 12.296510373831003, "core_hours": 12.296510373831003}
{"step": 8250, "global_schedule": 0.8248999714851379, "l2_grads": 1.096826434135437, "l2_params": 242.7584228515625, "l2_updates": 0.891226589679718, "training_loss": 4.903538703918457, "uptime": 3919.151177560969, "examples_seen": 8448000.0, "progress": 0.07400629726311257, "epoch": 6.6605958111096655, "img/sec/core": 189.67967360208183, "core_hours_Tesla V100-SXM2-32GB": 12.37149058627094, "core_hours": 12.37149058627094}
{"step": 8300, "global_schedule": 0.8298999667167664, "l2_grads": 1.1721241474151611, "l2_params": 243.41143798828125, "l2_updates": 0.9196012020111084, "training_loss": 4.6661882400512695, "uptime": 3936.0133208530024, "examples_seen": 8499200.0, "progress": 0.0744548202768284, "epoch": 6.700963058449724, "img/sec/core": 189.77421461670423, "core_hours_Tesla V100-SXM2-32GB": 12.446433445346646, "core_hours": 12.446433445346646}
{"step": 8350, "global_schedule": 0.8348999619483948, "l2_grads": 0.9508176445960999, "l2_params": 243.99880981445312, "l2_updates": 0.8746692538261414, "training_loss": 6.06010627746582, "uptime": 3952.8985534219537, "examples_seen": 8550400.0, "progress": 0.07490334329054424, "epoch": 6.741330305789782, "img/sec/core": 189.51471274871162, "core_hours_Tesla V100-SXM2-32GB": 12.521478923430873, "core_hours": 12.521478923430873}
{"step": 8400, "global_schedule": 0.8398999571800232, "l2_grads": 1.2048588991165161, "l2_params": 244.52293395996094, "l2_updates": 0.9540868401527405, "training_loss": 4.760628700256348, "uptime": 3969.791208817973, "examples_seen": 8601600.0, "progress": 0.07535186630426007, "epoch": 6.781697553129842, "img/sec/core": 189.43143780427238, "core_hours_Tesla V100-SXM2-32GB": 12.596557391857624, "core_hours": 12.596557391857624}
{"step": 8450, "global_schedule": 0.8448999524116516, "l2_grads": 0.8821199536323547, "l2_params": 245.21163940429688, "l2_updates": 0.8105381727218628, "training_loss": 6.163093566894531, "uptime": 3986.6617043139995, "examples_seen": 8652800.0, "progress": 0.0758003893179759, "epoch": 6.8220648004699, "img/sec/core": 189.6802616588028, "core_hours_Tesla V100-SXM2-32GB": 12.671537371839966, "core_hours": 12.671537371839966}
{"step": 8500, "global_schedule": 0.8499000072479248, "l2_grads": 1.1238226890563965, "l2_params": 245.8842315673828, "l2_updates": 0.8475059270858765, "training_loss": 4.71041202545166, "uptime": 4003.5351356829633, "examples_seen": 8704000.0, "progress": 0.07624891233169175, "epoch": 6.862432047809959, "img/sec/core": 189.64725846373676, "core_hours_Tesla V100-SXM2-32GB": 12.74653040014647, "core_hours": 12.74653040014647}
{"step": 8550, "global_schedule": 0.8549000024795532, "l2_grads": 1.1473745107650757, "l2_params": 246.416015625, "l2_updates": 0.9233143925666809, "training_loss": 4.57228422164917, "uptime": 4020.4118862680043, "examples_seen": 8755200.0, "progress": 0.07669743534540757, "epoch": 6.902799295150017, "img/sec/core": 189.6099598009331, "core_hours_Tesla V100-SXM2-32GB": 12.821538180524433, "core_hours": 12.821538180524433}
{"step": 8600, "global_schedule": 0.8598999977111816, "l2_grads": 0.931867778301239, "l2_params": 246.98471069335938, "l2_updates": 0.7996900081634521, "training_loss": 6.196318626403809, "uptime": 4037.2810248889728, "examples_seen": 8806400.0, "progress": 0.07714595835912341, "epoch": 6.943166542490076, "img/sec/core": 189.69551865691474, "core_hours_Tesla V100-SXM2-32GB": 12.896512129950958, "core_hours": 12.896512129950958}
{"step": 8650, "global_schedule": 0.8648999929428101, "l2_grads": 0.9475762248039246, "l2_params": 247.5143280029297, "l2_updates": 0.9496294856071472, "training_loss": 5.463679313659668, "uptime": 4054.1663136069546, "examples_seen": 8857600.0, "progress": 0.07759448137283924, "epoch": 6.983533789830134, "img/sec/core": 189.51408255117238, "core_hours_Tesla V100-SXM2-32GB": 12.971557857586435, "core_hours": 12.971557857586435}
{"step": 8700, "global_schedule": 0.8698999881744385, "l2_grads": 1.3883997201919556, "l2_params": 248.24143981933594, "l2_updates": 1.0042617321014404, "training_loss": 4.618002891540527, "uptime": 4071.0395468269708, "examples_seen": 8908800.0, "progress": 0.07804300438655508, "epoch": 7.023901037170193, "img/sec/core": 189.6494855653363, "core_hours_Tesla V100-SXM2-32GB": 13.04655000523095, "core_hours": 13.04655000523095}
{"step": 8750, "global_schedule": 0.8748999834060669, "l2_grads": 1.5484724044799805, "l2_params": 248.88803100585938, "l2_updates": 0.880477786064148, "training_loss": 6.113138675689697, "uptime": 4087.9258252849686, "examples_seen": 8960000.0, "progress": 0.0784915274002709, "epoch": 7.064268284510251, "img/sec/core": 189.50297473534715, "core_hours_Tesla V100-SXM2-32GB": 13.12160013171094, "core_hours": 13.12160013171094}
{"step": 8800, "global_schedule": 0.8798999786376953, "l2_grads": 1.2322633266448975, "l2_params": 249.453857421875, "l2_updates": 0.9237368106842041, "training_loss": 5.280052661895752, "uptime": 4104.81723620696, "examples_seen": 9011200.0, "progress": 0.07894005041398675, "epoch": 7.10463553185031, "img/sec/core": 189.4453941579174, "core_hours_Tesla V100-SXM2-32GB": 13.196673069142012, "core_hours": 13.196673069142012}
{"step": 8850, "global_schedule": 0.8848999738693237, "l2_grads": 1.2169588804244995, "l2_params": 250.12135314941406, "l2_updates": 0.9923065900802612, "training_loss": 4.703574180603027, "uptime": 4121.701960131002, "examples_seen": 9062400.0, "progress": 0.07938857342770257, "epoch": 7.145002779190369, "img/sec/core": 189.52042179638565, "core_hours_Tesla V100-SXM2-32GB": 13.2717162865822, "core_hours": 13.2717162865822}
{"step": 8900, "global_schedule": 0.8898999691009521, "l2_grads": 1.1720778942108154, "l2_params": 250.72816467285156, "l2_updates": 0.9839093685150146, "training_loss": 4.542871475219727, "uptime": 4138.583802059991, "examples_seen": 9113600.0, "progress": 0.07983709644141841, "epoch": 7.1853700265304274, "img/sec/core": 189.5527759032635, "core_hours_Tesla V100-SXM2-32GB": 13.346746695155485, "core_hours": 13.346746695155485}
{"step": 8950, "global_schedule": 0.8948999643325806, "l2_grads": 0.9459819793701172, "l2_params": 251.45718383789062, "l2_updates": 0.8843970894813538, "training_loss": 5.788968563079834, "uptime": 4155.4726364089875, "examples_seen": 9164800.0, "progress": 0.08028561945513424, "epoch": 7.225737273870486, "img/sec/core": 189.47429608664496, "core_hours_Tesla V100-SXM2-32GB": 13.421808181151023, "core_hours": 13.421808181151023}
{"step": 9000, "global_schedule": 0.899899959564209, "l2_grads": 1.0017415285110474, "l2_params": 252.1096954345703, "l2_updates": 0.957187831401825, "training_loss": 4.829763412475586, "uptime": 4172.363270398986, "examples_seen": 9216000.0, "progress": 0.08073414246885008, "epoch": 7.266104521210544, "img/sec/core": 189.4541082291408, "core_hours_Tesla V100-SXM2-32GB": 13.496877665551017, "core_hours": 13.496877665551017}
{"step": 9050, "global_schedule": 0.9048999547958374, "l2_grads": 1.0362776517868042, "l2_params": 252.76925659179688, "l2_updates": 0.982168436050415, "training_loss": 4.563256740570068, "uptime": 4189.799206775962, "examples_seen": 9267200.0, "progress": 0.0811826654825659, "epoch": 7.306471768550603, "img/sec/core": 189.43349988312474, "core_hours_Tesla V100-SXM2-32GB": 13.571955316710905, "core_hours": 13.571955316710905}
{"step": 9100, "global_schedule": 0.9098999500274658, "l2_grads": 1.0725812911987305, "l2_params": 253.3812713623047, "l2_updates": 1.0096725225448608, "training_loss": 4.466355323791504, "uptime": 4206.69544434495, "examples_seen": 9318400.0, "progress": 0.08163118849628175, "epoch": 7.346839015890661, "img/sec/core": 189.39127642673552, "core_hours_Tesla V100-SXM2-32GB": 13.647049705906408, "core_hours": 13.647049705906408}
{"step": 9150, "global_schedule": 0.914900004863739, "l2_grads": 1.038016676902771, "l2_params": 254.0167694091797, "l2_updates": 0.9338468313217163, "training_loss": 5.746173858642578, "uptime": 4223.59357084299, "examples_seen": 9369600.0, "progress": 0.08207971150999757, "epoch": 7.38720626323072, "img/sec/core": 189.3701056369349, "core_hours_Tesla V100-SXM2-32GB": 13.722152490342138, "core_hours": 13.722152490342138}
{"step": 9200, "global_schedule": 0.9199000000953674, "l2_grads": 1.19447660446167, "l2_params": 254.75820922851562, "l2_updates": 0.9898189902305603, "training_loss": 4.604168891906738, "uptime": 4240.499963722948, "examples_seen": 9420800.0, "progress": 0.08252823452371341, "epoch": 7.427573510570778, "img/sec/core": 189.27751311123035, "core_hours_Tesla V100-SXM2-32GB": 13.797292014253067, "core_hours": 13.797292014253067}
{"step": 9250, "global_schedule": 0.9248999953269958, "l2_grads": 1.0242130756378174, "l2_params": 255.4944305419922, "l2_updates": 1.0055891275405884, "training_loss": 4.460507869720459, "uptime": 4257.412622176984, "examples_seen": 9472000.0, "progress": 0.08297675753742925, "epoch": 7.467940757910838, "img/sec/core": 189.20739212565786, "core_hours_Tesla V100-SXM2-32GB": 13.87245938515989, "core_hours": 13.87245938515989}
{"step": 9300, "global_schedule": 0.9298999905586243, "l2_grads": 1.1404942274093628, "l2_params": 256.111083984375, "l2_updates": 0.9862880110740662, "training_loss": 4.572149276733398, "uptime": 4274.319444068999, "examples_seen": 9523200.0, "progress": 0.08342528055114508, "epoch": 7.508308005250896, "img/sec/core": 189.27271017809673, "core_hours_Tesla V100-SXM2-32GB": 13.947600815791068, "core_hours": 13.947600815791068}
{"step": 9350, "global_schedule": 0.9348999857902527, "l2_grads": 1.1411360502243042, "l2_params": 256.7784423828125, "l2_updates": 1.0664936304092407, "training_loss": 4.624421119689941, "uptime": 4291.2200557789765, "examples_seen": 9574400.0, "progress": 0.08387380356486092, "epoch": 7.548675252590955, "img/sec/core": 189.3422590207637, "core_hours_Tesla V100-SXM2-32GB": 14.02271464561319, "core_hours": 14.02271464561319}
{"step": 9400, "global_schedule": 0.9398999810218811, "l2_grads": 1.230049967765808, "l2_params": 257.5314636230469, "l2_updates": 1.0007176399230957, "training_loss": 4.51535701751709, "uptime": 4308.142052017967, "examples_seen": 9625600.0, "progress": 0.08432232657857675, "epoch": 7.589042499931013, "img/sec/core": 189.10298494374706, "core_hours_Tesla V100-SXM2-32GB": 14.097923517786484, "core_hours": 14.097923517786484}
{"step": 9450, "global_schedule": 0.9448999762535095, "l2_grads": 1.07886803150177, "l2_params": 258.1344909667969, "l2_updates": 1.0209146738052368, "training_loss": 4.413834571838379, "uptime": 4325.040735500981, "examples_seen": 9676800.0, "progress": 0.08477084959229259, "epoch": 7.629409747271072, "img/sec/core": 189.36386394931634, "core_hours_Tesla V100-SXM2-32GB": 14.17302877771099, "core_hours": 14.17302877771099}
{"step": 9500, "global_schedule": 0.9498999714851379, "l2_grads": 1.0350456237792969, "l2_params": 258.81396484375, "l2_updates": 1.005746603012085, "training_loss": 4.360157489776611, "uptime": 4341.953065323993, "examples_seen": 9728000.0, "progress": 0.08521937260600841, "epoch": 7.66977699461113, "img/sec/core": 189.21106869888283, "core_hours_Tesla V100-SXM2-32GB": 14.248194688035486, "core_hours": 14.248194688035486}
{"step": 9550, "global_schedule": 0.9548999667167664, "l2_grads": 0.8841432929039001, "l2_params": 259.4385986328125, "l2_updates": 0.9270210266113281, "training_loss": 5.684181213378906, "uptime": 4358.867034900002, "examples_seen": 9779200.0, "progress": 0.08566789561972425, "epoch": 7.7101442419511885, "img/sec/core": 189.19272531616818, "core_hours_Tesla V100-SXM2-32GB": 14.323367886151084, "core_hours": 14.323367886151084}
{"step": 9600, "global_schedule": 0.9598999619483948, "l2_grads": 1.1298326253890991, "l2_params": 260.1244201660156, "l2_updates": 1.027336597442627, "training_loss": 4.4824113845825195, "uptime": 4375.759172733, "examples_seen": 9830400.0, "progress": 0.08611641863344008, "epoch": 7.750511489291247, "img/sec/core": 189.43724184803781, "core_hours_Tesla V100-SXM2-32GB": 14.39844405429774, "core_hours": 14.39844405429774}
{"step": 9650, "global_schedule": 0.9648999571800232, "l2_grads": 1.020433783531189, "l2_params": 260.8918151855469, "l2_updates": 0.9721680283546448, "training_loss": 5.162064552307129, "uptime": 4392.6746320129605, "examples_seen": 9881600.0, "progress": 0.08656494164715592, "epoch": 7.7908787366313055, "img/sec/core": 189.17606356636122, "core_hours_Tesla V100-SXM2-32GB": 14.473623873319786, "core_hours": 14.473623873319786}
{"step": 9700, "global_schedule": 0.9698999524116516, "l2_grads": 1.298932433128357, "l2_params": 261.62725830078125, "l2_updates": 0.9813395738601685, "training_loss": 4.454730033874512, "uptime": 4409.578895735962, "examples_seen": 9932800.0, "progress": 0.08701346466087174, "epoch": 7.831245983971365, "img/sec/core": 189.30135334115815, "core_hours_Tesla V100-SXM2-32GB": 14.548753934310904, "core_hours": 14.548753934310904}
{"step": 9750, "global_schedule": 0.97489994764328, "l2_grads": 1.067873477935791, "l2_params": 262.30169677734375, "l2_updates": 1.068083643913269, "training_loss": 4.846660137176514, "uptime": 4426.456901587953, "examples_seen": 9984000.0, "progress": 0.08746198767458759, "epoch": 7.871613231311423, "img/sec/core": 189.59585795038842, "core_hours_Tesla V100-SXM2-32GB": 14.623767293653088, "core_hours": 14.623767293653088}
{"step": 9800, "global_schedule": 0.9799000024795532, "l2_grads": 0.8904595971107483, "l2_params": 262.9306945800781, "l2_updates": 0.9849461317062378, "training_loss": 6.136987686157227, "uptime": 4443.3532201349735, "examples_seen": 10035200.0, "progress": 0.08791051068830341, "epoch": 7.911980478651482, "img/sec/core": 189.39036874185504, "core_hours_Tesla V100-SXM2-32GB": 14.698862042750957, "core_hours": 14.698862042750957}
{"step": 9850, "global_schedule": 0.9848999977111816, "l2_grads": 1.275927186012268, "l2_params": 263.7276306152344, "l2_updates": 1.0447005033493042, "training_loss": 4.484591960906982, "uptime": 4460.243820275995, "examples_seen": 10086400.0, "progress": 0.08835903370201925, "epoch": 7.95234772599154, "img/sec/core": 189.45448789757964, "core_hours_Tesla V100-SXM2-32GB": 14.773931376711053, "core_hours": 14.773931376711053}
{"step": 9900, "global_schedule": 0.9898999929428101, "l2_grads": 1.0242551565170288, "l2_params": 264.3812255859375, "l2_updates": 1.0886059999465942, "training_loss": 4.540975093841553, "uptime": 4477.136133235996, "examples_seen": 10137600.0, "progress": 0.08880755671573508, "epoch": 7.992714973331599, "img/sec/core": 189.43527790287078, "core_hours_Tesla V100-SXM2-32GB": 14.849008323199943, "core_hours": 14.849008323199943}
{"step": 9950, "global_schedule": 0.9948999881744385, "l2_grads": 1.0383776426315308, "l2_params": 265.07855224609375, "l2_updates": 0.9780839085578918, "training_loss": 5.007414817810059, "uptime": 4494.026070257998, "examples_seen": 10188800.0, "progress": 0.08925607972945092, "epoch": 8.033082220671657, "img/sec/core": 189.46192610614122, "core_hours_Tesla V100-SXM2-32GB": 14.9240747099644, "core_hours": 14.9240747099644}
{"step": 10000, "global_schedule": 0.9998999834060669, "l2_grads": 1.3566179275512695, "l2_params": 265.9672546386719, "l2_updates": 1.0906953811645508, "training_loss": 4.364154815673828, "uptime": 4510.913224613003, "examples_seen": 10240000.0, "progress": 0.08970460274316676, "epoch": 8.073449468011717, "img/sec/core": 189.4931456614303, "core_hours_Tesla V100-SXM2-32GB": 14.999128729319976, "core_hours": 14.999128729319976, "minival/prec@1": 0.29261629722135496, "minival/loss": 3.3940372997025494, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.9189425879740156, "real/prec@1": 0.3198753122531332, "real/loss": 4.458003736278877, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.20323568902677, "train/prec@1": 0.29758420169379074, "train/loss": 3.346722313016275, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.594460493011866, "v2/prec@1": 0.2178, "v2/loss": 3.97645380859375, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3724862649687566, "val/prec@1": 0.2791, "val/loss": 3.4883075732421873, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.341588139010128}
{"step": 10050, "global_schedule": 0.9999994039535522, "l2_grads": 1.2200374603271484, "l2_params": 266.58575439453125, "l2_updates": 0.9796658158302307, "training_loss": 4.472228527069092, "uptime": 4564.81400432199, "examples_seen": 10291200.0, "progress": 0.09015312575688259, "epoch": 8.113816715351774, "img/sec/core": 189.2651567545239, "core_hours_Tesla V100-SXM2-32GB": 15.074273158786559, "core_hours": 15.074273158786559}
{"step": 10100, "global_schedule": 0.999997615814209, "l2_grads": 1.1010873317718506, "l2_params": 267.3551330566406, "l2_updates": 1.09795081615448, "training_loss": 4.522805213928223, "uptime": 4581.695248655975, "examples_seen": 10342400.0, "progress": 0.09060164877059843, "epoch": 8.154183962691834, "img/sec/core": 189.55948605979594, "core_hours_Tesla V100-SXM2-32GB": 15.149300911382047, "core_hours": 15.149300911382047}
{"step": 10150, "global_schedule": 0.999994695186615, "l2_grads": 1.1617817878723145, "l2_params": 268.18634033203125, "l2_updates": 1.075120449066162, "training_loss": 4.292905807495117, "uptime": 4598.556682629976, "examples_seen": 10393600.0, "progress": 0.09105017178431425, "epoch": 8.194551210031891, "img/sec/core": 189.78219793963206, "core_hours_Tesla V100-SXM2-32GB": 15.224240617933166, "core_hours": 15.224240617933166}
{"step": 10200, "global_schedule": 0.9999905228614807, "l2_grads": 1.1694148778915405, "l2_params": 268.97796630859375, "l2_updates": 1.0091196298599243, "training_loss": 4.4957685470581055, "uptime": 4615.42136679095, "examples_seen": 10444800.0, "progress": 0.09149869479803009, "epoch": 8.23491845737195, "img/sec/core": 189.74562283266025, "core_hours_Tesla V100-SXM2-32GB": 15.299194769759714, "core_hours": 15.299194769759714}
{"step": 10250, "global_schedule": 0.9999851584434509, "l2_grads": 0.7996388673782349, "l2_params": 269.5700988769531, "l2_updates": 0.9962300658226013, "training_loss": 6.030635356903076, "uptime": 4632.298884845979, "examples_seen": 10496000.0, "progress": 0.09194721781174592, "epoch": 8.275285704712008, "img/sec/core": 189.6013376828505, "core_hours_Tesla V100-SXM2-32GB": 15.374205961115399, "core_hours": 15.374205961115399}
{"step": 10300, "global_schedule": 0.9999785423278809, "l2_grads": 0.9138261675834656, "l2_params": 270.3213806152344, "l2_updates": 1.0192244052886963, "training_loss": 5.564879894256592, "uptime": 4649.168768520991, "examples_seen": 10547200.0, "progress": 0.09239574082546176, "epoch": 8.315652952052067, "img/sec/core": 189.68714080346263, "core_hours_Tesla V100-SXM2-32GB": 15.44918322189323, "core_hours": 15.44918322189323}
{"step": 10350, "global_schedule": 0.9999707937240601, "l2_grads": 0.9321932196617126, "l2_params": 271.001708984375, "l2_updates": 1.0307244062423706, "training_loss": 4.934969425201416, "uptime": 4666.043656577996, "examples_seen": 10598400.0, "progress": 0.09284426383917758, "epoch": 8.356020199392127, "img/sec/core": 189.63088757626, "core_hours_Tesla V100-SXM2-32GB": 15.52418272436881, "core_hours": 15.52418272436881}
{"step": 10400, "global_schedule": 0.9999618530273438, "l2_grads": 1.1760765314102173, "l2_params": 271.6911926269531, "l2_updates": 1.058396577835083, "training_loss": 4.604788780212402, "uptime": 4682.907292728953, "examples_seen": 10649600.0, "progress": 0.09329278685289343, "epoch": 8.396387446732184, "img/sec/core": 189.75741479209765, "core_hours_Tesla V100-SXM2-32GB": 15.59913221837306, "core_hours": 15.59913221837306}
{"step": 10450, "global_schedule": 0.9999517202377319, "l2_grads": 1.0311779975891113, "l2_params": 272.32684326171875, "l2_updates": 1.0916028022766113, "training_loss": 4.648671627044678, "uptime": 4699.789353515953, "examples_seen": 10700800.0, "progress": 0.09374130986660925, "epoch": 8.436754694072244, "img/sec/core": 189.55031855258517, "core_hours_Tesla V100-SXM2-32GB": 15.674163599648615, "core_hours": 15.674163599648615}
{"step": 10500, "global_schedule": 0.9999403357505798, "l2_grads": 0.9741016626358032, "l2_params": 272.9510803222656, "l2_updates": 1.0114154815673828, "training_loss": 6.206577777862549, "uptime": 4716.666889633983, "examples_seen": 10752000.0, "progress": 0.09418983288032509, "epoch": 8.477121941412301, "img/sec/core": 189.60113476406, "core_hours_Tesla V100-SXM2-32GB": 15.749174871284309, "core_hours": 15.749174871284309}
{"step": 10550, "global_schedule": 0.9999277591705322, "l2_grads": 1.0326536893844604, "l2_params": 273.5738525390625, "l2_updates": 1.0751057863235474, "training_loss": 5.654620170593262, "uptime": 4733.547823989997, "examples_seen": 10803200.0, "progress": 0.09463835589404092, "epoch": 8.51748918875236, "img/sec/core": 189.56296686623264, "core_hours_Tesla V100-SXM2-32GB": 15.824201246199923, "core_hours": 15.824201246199923}
{"step": 10600, "global_schedule": 0.9999140501022339, "l2_grads": 0.7912506461143494, "l2_params": 274.2313537597656, "l2_updates": 0.927155077457428, "training_loss": 5.5080342292785645, "uptime": 4750.415188660962, "examples_seen": 10854400.0, "progress": 0.09508687890775676, "epoch": 8.557856436092418, "img/sec/core": 189.71546903876512, "core_hours_Tesla V100-SXM2-32GB": 15.89916731140421, "core_hours": 15.89916731140421}
{"step": 10650, "global_schedule": 0.9998990893363953, "l2_grads": 0.934333324432373, "l2_params": 274.7010192871094, "l2_updates": 0.9843287467956543, "training_loss": 5.9710187911987305, "uptime": 4767.300867107988, "examples_seen": 10905600.0, "progress": 0.09553540192147258, "epoch": 8.598223683432478, "img/sec/core": 189.50970848100843, "core_hours_Tesla V100-SXM2-32GB": 15.974214771168771, "core_hours": 15.974214771168771}
{"step": 10700, "global_schedule": 0.9998829364776611, "l2_grads": 0.9398232698440552, "l2_params": 275.2821960449219, "l2_updates": 1.0772559642791748, "training_loss": 5.389168739318848, "uptime": 4784.192967139999, "examples_seen": 10956800.0, "progress": 0.09598392493518842, "epoch": 8.638590930772535, "img/sec/core": 189.4376657689579, "core_hours_Tesla V100-SXM2-32GB": 16.049290771311046, "core_hours": 16.049290771311046}
{"step": 10750, "global_schedule": 0.9998655915260315, "l2_grads": 0.9049479961395264, "l2_params": 275.8927917480469, "l2_updates": 0.9513688683509827, "training_loss": 5.123607635498047, "uptime": 4801.093379142985, "examples_seen": 11008000.0, "progress": 0.09643244794890427, "epoch": 8.678958178112595, "img/sec/core": 189.34449642024404, "core_hours_Tesla V100-SXM2-32GB": 16.12440371354654, "core_hours": 16.12440371354654}
{"step": 10800, "global_schedule": 0.9998470544815063, "l2_grads": 0.851817786693573, "l2_params": 276.4700927734375, "l2_updates": 1.0303150415420532, "training_loss": 5.9192280769348145, "uptime": 4817.954278924968, "examples_seen": 11059200.0, "progress": 0.09688097096262009, "epoch": 8.719325425452654, "img/sec/core": 189.78821067541347, "core_hours_Tesla V100-SXM2-32GB": 16.199341045910906, "core_hours": 16.199341045910906}
{"step": 10850, "global_schedule": 0.9998272657394409, "l2_grads": 0.9774565100669861, "l2_params": 277.0855712890625, "l2_updates": 1.0497268438339233, "training_loss": 4.862181186676025, "uptime": 4834.834481408994, "examples_seen": 11110400.0, "progress": 0.09732949397633593, "epoch": 8.759692672792712, "img/sec/core": 189.57118571463783, "core_hours_Tesla V100-SXM2-32GB": 16.27436416806213, "core_hours": 16.27436416806213}
{"step": 10900, "global_schedule": 0.9998063445091248, "l2_grads": 0.764284610748291, "l2_params": 277.811279296875, "l2_updates": 0.9025118947029114, "training_loss": 6.003533363342285, "uptime": 4851.69077238196, "examples_seen": 11161600.0, "progress": 0.09777801699005176, "epoch": 8.800059920132771, "img/sec/core": 189.8401021394382, "core_hours_Tesla V100-SXM2-32GB": 16.349281016830872, "core_hours": 16.349281016830872}
{"step": 10950, "global_schedule": 0.9997842311859131, "l2_grads": 1.1808208227157593, "l2_params": 278.52215576171875, "l2_updates": 1.180240273475647, "training_loss": 4.275867462158203, "uptime": 4868.570736532973, "examples_seen": 11212800.0, "progress": 0.0982265400037676, "epoch": 8.840427167472829, "img/sec/core": 189.57386232411545, "core_hours_Tesla V100-SXM2-32GB": 16.42430307972426, "core_hours": 16.42430307972426}
{"step": 11000, "global_schedule": 0.9997608661651611, "l2_grads": 0.9497623443603516, "l2_params": 279.1529846191406, "l2_updates": 1.01434326171875, "training_loss": 6.178974628448486, "uptime": 4885.465733652993, "examples_seen": 11264000.0, "progress": 0.09867506301748342, "epoch": 8.880794414812888, "img/sec/core": 189.40518173916183, "core_hours_Tesla V100-SXM2-32GB": 16.499391955813238, "core_hours": 16.499391955813238}
{"step": 11050, "global_schedule": 0.9997363686561584, "l2_grads": 1.1937803030014038, "l2_params": 279.686767578125, "l2_updates": 1.132827877998352, "training_loss": 4.4015913009643555, "uptime": 4903.151624841965, "examples_seen": 11315200.0, "progress": 0.09912358603119927, "epoch": 8.921161662152945, "img/sec/core": 189.6702103666407, "core_hours_Tesla V100-SXM2-32GB": 16.574375909248676, "core_hours": 16.574375909248676}
{"step": 11100, "global_schedule": 0.9997106194496155, "l2_grads": 0.8997027277946472, "l2_params": 280.2313537597656, "l2_updates": 1.006208896636963, "training_loss": 5.441362380981445, "uptime": 4920.028157932975, "examples_seen": 11366400.0, "progress": 0.09957210904491509, "epoch": 8.961528909493005, "img/sec/core": 189.6124033735699, "core_hours_Tesla V100-SXM2-32GB": 16.6493827229865, "core_hours": 16.6493827229865}
{"step": 11150, "global_schedule": 0.9996837377548218, "l2_grads": 0.7906211018562317, "l2_params": 280.80474853515625, "l2_updates": 0.9981765151023865, "training_loss": 5.735773086547852, "uptime": 4936.9216967289685, "examples_seen": 11417600.0, "progress": 0.10002063205863093, "epoch": 9.001896156833062, "img/sec/core": 189.42153202139545, "core_hours_Tesla V100-SXM2-32GB": 16.72446511763536, "core_hours": 16.72446511763536}
{"step": 11200, "global_schedule": 0.9996556043624878, "l2_grads": 1.125473976135254, "l2_params": 281.4263916015625, "l2_updates": 1.010462999343872, "training_loss": 4.006726264953613, "uptime": 4953.793146510958, "examples_seen": 11468800.0, "progress": 0.10046915507234676, "epoch": 9.042263404173122, "img/sec/core": 189.6695329298907, "core_hours_Tesla V100-SXM2-32GB": 16.799449338888646, "core_hours": 16.799449338888646}
{"step": 11250, "global_schedule": 0.9996262788772583, "l2_grads": 1.0327335596084595, "l2_params": 281.9223937988281, "l2_updates": 1.134953498840332, "training_loss": 4.275514602661133, "uptime": 4970.683816788951, "examples_seen": 11520000.0, "progress": 0.1009176780860626, "epoch": 9.082630651513181, "img/sec/core": 189.45370120505345, "core_hours_Tesla V100-SXM2-32GB": 16.874518984568617, "core_hours": 16.874518984568617}
{"step": 11300, "global_schedule": 0.9995957612991333, "l2_grads": 0.7677459716796875, "l2_params": 282.5458068847656, "l2_updates": 0.9667848348617554, "training_loss": 5.878210067749023, "uptime": 4987.571243145969, "examples_seen": 11571200.0, "progress": 0.10136620109977842, "epoch": 9.122997898853239, "img/sec/core": 189.49009353756207, "core_hours_Tesla V100-SXM2-32GB": 16.94957421282203, "core_hours": 16.94957421282203}
{"step": 11350, "global_schedule": 0.9995640516281128, "l2_grads": 1.1332082748413086, "l2_params": 283.127197265625, "l2_updates": 1.145765781402588, "training_loss": 4.348937511444092, "uptime": 5004.456081141951, "examples_seen": 11622400.0, "progress": 0.10181472411349426, "epoch": 9.163365146193298, "img/sec/core": 189.51914141915523, "core_hours_Tesla V100-SXM2-32GB": 17.024617937248614, "core_hours": 17.024617937248614}
{"step": 11400, "global_schedule": 0.9995311498641968, "l2_grads": 1.219459891319275, "l2_params": 283.74725341796875, "l2_updates": 1.0830022096633911, "training_loss": 4.051757335662842, "uptime": 5021.331488166994, "examples_seen": 11673600.0, "progress": 0.10226324712721009, "epoch": 9.203732393533356, "img/sec/core": 189.62505587279443, "core_hours_Tesla V100-SXM2-32GB": 17.09961974624881, "core_hours": 17.09961974624881}
{"step": 11450, "global_schedule": 0.9994969964027405, "l2_grads": 1.1152057647705078, "l2_params": 284.36773681640625, "l2_updates": 1.0188552141189575, "training_loss": 4.162574768066406, "uptime": 5038.240351396962, "examples_seen": 11724800.0, "progress": 0.10271177014092593, "epoch": 9.244099640873415, "img/sec/core": 189.24986005733004, "core_hours_Tesla V100-SXM2-32GB": 17.17477024949311, "core_hours": 17.17477024949311}
{"step": 11500, "global_schedule": 0.9994616508483887, "l2_grads": 1.2544333934783936, "l2_params": 284.8153991699219, "l2_updates": 1.0765093564987183, "training_loss": 4.2627410888671875, "uptime": 5055.112810087972, "examples_seen": 11776000.0, "progress": 0.10316029315464176, "epoch": 9.284466888213473, "img/sec/core": 189.65819141136672, "core_hours_Tesla V100-SXM2-32GB": 17.24975895478649, "core_hours": 17.24975895478649}
{"step": 11550, "global_schedule": 0.9994251728057861, "l2_grads": 1.1320539712905884, "l2_params": 285.25201416015625, "l2_updates": 1.0547263622283936, "training_loss": 4.148284435272217, "uptime": 5071.988376675989, "examples_seen": 11827200.0, "progress": 0.1036088161683576, "epoch": 9.324834135553532, "img/sec/core": 189.6232629174301, "core_hours_Tesla V100-SXM2-32GB": 17.32476147295545, "core_hours": 17.32476147295545}
{"step": 11600, "global_schedule": 0.9993875026702881, "l2_grads": 1.268906831741333, "l2_params": 285.7479248046875, "l2_updates": 1.0844979286193848, "training_loss": 4.210082530975342, "uptime": 5088.868419409962, "examples_seen": 11878400.0, "progress": 0.10405733918207344, "epoch": 9.365201382893591, "img/sec/core": 189.57297978632963, "core_hours_Tesla V100-SXM2-32GB": 17.399783885106444, "core_hours": 17.399783885106444}
{"step": 11650, "global_schedule": 0.9993485808372498, "l2_grads": 1.0860573053359985, "l2_params": 286.3551940917969, "l2_updates": 1.1292436122894287, "training_loss": 4.870105266571045, "uptime": 5105.753780305968, "examples_seen": 11929600.0, "progress": 0.10450586219578926, "epoch": 9.405568630233649, "img/sec/core": 189.51327245584957, "core_hours_Tesla V100-SXM2-32GB": 17.474829933533137, "core_hours": 17.474829933533137}
{"step": 11700, "global_schedule": 0.9993084669113159, "l2_grads": 1.1625710725784302, "l2_params": 287.0069580078125, "l2_updates": 1.1236268281936646, "training_loss": 4.08085823059082, "uptime": 5122.631895467988, "examples_seen": 11980800.0, "progress": 0.1049543852095051, "epoch": 9.445935877573708, "img/sec/core": 189.59463004498866, "core_hours_Tesla V100-SXM2-32GB": 17.54984377869767, "core_hours": 17.54984377869767}
{"step": 11750, "global_schedule": 0.9992672204971313, "l2_grads": 1.0570056438446045, "l2_params": 287.4841613769531, "l2_updates": 1.0028793811798096, "training_loss": 5.0864386558532715, "uptime": 5139.491633901955, "examples_seen": 12032000.0, "progress": 0.10540290822322093, "epoch": 9.486303124913766, "img/sec/core": 189.80128384157675, "core_hours_Tesla V100-SXM2-32GB": 17.6247759495153, "core_hours": 17.6247759495153}
{"step": 11801, "global_schedule": 0.9992247223854065, "l2_grads": 1.16002357006073, "l2_params": 287.93499755859375, "l2_updates": 1.0188610553741455, "training_loss": 4.924921035766602, "uptime": 5156.371186839999, "examples_seen": 12083200.0, "progress": 0.10585143123693677, "epoch": 9.526670372253825, "img/sec/core": 189.57848064729623, "core_hours_Tesla V100-SXM2-32GB": 17.699796184795495, "core_hours": 17.699796184795495}
{"step": 11850, "global_schedule": 0.9991810321807861, "l2_grads": 1.1945236921310425, "l2_params": 288.4706115722656, "l2_updates": 1.061639428138733, "training_loss": 4.0632195472717285, "uptime": 5173.236704570998, "examples_seen": 12134400.0, "progress": 0.1062999542506526, "epoch": 9.567037619593883, "img/sec/core": 189.73624474737082, "core_hours_Tesla V100-SXM2-32GB": 17.774754041377715, "core_hours": 17.774754041377715}
{"step": 11900, "global_schedule": 0.999136209487915, "l2_grads": 1.8193771839141846, "l2_params": 289.02764892578125, "l2_updates": 0.9964253902435303, "training_loss": 4.140198707580566, "uptime": 5190.129592493991, "examples_seen": 12185600.0, "progress": 0.10674847726436844, "epoch": 9.607404866933942, "img/sec/core": 189.42883032121392, "core_hours_Tesla V100-SXM2-32GB": 17.849833543257684, "core_hours": 17.849833543257684}
{"step": 11950, "global_schedule": 0.9990900754928589, "l2_grads": 1.0807181596755981, "l2_params": 289.4741516113281, "l2_updates": 1.1361316442489624, "training_loss": 3.991137742996216, "uptime": 5206.999106141971, "examples_seen": 12236800.0, "progress": 0.10719700027808426, "epoch": 9.647772114274, "img/sec/core": 189.69130152623964, "core_hours_Tesla V100-SXM2-32GB": 17.924809159470932, "core_hours": 17.924809159470932}
{"step": 12000, "global_schedule": 0.9990428686141968, "l2_grads": 1.2278493642807007, "l2_params": 289.9569396972656, "l2_updates": 1.0085701942443848, "training_loss": 4.061941623687744, "uptime": 5223.89414579398, "examples_seen": 12288000.0, "progress": 0.1076455232918001, "epoch": 9.68813936161406, "img/sec/core": 189.4047049258963, "core_hours_Tesla V100-SXM2-32GB": 17.999898224590968, "core_hours": 17.999898224590968}
{"step": 12050, "global_schedule": 0.9989943504333496, "l2_grads": 1.1497526168823242, "l2_params": 290.5139465332031, "l2_updates": 1.0673695802688599, "training_loss": 4.169745922088623, "uptime": 5241.2837003709865, "examples_seen": 12339200.0, "progress": 0.10809404630551593, "epoch": 9.728506608954119, "img/sec/core": 189.70344622518465, "core_hours_Tesla V100-SXM2-32GB": 18.074869040910983, "core_hours": 18.074869040910983}
{"step": 12100, "global_schedule": 0.9989446997642517, "l2_grads": 1.0358017683029175, "l2_params": 291.003173828125, "l2_updates": 1.02817702293396, "training_loss": 4.255690574645996, "uptime": 5258.144521126989, "examples_seen": 12390400.0, "progress": 0.10854256931923177, "epoch": 9.768873856294176, "img/sec/core": 189.7891002050262, "core_hours_Tesla V100-SXM2-32GB": 18.14980602204877, "core_hours": 18.14980602204877}
{"step": 12150, "global_schedule": 0.9988938570022583, "l2_grads": 1.180609941482544, "l2_params": 291.5008544921875, "l2_updates": 1.0242695808410645, "training_loss": 4.169126510620117, "uptime": 5275.016817386961, "examples_seen": 12441600.0, "progress": 0.1089910923329476, "epoch": 9.809241103634236, "img/sec/core": 189.6600172669939, "core_hours_Tesla V100-SXM2-32GB": 18.22479400542642, "core_hours": 18.22479400542642}
{"step": 12200, "global_schedule": 0.9988417625427246, "l2_grads": 1.085109829902649, "l2_params": 291.96185302734375, "l2_updates": 1.1212211847305298, "training_loss": 4.028820514678955, "uptime": 5291.888946248975, "examples_seen": 12492800.0, "progress": 0.10943961534666344, "epoch": 9.849608350974293, "img/sec/core": 189.66189899156123, "core_hours_Tesla V100-SXM2-32GB": 18.299781244813154, "core_hours": 18.299781244813154}
{"step": 12250, "global_schedule": 0.9987885355949402, "l2_grads": 0.9268732070922852, "l2_params": 292.5213623046875, "l2_updates": 0.9700244665145874, "training_loss": 4.977009296417236, "uptime": 5308.7481449279585, "examples_seen": 12544000.0, "progress": 0.10988813836037926, "epoch": 9.889975598314352, "img/sec/core": 189.807360416786, "core_hours_Tesla V100-SXM2-32GB": 18.374711016719747, "core_hours": 18.374711016719747}
{"step": 12300, "global_schedule": 0.9987341165542603, "l2_grads": 1.2247130870819092, "l2_params": 293.0367736816406, "l2_updates": 1.1455914974212646, "training_loss": 3.9970309734344482, "uptime": 5325.637445265951, "examples_seen": 12595200.0, "progress": 0.1103366613740951, "epoch": 9.93034284565441, "img/sec/core": 189.46906834272914, "core_hours_Tesla V100-SXM2-32GB": 18.449774573777493, "core_hours": 18.449774573777493}
{"step": 12350, "global_schedule": 0.99867844581604, "l2_grads": 1.0972832441329956, "l2_params": 293.4686279296875, "l2_updates": 1.0103751420974731, "training_loss": 4.43673038482666, "uptime": 5342.508553346968, "examples_seen": 12646400.0, "progress": 0.11078518438781094, "epoch": 9.97071009299447, "img/sec/core": 189.6733744240866, "core_hours_Tesla V100-SXM2-32GB": 18.52475727635979, "core_hours": 18.52475727635979}
{"step": 12400, "global_schedule": 0.9986216425895691, "l2_grads": 1.2918270826339722, "l2_params": 293.9491271972656, "l2_updates": 0.9850529432296753, "training_loss": 3.979156970977783, "uptime": 5359.390573073993, "examples_seen": 12697600.0, "progress": 0.11123370740152677, "epoch": 10.011077340334527, "img/sec/core": 189.5507795715554, "core_hours_Tesla V100-SXM2-32GB": 18.599788475146568, "core_hours": 18.599788475146568}
{"step": 12450, "global_schedule": 0.9985636472702026, "l2_grads": 1.1810811758041382, "l2_params": 294.3807067871094, "l2_updates": 1.0788902044296265, "training_loss": 3.9543018341064453, "uptime": 5376.267773611995, "examples_seen": 12748800.0, "progress": 0.11168223041524261, "epoch": 10.051444587674586, "img/sec/core": 189.60490472307487, "core_hours_Tesla V100-SXM2-32GB": 18.674798255315466, "core_hours": 18.674798255315466}
{"step": 12500, "global_schedule": 0.9985044002532959, "l2_grads": 1.1143925189971924, "l2_params": 294.866455078125, "l2_updates": 1.0901705026626587, "training_loss": 3.864398956298828, "uptime": 5393.161574126978, "examples_seen": 12800000.0, "progress": 0.11213075342895844, "epoch": 10.091811835014646, "img/sec/core": 189.41859750042263, "core_hours_Tesla V100-SXM2-32GB": 18.749881813159835, "core_hours": 18.749881813159835, "minival/prec@1": 0.3616141117702154, "minival/loss": 2.9887416338198562, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.9125823919894174, "real/prec@1": 0.39823216687661467, "real/loss": 3.9945124211944485, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.163050422968809, "train/prec@1": 0.37762947351988446, "train/loss": 2.9248996682958524, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.581248839967884, "v2/prec@1": 0.2632, "v2/loss": 3.63672021484375, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.406702846987173, "val/prec@1": 0.3492, "val/loss": 3.085227421875, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.247267456026748}
{"step": 12550, "global_schedule": 0.9984439611434937, "l2_grads": 1.098023772239685, "l2_params": 295.4112854003906, "l2_updates": 1.1168729066848755, "training_loss": 4.098095893859863, "uptime": 5446.4090558529715, "examples_seen": 12851200.0, "progress": 0.11257927644267428, "epoch": 10.132179082354703, "img/sec/core": 188.9624558265814, "core_hours_Tesla V100-SXM2-32GB": 18.82514661727137, "core_hours": 18.82514661727137}
{"step": 12600, "global_schedule": 0.9983823299407959, "l2_grads": 1.1657556295394897, "l2_params": 295.8088073730469, "l2_updates": 1.009631633758545, "training_loss": 4.053195953369141, "uptime": 5463.2806807809975, "examples_seen": 12902400.0, "progress": 0.1130277994563901, "epoch": 10.172546329694763, "img/sec/core": 189.66756395137602, "core_hours_Tesla V100-SXM2-32GB": 18.900131616951487, "core_hours": 18.900131616951487}
{"step": 12650, "global_schedule": 0.9983195662498474, "l2_grads": 0.8629714846611023, "l2_params": 296.2807922363281, "l2_updates": 0.9829097390174866, "training_loss": 6.043212890625, "uptime": 5480.152793026995, "examples_seen": 12953600.0, "progress": 0.11347632247010594, "epoch": 10.21291357703482, "img/sec/core": 189.66208577465687, "core_hours_Tesla V100-SXM2-32GB": 18.97511878248925, "core_hours": 18.97511878248925}
{"step": 12700, "global_schedule": 0.9982555508613586, "l2_grads": 1.1851662397384644, "l2_params": 296.6960754394531, "l2_updates": 1.1302069425582886, "training_loss": 4.026829242706299, "uptime": 5497.032915274962, "examples_seen": 13004800.0, "progress": 0.11392484548382177, "epoch": 10.25328082437488, "img/sec/core": 189.57208680081757, "core_hours_Tesla V100-SXM2-32GB": 19.050141548035768, "core_hours": 19.050141548035768}
{"step": 12750, "global_schedule": 0.9981904029846191, "l2_grads": 1.1320245265960693, "l2_params": 297.1925964355469, "l2_updates": 0.9686138033866882, "training_loss": 4.183197975158691, "uptime": 5513.924402566976, "examples_seen": 13056000.0, "progress": 0.11437336849753761, "epoch": 10.293648071714937, "img/sec/core": 189.44453763481752, "core_hours_Tesla V100-SXM2-32GB": 19.125214824889166, "core_hours": 19.125214824889166}
{"step": 12800, "global_schedule": 0.9981240034103394, "l2_grads": 0.9940457344055176, "l2_params": 297.53094482421875, "l2_updates": 1.0441721677780151, "training_loss": 5.455168724060059, "uptime": 5530.791179667984, "examples_seen": 13107200.0, "progress": 0.11482189151125344, "epoch": 10.334015319054997, "img/sec/core": 189.72207795458485, "core_hours_Tesla V100-SXM2-32GB": 19.200178278671423, "core_hours": 19.200178278671423}
{"step": 12850, "global_schedule": 0.9980564117431641, "l2_grads": 0.8960315585136414, "l2_params": 298.029296875, "l2_updates": 1.0933855772018433, "training_loss": 5.268714427947998, "uptime": 5547.651302605984, "examples_seen": 13158400.0, "progress": 0.11527041452496928, "epoch": 10.374382566395054, "img/sec/core": 189.79695532276878, "core_hours_Tesla V100-SXM2-32GB": 19.275112158395867, "core_hours": 19.275112158395867}
{"step": 12900, "global_schedule": 0.9979876279830933, "l2_grads": 1.0728917121887207, "l2_params": 298.4642028808594, "l2_updates": 1.0834991931915283, "training_loss": 3.8826053142547607, "uptime": 5564.527915350976, "examples_seen": 13209600.0, "progress": 0.1157189375386851, "epoch": 10.414749813735114, "img/sec/core": 189.61150844380552, "core_hours_Tesla V100-SXM2-32GB": 19.35011932615139, "core_hours": 19.35011932615139}
{"step": 12950, "global_schedule": 0.997917652130127, "l2_grads": 1.2050927877426147, "l2_params": 298.9261779785156, "l2_updates": 1.0939369201660156, "training_loss": 3.8494515419006348, "uptime": 5581.397076398949, "examples_seen": 13260800.0, "progress": 0.11616746055240094, "epoch": 10.455117061075173, "img/sec/core": 189.69526646285482, "core_hours_Tesla V100-SXM2-32GB": 19.42509337525349, "core_hours": 19.42509337525349}
{"step": 13000, "global_schedule": 0.9978464841842651, "l2_grads": 1.0879539251327515, "l2_params": 299.3041687011719, "l2_updates": 1.0290119647979736, "training_loss": 3.9350123405456543, "uptime": 5598.285859110998, "examples_seen": 13312000.0, "progress": 0.11661598356611677, "epoch": 10.49548430841523, "img/sec/core": 189.47487539863045, "core_hours_Tesla V100-SXM2-32GB": 19.50015463175149, "core_hours": 19.50015463175149}
{"step": 13050, "global_schedule": 0.9977741241455078, "l2_grads": 1.1557328701019287, "l2_params": 299.6863098144531, "l2_updates": 1.0793935060501099, "training_loss": 3.906635046005249, "uptime": 5615.7159749919665, "examples_seen": 13363200.0, "progress": 0.11706450657983261, "epoch": 10.53585155575529, "img/sec/core": 189.44570871998383, "core_hours_Tesla V100-SXM2-32GB": 19.575227444528913, "core_hours": 19.575227444528913}
{"step": 13100, "global_schedule": 0.997700572013855, "l2_grads": 1.0998679399490356, "l2_params": 300.1014709472656, "l2_updates": 1.0963706970214844, "training_loss": 4.155267715454102, "uptime": 5632.600141948962, "examples_seen": 13414400.0, "progress": 0.11751302959354845, "epoch": 10.576218803095347, "img/sec/core": 189.52667360791196, "core_hours_Tesla V100-SXM2-32GB": 19.650268186560005, "core_hours": 19.650268186560005}
{"step": 13150, "global_schedule": 0.9976258277893066, "l2_grads": 1.121761679649353, "l2_params": 300.5202331542969, "l2_updates": 1.0703436136245728, "training_loss": 4.098562717437744, "uptime": 5649.492625562998, "examples_seen": 13465600.0, "progress": 0.11796155260726428, "epoch": 10.616586050435407, "img/sec/core": 189.43336415855012, "core_hours_Tesla V100-SXM2-32GB": 19.725345891511274, "core_hours": 19.725345891511274}
{"step": 13200, "global_schedule": 0.9975498914718628, "l2_grads": 1.305654764175415, "l2_params": 300.997314453125, "l2_updates": 1.1145453453063965, "training_loss": 4.233192443847656, "uptime": 5666.355617413006, "examples_seen": 13516800.0, "progress": 0.11841007562098012, "epoch": 10.656953297775464, "img/sec/core": 189.76466504064837, "core_hours_Tesla V100-SXM2-32GB": 19.800292521955758, "core_hours": 19.800292521955758}
{"step": 13250, "global_schedule": 0.9974728226661682, "l2_grads": 1.3296362161636353, "l2_params": 301.2940368652344, "l2_updates": 1.051175832748413, "training_loss": 4.003744125366211, "uptime": 5683.233404711005, "examples_seen": 13568000.0, "progress": 0.11885859863469594, "epoch": 10.697320545115524, "img/sec/core": 189.59831306674792, "core_hours_Tesla V100-SXM2-32GB": 19.875304909946863, "core_hours": 19.875304909946863}
{"step": 13300, "global_schedule": 0.9973945021629333, "l2_grads": 1.112662672996521, "l2_params": 301.66534423828125, "l2_updates": 1.1062744855880737, "training_loss": 3.856586456298828, "uptime": 5700.095428375993, "examples_seen": 13619200.0, "progress": 0.11930712164841178, "epoch": 10.737687792455581, "img/sec/core": 189.7755609633314, "core_hours_Tesla V100-SXM2-32GB": 19.950247237346808, "core_hours": 19.950247237346808}
{"step": 13350, "global_schedule": 0.997314989566803, "l2_grads": 1.0409704446792603, "l2_params": 302.11322021484375, "l2_updates": 1.0882892608642578, "training_loss": 4.810594081878662, "uptime": 5716.988439715991, "examples_seen": 13670400.0, "progress": 0.11975564466212761, "epoch": 10.77805503979564, "img/sec/core": 189.4274463915866, "core_hours_Tesla V100-SXM2-32GB": 20.0253272877468, "core_hours": 20.0253272877468}
{"step": 13400, "global_schedule": 0.9972342848777771, "l2_grads": 1.1895475387573242, "l2_params": 302.4962158203125, "l2_updates": 1.0755903720855713, "training_loss": 3.9213054180145264, "uptime": 5733.85476634698, "examples_seen": 13721600.0, "progress": 0.12020416767584345, "epoch": 10.8184222871357, "img/sec/core": 189.72714509872097, "core_hours_Tesla V100-SXM2-32GB": 20.100288739440085, "core_hours": 20.100288739440085}
{"step": 13450, "global_schedule": 0.9971524477005005, "l2_grads": 1.0560263395309448, "l2_params": 302.8525085449219, "l2_updates": 1.1427392959594727, "training_loss": 3.8711814880371094, "uptime": 5750.729540315981, "examples_seen": 13772800.0, "progress": 0.12065269068955928, "epoch": 10.858789534475758, "img/sec/core": 189.6321696443739, "core_hours_Tesla V100-SXM2-32GB": 20.175287734857864, "core_hours": 20.175287734857864}
{"step": 13500, "global_schedule": 0.9970693588256836, "l2_grads": 1.1461361646652222, "l2_params": 303.2832946777344, "l2_updates": 1.0445784330368042, "training_loss": 3.9297590255737305, "uptime": 5767.603872992971, "examples_seen": 13824000.0, "progress": 0.12110121370327512, "epoch": 10.899156781815817, "img/sec/core": 189.63712884263458, "core_hours_Tesla V100-SXM2-32GB": 20.250284768977824, "core_hours": 20.250284768977824}
{"step": 13550, "global_schedule": 0.9969850778579712, "l2_grads": 0.9966997504234314, "l2_params": 303.6966552734375, "l2_updates": 1.0315746068954468, "training_loss": 5.807555198669434, "uptime": 5784.463062880968, "examples_seen": 13875200.0, "progress": 0.12154973671699094, "epoch": 10.939524029155875, "img/sec/core": 189.8074593891551, "core_hours_Tesla V100-SXM2-32GB": 20.325214501813367, "core_hours": 20.325214501813367}
{"step": 13600, "global_schedule": 0.9968996047973633, "l2_grads": 1.0697925090789795, "l2_params": 304.0010070800781, "l2_updates": 1.1076011657714844, "training_loss": 3.840646743774414, "uptime": 5801.3491985089495, "examples_seen": 13926400.0, "progress": 0.12199825973070678, "epoch": 10.979891276495934, "img/sec/core": 189.50457763097793, "core_hours_Tesla V100-SXM2-32GB": 20.400263993493283, "core_hours": 20.400263993493283}
{"step": 13650, "global_schedule": 0.9968129396438599, "l2_grads": 1.1395769119262695, "l2_params": 304.4058837890625, "l2_updates": 1.1538469791412354, "training_loss": 3.7415666580200195, "uptime": 5818.211962948961, "examples_seen": 13977600.0, "progress": 0.12244678274442261, "epoch": 11.020258523835992, "img/sec/core": 189.76722419291937, "core_hours_Tesla V100-SXM2-32GB": 20.475209613226664, "core_hours": 20.475209613226664}
{"step": 13700, "global_schedule": 0.9967250823974609, "l2_grads": 1.2333498001098633, "l2_params": 304.77349853515625, "l2_updates": 1.0746971368789673, "training_loss": 3.8568367958068848, "uptime": 5835.093158526986, "examples_seen": 14028800.0, "progress": 0.12289530575813845, "epoch": 11.060625771176051, "img/sec/core": 189.5600335420234, "core_hours_Tesla V100-SXM2-32GB": 20.550237149129, "core_hours": 20.550237149129}
{"step": 13750, "global_schedule": 0.9966360330581665, "l2_grads": 1.1664172410964966, "l2_params": 305.0969543457031, "l2_updates": 1.0942343473434448, "training_loss": 3.9771156311035156, "uptime": 5851.9814052199945, "examples_seen": 14080000.0, "progress": 0.12334382877185428, "epoch": 11.10099301851611, "img/sec/core": 189.48088917512254, "core_hours_Tesla V100-SXM2-32GB": 20.62529602332015, "core_hours": 20.62529602332015}
{"step": 13800, "global_schedule": 0.9965458512306213, "l2_grads": 1.1317073106765747, "l2_params": 305.49432373046875, "l2_updates": 1.1073880195617676, "training_loss": 4.762063980102539, "uptime": 5868.871280206949, "examples_seen": 14131200.0, "progress": 0.12379235178557012, "epoch": 11.141360265856168, "img/sec/core": 189.4626219833804, "core_hours_Tesla V100-SXM2-32GB": 20.700362134373282, "core_hours": 20.700362134373282}
{"step": 13851, "global_schedule": 0.9964544177055359, "l2_grads": 1.153902530670166, "l2_params": 305.7861328125, "l2_updates": 1.0977741479873657, "training_loss": 3.8334925174713135, "uptime": 5885.731853421952, "examples_seen": 14182400.0, "progress": 0.12424087479928596, "epoch": 11.181727513196227, "img/sec/core": 189.79188662177967, "core_hours_Tesla V100-SXM2-32GB": 20.77529801532885, "core_hours": 20.77529801532885}
{"step": 13900, "global_schedule": 0.9963618516921997, "l2_grads": 1.1150449514389038, "l2_params": 306.1861572265625, "l2_updates": 1.0661910772323608, "training_loss": 3.859933853149414, "uptime": 5902.623139518953, "examples_seen": 14233600.0, "progress": 0.12468939781300178, "epoch": 11.222094760536285, "img/sec/core": 189.44679414127603, "core_hours_Tesla V100-SXM2-32GB": 20.85037039798219, "core_hours": 20.85037039798219}
{"step": 13950, "global_schedule": 0.9962680339813232, "l2_grads": 1.0827432870864868, "l2_params": 306.47845458984375, "l2_updates": 1.0594902038574219, "training_loss": 5.219099044799805, "uptime": 5919.502179692965, "examples_seen": 14284800.0, "progress": 0.12513792082671762, "epoch": 11.262462007876344, "img/sec/core": 189.58423980333845, "core_hours_Tesla V100-SXM2-32GB": 20.925388354311128, "core_hours": 20.925388354311128}
{"step": 14000, "global_schedule": 0.9961730241775513, "l2_grads": 0.9784246683120728, "l2_params": 306.8202209472656, "l2_updates": 1.0543620586395264, "training_loss": 5.1508259773254395, "uptime": 5936.389069219993, "examples_seen": 14336000.0, "progress": 0.12558644384043346, "epoch": 11.302829255216402, "img/sec/core": 189.4961173801905, "core_hours_Tesla V100-SXM2-32GB": 21.000441196653473, "core_hours": 21.000441196653473}
{"step": 14050, "global_schedule": 0.9960768818855286, "l2_grads": 0.9347802400588989, "l2_params": 307.12554931640625, "l2_updates": 1.0788260698318481, "training_loss": 4.823282241821289, "uptime": 5954.057688999979, "examples_seen": 14387200.0, "progress": 0.12603496685414928, "epoch": 11.343196502556461, "img/sec/core": 189.54131112889874, "core_hours_Tesla V100-SXM2-32GB": 21.07547614358676, "core_hours": 21.07547614358676}
{"step": 14100, "global_schedule": 0.9959795475006104, "l2_grads": 1.1721211671829224, "l2_params": 307.468505859375, "l2_updates": 1.1037025451660156, "training_loss": 3.6609349250793457, "uptime": 5970.944197809964, "examples_seen": 14438400.0, "progress": 0.12648348986786512, "epoch": 11.383563749896519, "img/sec/core": 189.50038969025397, "core_hours_Tesla V100-SXM2-32GB": 21.150527293853358, "core_hours": 21.150527293853358}
{"step": 14150, "global_schedule": 0.9958809614181519, "l2_grads": 1.196174144744873, "l2_params": 307.82916259765625, "l2_updates": 1.0953805446624756, "training_loss": 3.8437092304229736, "uptime": 5987.837569775002, "examples_seen": 14489600.0, "progress": 0.12693201288158096, "epoch": 11.423930997236578, "img/sec/core": 189.42340265890584, "core_hours_Tesla V100-SXM2-32GB": 21.2256089470313, "core_hours": 21.2256089470313}
{"step": 14200, "global_schedule": 0.9957812428474426, "l2_grads": 1.249460220336914, "l2_params": 308.0942077636719, "l2_updates": 0.9838734865188599, "training_loss": 3.7953078746795654, "uptime": 6004.727605458, "examples_seen": 14540800.0, "progress": 0.1273805358952968, "epoch": 11.464298244576637, "img/sec/core": 189.46081938839168, "core_hours_Tesla V100-SXM2-32GB": 21.300675772289072, "core_hours": 21.300675772289072}
{"step": 14250, "global_schedule": 0.9956803321838379, "l2_grads": 1.1012953519821167, "l2_params": 308.3800964355469, "l2_updates": 1.0457055568695068, "training_loss": 4.353381633758545, "uptime": 6021.606397661963, "examples_seen": 14592000.0, "progress": 0.1278290589090126, "epoch": 11.504665491916695, "img/sec/core": 189.58702502710497, "core_hours_Tesla V100-SXM2-32GB": 21.37569262652891, "core_hours": 21.37569262652891}
{"step": 14300, "global_schedule": 0.9955781698226929, "l2_grads": 1.0320794582366943, "l2_params": 308.7633056640625, "l2_updates": 1.0629149675369263, "training_loss": 4.5824408531188965, "uptime": 6038.503949866979, "examples_seen": 14643200.0, "progress": 0.12827758192272845, "epoch": 11.545032739256754, "img/sec/core": 189.37654171294284, "core_hours_Tesla V100-SXM2-32GB": 21.450792858551203, "core_hours": 21.450792858551203}
{"step": 14350, "global_schedule": 0.9954749345779419, "l2_grads": 1.1052409410476685, "l2_params": 309.03741455078125, "l2_updates": 1.061617374420166, "training_loss": 3.7920591831207275, "uptime": 6055.4105564799975, "examples_seen": 14694400.0, "progress": 0.1287261049364443, "epoch": 11.585399986596812, "img/sec/core": 189.27512026783663, "core_hours_Tesla V100-SXM2-32GB": 21.525933332386842, "core_hours": 21.525933332386842}
{"step": 14400, "global_schedule": 0.9953703880310059, "l2_grads": 1.1491005420684814, "l2_params": 309.3777160644531, "l2_updates": 1.1408421993255615, "training_loss": 3.74863600730896, "uptime": 6072.28990533395, "examples_seen": 14745600.0, "progress": 0.12917462795016013, "epoch": 11.625767233936871, "img/sec/core": 189.58077279448662, "core_hours_Tesla V100-SXM2-32GB": 21.60095266062663, "core_hours": 21.60095266062663}
{"step": 14450, "global_schedule": 0.9952647686004639, "l2_grads": 0.9731631875038147, "l2_params": 309.6123046875, "l2_updates": 1.0373386144638062, "training_loss": 4.554994583129883, "uptime": 6089.1692420140025, "examples_seen": 14796800.0, "progress": 0.12962315096387594, "epoch": 11.666134481276929, "img/sec/core": 189.580909526001, "core_hours_Tesla V100-SXM2-32GB": 21.675971934760195, "core_hours": 21.675971934760195}
{"step": 14500, "global_schedule": 0.9951578974723816, "l2_grads": 0.8588841557502747, "l2_params": 309.79925537109375, "l2_updates": 1.0376296043395996, "training_loss": 5.868075370788574, "uptime": 6106.067926110001, "examples_seen": 14848000.0, "progress": 0.13007167397759178, "epoch": 11.706501728616988, "img/sec/core": 189.363857080309, "core_hours_Tesla V100-SXM2-32GB": 21.751077197409078, "core_hours": 21.751077197409078}
{"step": 14550, "global_schedule": 0.9950498342514038, "l2_grads": 1.2074716091156006, "l2_params": 310.14581298828125, "l2_updates": 1.039340615272522, "training_loss": 4.127640247344971, "uptime": 6122.960721378971, "examples_seen": 14899200.0, "progress": 0.13052019699130762, "epoch": 11.746868975957046, "img/sec/core": 189.42986930517026, "core_hours_Tesla V100-SXM2-32GB": 21.826156287493394, "core_hours": 21.826156287493394}
{"step": 14600, "global_schedule": 0.9949406385421753, "l2_grads": 1.306969404220581, "l2_params": 310.4325866699219, "l2_updates": 1.0099769830703735, "training_loss": 3.6882071495056152, "uptime": 6139.831540567975, "examples_seen": 14950400.0, "progress": 0.13096872000502346, "epoch": 11.787236223297105, "img/sec/core": 189.67662234716775, "core_hours_Tesla V100-SXM2-32GB": 21.901137706111186, "core_hours": 21.901137706111186}
{"step": 14650, "global_schedule": 0.9948301911354065, "l2_grads": 1.1921758651733398, "l2_params": 310.601318359375, "l2_updates": 1.0873218774795532, "training_loss": 3.7931439876556396, "uptime": 6156.73465542699, "examples_seen": 15001600.0, "progress": 0.1314172430187393, "epoch": 11.827603470637165, "img/sec/core": 189.31421969799723, "core_hours_Tesla V100-SXM2-32GB": 21.976262661040142, "core_hours": 21.976262661040142}
{"step": 14700, "global_schedule": 0.994718611240387, "l2_grads": 1.148988962173462, "l2_params": 310.8614807128906, "l2_updates": 1.0685608386993408, "training_loss": 3.710827350616455, "uptime": 6173.615740315989, "examples_seen": 15052800.0, "progress": 0.13186576603245512, "epoch": 11.867970717977222, "img/sec/core": 189.56127648439144, "core_hours_Tesla V100-SXM2-32GB": 22.051289704991245, "core_hours": 22.051289704991245}
{"step": 14750, "global_schedule": 0.9946057796478271, "l2_grads": 1.153396725654602, "l2_params": 311.2613830566406, "l2_updates": 1.0015870332717896, "training_loss": 3.7859625816345215, "uptime": 6190.49660364195, "examples_seen": 15104000.0, "progress": 0.13231428904617096, "epoch": 11.908337965317282, "img/sec/core": 189.56376449530632, "core_hours_Tesla V100-SXM2-32GB": 22.12631576421774, "core_hours": 22.12631576421774}
{"step": 14800, "global_schedule": 0.9944918155670166, "l2_grads": 0.8254289031028748, "l2_params": 311.5251159667969, "l2_updates": 1.0070592164993286, "training_loss": 5.947600364685059, "uptime": 6207.373964353988, "examples_seen": 15155200.0, "progress": 0.1327628120598868, "epoch": 11.94870521265734, "img/sec/core": 189.6031052839613, "core_hours_Tesla V100-SXM2-32GB": 22.201326256271248, "core_hours": 22.201326256271248}
{"step": 14850, "global_schedule": 0.9943766593933105, "l2_grads": 1.2653095722198486, "l2_params": 311.78692626953125, "l2_updates": 1.126265048980713, "training_loss": 3.8222365379333496, "uptime": 6224.2566118259565, "examples_seen": 15206400.0, "progress": 0.13321133507360264, "epoch": 11.989072459997399, "img/sec/core": 189.54373153341464, "core_hours_Tesla V100-SXM2-32GB": 22.276360245035548, "core_hours": 22.276360245035548}
{"step": 14900, "global_schedule": 0.994260311126709, "l2_grads": 1.1375216245651245, "l2_params": 312.0946044921875, "l2_updates": 1.0673573017120361, "training_loss": 3.5842535495758057, "uptime": 6241.114138287958, "examples_seen": 15257600.0, "progress": 0.13365985808731845, "epoch": 12.029439707337456, "img/sec/core": 189.82618874798482, "core_hours_Tesla V100-SXM2-32GB": 22.351282584866667, "core_hours": 22.351282584866667}
{"step": 14950, "global_schedule": 0.9941427707672119, "l2_grads": 1.0233972072601318, "l2_params": 312.4540100097656, "l2_updates": 1.094306230545044, "training_loss": 3.8272695541381836, "uptime": 6257.996688782994, "examples_seen": 15308800.0, "progress": 0.1341083811010343, "epoch": 12.069806954677516, "img/sec/core": 189.54482031259568, "core_hours_Tesla V100-SXM2-32GB": 22.426316142622383, "core_hours": 22.426316142622383}
{"step": 15000, "global_schedule": 0.9940240979194641, "l2_grads": 0.9602388739585876, "l2_params": 312.760498046875, "l2_updates": 1.0694479942321777, "training_loss": 5.722232341766357, "uptime": 6274.86927479296, "examples_seen": 15360000.0, "progress": 0.13455690411475013, "epoch": 12.110174202017573, "img/sec/core": 189.65676026839805, "core_hours_Tesla V100-SXM2-32GB": 22.501305413777786, "core_hours": 22.501305413777786, "minival/prec@1": 0.4302997190134249, "minival/loss": 2.567939350986868, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.8785216210526414, "real/prec@1": 0.46482481798578046, "real/loss": 3.5505507819172077, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.210177803004626, "train/prec@1": 0.4427272372477852, "train/loss": 2.514565128430184, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.603064128023107, "v2/prec@1": 0.3153, "v2/loss": 3.285883056640625, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3747067349613644, "val/prec@1": 0.40902, "val/loss": 2.70764408203125, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.402834504027851}
{"step": 15050, "global_schedule": 0.9939042329788208, "l2_grads": 1.0961943864822388, "l2_params": 313.1015625, "l2_updates": 1.1220438480377197, "training_loss": 4.025968551635742, "uptime": 6329.033121179964, "examples_seen": 15411200.0, "progress": 0.13500542712846597, "epoch": 12.150541449357632, "img/sec/core": 189.34743889814868, "core_hours_Tesla V100-SXM2-32GB": 22.576417188750735, "core_hours": 22.576417188750735}
{"step": 15100, "global_schedule": 0.9937831163406372, "l2_grads": 1.1404483318328857, "l2_params": 313.38299560546875, "l2_updates": 1.0871018171310425, "training_loss": 3.689462184906006, "uptime": 6345.919990864, "examples_seen": 15462400.0, "progress": 0.13545395014218178, "epoch": 12.190908696697692, "img/sec/core": 189.49634004844913, "core_hours_Tesla V100-SXM2-32GB": 22.651469942902008, "core_hours": 22.651469942902008}
{"step": 15150, "global_schedule": 0.9936608672142029, "l2_grads": 1.2541263103485107, "l2_params": 313.6962585449219, "l2_updates": 1.0393413305282593, "training_loss": 3.8054614067077637, "uptime": 6362.789600080985, "examples_seen": 15513600.0, "progress": 0.13590247315589762, "epoch": 12.23127594403775, "img/sec/core": 189.69022689500977, "core_hours_Tesla V100-SXM2-32GB": 22.726445983866384, "core_hours": 22.726445983866384}
{"step": 15200, "global_schedule": 0.993537425994873, "l2_grads": 1.1623021364212036, "l2_params": 313.9957275390625, "l2_updates": 1.0973950624465942, "training_loss": 4.068944454193115, "uptime": 6379.649264915963, "examples_seen": 15564800.0, "progress": 0.13635099616961346, "epoch": 12.271643191377809, "img/sec/core": 189.8021123979392, "core_hours_Tesla V100-SXM2-32GB": 22.801377827577394, "core_hours": 22.801377827577394}
{"step": 15250, "global_schedule": 0.9934127926826477, "l2_grads": 1.304939866065979, "l2_params": 314.2857666015625, "l2_updates": 1.1349984407424927, "training_loss": 3.704923629760742, "uptime": 6396.519939005957, "examples_seen": 15616000.0, "progress": 0.1367995191833293, "epoch": 12.312010438717866, "img/sec/core": 189.67825369217863, "core_hours_Tesla V100-SXM2-32GB": 22.876358601310702, "core_hours": 22.876358601310702}
{"step": 15300, "global_schedule": 0.9932869672775269, "l2_grads": 1.1889848709106445, "l2_params": 314.5712890625, "l2_updates": 1.1195603609085083, "training_loss": 3.614732503890991, "uptime": 6413.3946040399605, "examples_seen": 15667200.0, "progress": 0.13724804219704512, "epoch": 12.352377686057926, "img/sec/core": 189.6333938215538, "core_hours_Tesla V100-SXM2-32GB": 22.951357112572943, "core_hours": 22.951357112572943}
{"step": 15350, "global_schedule": 0.9931600093841553, "l2_grads": 1.061295509338379, "l2_params": 314.82611083984375, "l2_updates": 1.1074209213256836, "training_loss": 4.104526519775391, "uptime": 6430.23867223796, "examples_seen": 15718400.0, "progress": 0.13769656521076096, "epoch": 12.392744933397983, "img/sec/core": 189.97785822192986, "core_hours_Tesla V100-SXM2-32GB": 23.026219637897384, "core_hours": 23.026219637897384}
{"step": 15400, "global_schedule": 0.9930317997932434, "l2_grads": 1.3026100397109985, "l2_params": 315.117431640625, "l2_updates": 1.036239743232727, "training_loss": 3.7546043395996094, "uptime": 6447.121997319977, "examples_seen": 15769600.0, "progress": 0.1381450882244768, "epoch": 12.433112180738043, "img/sec/core": 189.53612422048352, "core_hours_Tesla V100-SXM2-32GB": 23.101256638261905, "core_hours": 23.101256638261905}
{"step": 15450, "global_schedule": 0.9929024577140808, "l2_grads": 0.9937642812728882, "l2_params": 315.2984924316406, "l2_updates": 0.9478055834770203, "training_loss": 5.724140644073486, "uptime": 6463.9751755109755, "examples_seen": 15820800.0, "progress": 0.13859361123819264, "epoch": 12.4734794280781, "img/sec/core": 189.8751656058035, "core_hours_Tesla V100-SXM2-32GB": 23.17615965244412, "core_hours": 23.17615965244412}
{"step": 15500, "global_schedule": 0.9927719235420227, "l2_grads": 1.098352313041687, "l2_params": 315.5480041503906, "l2_updates": 1.0327895879745483, "training_loss": 3.6848363876342773, "uptime": 6480.8400906329625, "examples_seen": 15872000.0, "progress": 0.13904213425190848, "epoch": 12.51384667541816, "img/sec/core": 189.74302431134805, "core_hours_Tesla V100-SXM2-32GB": 23.25111483076406, "core_hours": 23.25111483076406}
{"step": 15550, "global_schedule": 0.9926401972770691, "l2_grads": 1.2078819274902344, "l2_params": 315.7865295410156, "l2_updates": 1.090401530265808, "training_loss": 3.8294241428375244, "uptime": 6497.708844707988, "examples_seen": 15923200.0, "progress": 0.1394906572656243, "epoch": 12.554213922758219, "img/sec/core": 189.6998430214662, "core_hours_Tesla V100-SXM2-32GB": 23.326087071097508, "core_hours": 23.326087071097508}
{"step": 15600, "global_schedule": 0.9925073385238647, "l2_grads": 1.2404968738555908, "l2_params": 316.0111999511719, "l2_updates": 0.990436315536499, "training_loss": 3.7239081859588623, "uptime": 6514.558878725977, "examples_seen": 15974400.0, "progress": 0.13993918027934013, "epoch": 12.594581170098277, "img/sec/core": 189.91059582335018, "core_hours_Tesla V100-SXM2-32GB": 23.400976111177457, "core_hours": 23.400976111177457}
{"step": 15650, "global_schedule": 0.9923732280731201, "l2_grads": 0.8969954252243042, "l2_params": 316.1579895019531, "l2_updates": 1.0280792713165283, "training_loss": 5.246922969818115, "uptime": 6531.422725720971, "examples_seen": 16025600.0, "progress": 0.14038770329305597, "epoch": 12.634948417438336, "img/sec/core": 189.75504230735643, "core_hours_Tesla V100-SXM2-32GB": 23.475926542266325, "core_hours": 23.475926542266325}
{"step": 15700, "global_schedule": 0.9922379851341248, "l2_grads": 0.9518669843673706, "l2_params": 316.3604431152344, "l2_updates": 1.0645723342895508, "training_loss": 4.796217918395996, "uptime": 6548.2931459060055, "examples_seen": 16076800.0, "progress": 0.1408362263067718, "epoch": 12.675315664778394, "img/sec/core": 189.68110840764575, "core_hours_Tesla V100-SXM2-32GB": 23.550906187533144, "core_hours": 23.550906187533144}
{"step": 15750, "global_schedule": 0.9921015501022339, "l2_grads": 1.1050496101379395, "l2_params": 316.6739501953125, "l2_updates": 1.049473762512207, "training_loss": 3.880690574645996, "uptime": 6565.159332654963, "examples_seen": 16128000.0, "progress": 0.14128474932048762, "epoch": 12.715682912118453, "img/sec/core": 189.72871862680148, "core_hours_Tesla V100-SXM2-32GB": 23.625867017528506, "core_hours": 23.625867017528506}
{"step": 15800, "global_schedule": 0.9919639229774475, "l2_grads": 1.2701890468597412, "l2_params": 316.89593505859375, "l2_updates": 1.0851186513900757, "training_loss": 3.635730743408203, "uptime": 6582.0151307139895, "examples_seen": 16179200.0, "progress": 0.14173327233420346, "epoch": 12.75605015945851, "img/sec/core": 189.84565363170793, "core_hours_Tesla V100-SXM2-32GB": 23.700781675568628, "core_hours": 23.700781675568628}
{"step": 15850, "global_schedule": 0.9918251037597656, "l2_grads": 1.247754454612732, "l2_params": 317.245849609375, "l2_updates": 1.0913251638412476, "training_loss": 3.7529139518737793, "uptime": 6598.885732396971, "examples_seen": 16230400.0, "progress": 0.1421817953479193, "epoch": 12.79641740679857, "img/sec/core": 189.6790677731411, "core_hours_Tesla V100-SXM2-32GB": 23.775762127492992, "core_hours": 23.775762127492992}
{"step": 15900, "global_schedule": 0.991685152053833, "l2_grads": 1.3608213663101196, "l2_params": 317.5045471191406, "l2_updates": 1.0479345321655273, "training_loss": 3.5964694023132324, "uptime": 6615.754113991978, "examples_seen": 16281600.0, "progress": 0.14263031836163514, "epoch": 12.83678465413863, "img/sec/core": 189.70403188811792, "core_hours_Tesla V100-SXM2-32GB": 23.850732712359683, "core_hours": 23.850732712359683}
{"step": 15950, "global_schedule": 0.9915440082550049, "l2_grads": 1.1915467977523804, "l2_params": 317.68475341796875, "l2_updates": 1.0932748317718506, "training_loss": 3.7107558250427246, "uptime": 6632.61006007297, "examples_seen": 16332800.0, "progress": 0.14307884137535096, "epoch": 12.877151901478687, "img/sec/core": 189.8439864854904, "core_hours_Tesla V100-SXM2-32GB": 23.925648028275205, "core_hours": 23.925648028275205}
{"step": 16000, "global_schedule": 0.9914016723632812, "l2_grads": 1.0691630840301514, "l2_params": 317.9012145996094, "l2_updates": 1.0813450813293457, "training_loss": 3.7544145584106445, "uptime": 6649.489954569959, "examples_seen": 16384000.0, "progress": 0.1435273643890668, "epoch": 12.917519148818746, "img/sec/core": 189.57464459097932, "core_hours_Tesla V100-SXM2-32GB": 24.000669781595157, "core_hours": 24.000669781595157}
{"step": 16050, "global_schedule": 0.9912581443786621, "l2_grads": 1.4310113191604614, "l2_params": 318.0886535644531, "l2_updates": 1.031445026397705, "training_loss": 3.716963768005371, "uptime": 6666.905259102001, "examples_seen": 16435200.0, "progress": 0.14397588740278264, "epoch": 12.957886396158804, "img/sec/core": 189.55330254029113, "core_hours_Tesla V100-SXM2-32GB": 24.07569998171103, "core_hours": 24.07569998171103}
{"step": 16100, "global_schedule": 0.9911134839057922, "l2_grads": 1.2960039377212524, "l2_params": 318.27264404296875, "l2_updates": 1.0839266777038574, "training_loss": 3.6405625343322754, "uptime": 6683.783988977957, "examples_seen": 16486400.0, "progress": 0.14442441041649848, "epoch": 12.998253643498863, "img/sec/core": 189.58772511422262, "core_hours_Tesla V100-SXM2-32GB": 24.150716558937503, "core_hours": 24.150716558937503}
{"step": 16150, "global_schedule": 0.9909676313400269, "l2_grads": 1.1135374307632446, "l2_params": 318.44158935546875, "l2_updates": 1.013188123703003, "training_loss": 3.972949504852295, "uptime": 6700.633932505967, "examples_seen": 16537600.0, "progress": 0.14487293343021432, "epoch": 13.03862089083892, "img/sec/core": 189.91161570841868, "core_hours_Tesla V100-SXM2-32GB": 24.225605196839766, "core_hours": 24.225605196839766}
{"step": 16200, "global_schedule": 0.990820586681366, "l2_grads": 0.8784522414207458, "l2_params": 318.6053771972656, "l2_updates": 1.0140433311462402, "training_loss": 5.752344131469727, "uptime": 6717.511210939963, "examples_seen": 16588800.0, "progress": 0.14532145644393013, "epoch": 13.07898813817898, "img/sec/core": 189.60402961381342, "core_hours_Tesla V100-SXM2-32GB": 24.300615323213083, "core_hours": 24.300615323213083}
{"step": 16250, "global_schedule": 0.9906723499298096, "l2_grads": 1.2992726564407349, "l2_params": 318.818115234375, "l2_updates": 1.055397868156433, "training_loss": 3.717836856842041, "uptime": 6734.391687884985, "examples_seen": 16640000.0, "progress": 0.14576997945764597, "epoch": 13.119355385519038, "img/sec/core": 189.5681034618951, "core_hours_Tesla V100-SXM2-32GB": 24.375639665190956, "core_hours": 24.375639665190956}
{"step": 16301, "global_schedule": 0.9905229806900024, "l2_grads": 0.83016037940979, "l2_params": 319.051513671875, "l2_updates": 1.0249944925308228, "training_loss": 5.767398357391357, "uptime": 6751.255782612949, "examples_seen": 16691200.0, "progress": 0.1462185024713618, "epoch": 13.159722632859097, "img/sec/core": 189.75225481233983, "core_hours_Tesla V100-SXM2-32GB": 24.45059119731524, "core_hours": 24.45059119731524}
{"step": 16350, "global_schedule": 0.9903724193572998, "l2_grads": 0.8713321685791016, "l2_params": 319.30322265625, "l2_updates": 1.0155616998672485, "training_loss": 5.229797840118408, "uptime": 6768.115190527984, "examples_seen": 16742400.0, "progress": 0.14666702548507765, "epoch": 13.200089880199156, "img/sec/core": 189.805004785858, "core_hours_Tesla V100-SXM2-32GB": 24.525521899159845, "core_hours": 24.525521899159845}
{"step": 16400, "global_schedule": 0.9902206659317017, "l2_grads": 1.2611912488937378, "l2_params": 319.46649169921875, "l2_updates": 1.038130521774292, "training_loss": 3.570774555206299, "uptime": 6784.986944891978, "examples_seen": 16793600.0, "progress": 0.14711554849879346, "epoch": 13.240457127539214, "img/sec/core": 189.666108868269, "core_hours_Tesla V100-SXM2-32GB": 24.600507474110927, "core_hours": 24.600507474110927}
{"step": 16450, "global_schedule": 0.9900677800178528, "l2_grads": 1.0269129276275635, "l2_params": 319.7047119140625, "l2_updates": 1.0070806741714478, "training_loss": 4.793573379516602, "uptime": 6801.8464802679955, "examples_seen": 16844800.0, "progress": 0.1475640715125093, "epoch": 13.280824374879273, "img/sec/core": 189.80356982743274, "core_hours_Tesla V100-SXM2-32GB": 24.675438742448783, "core_hours": 24.675438742448783}
{"step": 16500, "global_schedule": 0.9899137020111084, "l2_grads": 1.317132830619812, "l2_params": 319.8997497558594, "l2_updates": 0.9763271808624268, "training_loss": 3.599303722381592, "uptime": 6818.709979631996, "examples_seen": 16896000.0, "progress": 0.14801259452622514, "epoch": 13.321191622219331, "img/sec/core": 189.75895399451795, "core_hours_Tesla V100-SXM2-32GB": 24.75038762851101, "core_hours": 24.75038762851101}
{"step": 16550, "global_schedule": 0.9897584319114685, "l2_grads": 0.9421337842941284, "l2_params": 320.1398620605469, "l2_updates": 1.0490080118179321, "training_loss": 5.345444679260254, "uptime": 6835.595085813955, "examples_seen": 16947200.0, "progress": 0.14846111753994098, "epoch": 13.36155886955939, "img/sec/core": 189.5161312884795, "core_hours_Tesla V100-SXM2-32GB": 24.825432544875266, "core_hours": 24.825432544875266}
{"step": 16600, "global_schedule": 0.9896019697189331, "l2_grads": 0.9986655712127686, "l2_params": 320.31591796875, "l2_updates": 1.0157042741775513, "training_loss": 4.708841323852539, "uptime": 6852.467358867987, "examples_seen": 16998400.0, "progress": 0.1489096405536568, "epoch": 13.401926116899448, "img/sec/core": 189.66027812330046, "core_hours_Tesla V100-SXM2-32GB": 24.90042042511541, "core_hours": 24.90042042511541}
{"step": 16650, "global_schedule": 0.989444375038147, "l2_grads": 1.2228885889053345, "l2_params": 320.5709228515625, "l2_updates": 1.1106159687042236, "training_loss": 3.5524353981018066, "uptime": 6869.348125647986, "examples_seen": 17049600.0, "progress": 0.14935816356737264, "epoch": 13.442293364239507, "img/sec/core": 189.56484866501677, "core_hours_Tesla V100-SXM2-32GB": 24.975446055248742, "core_hours": 24.975446055248742}
{"step": 16700, "global_schedule": 0.9892855882644653, "l2_grads": 0.9414964318275452, "l2_params": 320.71868896484375, "l2_updates": 1.0077143907546997, "training_loss": 5.3029584884643555, "uptime": 6886.2231139199575, "examples_seen": 17100800.0, "progress": 0.14980668658108848, "epoch": 13.482660611579565, "img/sec/core": 189.62976142123242, "core_hours_Tesla V100-SXM2-32GB": 25.050446003124172, "core_hours": 25.050446003124172}
{"step": 16750, "global_schedule": 0.989125669002533, "l2_grads": 1.3341854810714722, "l2_params": 320.9322814941406, "l2_updates": 0.9987798929214478, "training_loss": 3.609668731689453, "uptime": 6903.092076326953, "examples_seen": 17152000.0, "progress": 0.15025520959480432, "epoch": 13.523027858919624, "img/sec/core": 189.69750022520248, "core_hours_Tesla V100-SXM2-32GB": 25.125419169377484, "core_hours": 25.125419169377484}
{"step": 16800, "global_schedule": 0.9889645576477051, "l2_grads": 1.1907191276550293, "l2_params": 321.18017578125, "l2_updates": 1.0476495027542114, "training_loss": 3.551103115081787, "uptime": 6919.962262846995, "examples_seen": 17203200.0, "progress": 0.15070373260852013, "epoch": 13.563395106259684, "img/sec/core": 189.68373563614, "core_hours_Tesla V100-SXM2-32GB": 25.200397776133226, "core_hours": 25.200397776133226}
{"step": 16850, "global_schedule": 0.9888022541999817, "l2_grads": 1.4481967687606812, "l2_params": 321.25750732421875, "l2_updates": 0.9924455285072327, "training_loss": 3.5204224586486816, "uptime": 6936.872214537987, "examples_seen": 17254400.0, "progress": 0.15115225562223597, "epoch": 13.603762353599741, "img/sec/core": 189.2376784083113, "core_hours_Tesla V100-SXM2-32GB": 25.275553116982078, "core_hours": 25.275553116982078}
{"step": 16900, "global_schedule": 0.9886387586593628, "l2_grads": 1.2108538150787354, "l2_params": 321.4634704589844, "l2_updates": 1.0541373491287231, "training_loss": 3.5494625568389893, "uptime": 6953.746919928002, "examples_seen": 17305600.0, "progress": 0.1516007786359518, "epoch": 13.6441296009398, "img/sec/core": 189.63294031156576, "core_hours_Tesla V100-SXM2-32GB": 25.350551807604365, "core_hours": 25.350551807604365}
{"step": 16950, "global_schedule": 0.9884741306304932, "l2_grads": 1.253117561340332, "l2_params": 321.6852111816406, "l2_updates": 1.1080974340438843, "training_loss": 3.5120677947998047, "uptime": 6970.621627951972, "examples_seen": 17356800.0, "progress": 0.15204930164966765, "epoch": 13.684496848279858, "img/sec/core": 189.63291071196588, "core_hours_Tesla V100-SXM2-32GB": 25.425550509933124, "core_hours": 25.425550509933124}
{"step": 17000, "global_schedule": 0.988308310508728, "l2_grads": 1.1864728927612305, "l2_params": 321.7977294921875, "l2_updates": 1.0007566213607788, "training_loss": 3.635253429412842, "uptime": 6987.488796374004, "examples_seen": 17408000.0, "progress": 0.1524978246633835, "epoch": 13.724864095619917, "img/sec/core": 189.7176763718207, "core_hours_Tesla V100-SXM2-32GB": 25.50051570291993, "core_hours": 25.50051570291993}
{"step": 17050, "global_schedule": 0.9881413578987122, "l2_grads": 0.8851511478424072, "l2_params": 321.8944091796875, "l2_updates": 0.9974582195281982, "training_loss": 5.570333003997803, "uptime": 7004.914306979976, "examples_seen": 17459200.0, "progress": 0.1529463476770993, "epoch": 13.765231342959975, "img/sec/core": 189.69267393111483, "core_hours_Tesla V100-SXM2-32GB": 25.575490776693137, "core_hours": 25.575490776693137}
{"step": 17100, "global_schedule": 0.9879732131958008, "l2_grads": 0.9521558284759521, "l2_params": 322.0379943847656, "l2_updates": 1.0426442623138428, "training_loss": 4.251349925994873, "uptime": 7021.791386601981, "examples_seen": 17510400.0, "progress": 0.15339487069081514, "epoch": 13.805598590300034, "img/sec/core": 189.6062631492058, "core_hours_Tesla V100-SXM2-32GB": 25.650500019457603, "core_hours": 25.650500019457603}
{"step": 17150, "global_schedule": 0.9878038763999939, "l2_grads": 0.9424025416374207, "l2_params": 322.2929382324219, "l2_updates": 1.0478250980377197, "training_loss": 4.520758628845215, "uptime": 7038.6749974419945, "examples_seen": 17561600.0, "progress": 0.15384339370453098, "epoch": 13.845965837640092, "img/sec/core": 189.53291628921485, "core_hours_Tesla V100-SXM2-32GB": 25.725538289857663, "core_hours": 25.725538289857663}
{"step": 17200, "global_schedule": 0.9876334071159363, "l2_grads": 1.0750031471252441, "l2_params": 322.50323486328125, "l2_updates": 1.0035008192062378, "training_loss": 4.021663665771484, "uptime": 7055.535330172977, "examples_seen": 17612800.0, "progress": 0.15429191671824682, "epoch": 13.886333084980151, "img/sec/core": 189.79459368080023, "core_hours_Tesla V100-SXM2-32GB": 25.800473101995365, "core_hours": 25.800473101995365}
{"step": 17250, "global_schedule": 0.9874617457389832, "l2_grads": 1.1680089235305786, "l2_params": 322.6554260253906, "l2_updates": 1.0815773010253906, "training_loss": 3.5502943992614746, "uptime": 7072.411720973963, "examples_seen": 17664000.0, "progress": 0.15474043973196264, "epoch": 13.92670033232021, "img/sec/core": 189.61400205386602, "core_hours_Tesla V100-SXM2-32GB": 25.875479283333085, "core_hours": 25.875479283333085}
{"step": 17300, "global_schedule": 0.9872889518737793, "l2_grads": 1.0515663623809814, "l2_params": 322.8616943359375, "l2_updates": 1.0166606903076172, "training_loss": 4.06709623336792, "uptime": 7089.286438558949, "examples_seen": 17715200.0, "progress": 0.15518896274567848, "epoch": 13.967067579660268, "img/sec/core": 189.6328032681975, "core_hours_Tesla V100-SXM2-32GB": 25.950478028155242, "core_hours": 25.950478028155242}
{"step": 17350, "global_schedule": 0.9871149063110352, "l2_grads": 1.0346513986587524, "l2_params": 322.9891662597656, "l2_updates": 1.080828309059143, "training_loss": 5.2700910568237305, "uptime": 7106.162218468962, "examples_seen": 17766400.0, "progress": 0.15563748575939432, "epoch": 14.007434827000328, "img/sec/core": 189.62086594299035, "core_hours_Tesla V100-SXM2-32GB": 26.025481494421967, "core_hours": 26.025481494421967}
{"step": 17400, "global_schedule": 0.9869397878646851, "l2_grads": 0.9063394069671631, "l2_params": 323.2317199707031, "l2_updates": 0.9889109134674072, "training_loss": 5.280081748962402, "uptime": 7123.026872052986, "examples_seen": 17817600.0, "progress": 0.15608600877311016, "epoch": 14.047802074340385, "img/sec/core": 189.74596685647202, "core_hours_Tesla V100-SXM2-32GB": 26.10043551035096, "core_hours": 26.10043551035096}
{"step": 17450, "global_schedule": 0.9867634773254395, "l2_grads": 1.0678964853286743, "l2_params": 323.3596496582031, "l2_updates": 1.024312138557434, "training_loss": 4.621310234069824, "uptime": 7139.898740364995, "examples_seen": 17868800.0, "progress": 0.15653453178682597, "epoch": 14.088169321680445, "img/sec/core": 189.66482791489068, "core_hours_Tesla V100-SXM2-32GB": 26.17542159173767, "core_hours": 26.17542159173767}
{"step": 17500, "global_schedule": 0.9865859746932983, "l2_grads": 1.2447218894958496, "l2_params": 323.50006103515625, "l2_updates": 1.0334500074386597, "training_loss": 3.5967650413513184, "uptime": 7156.776110798994, "examples_seen": 17920000.0, "progress": 0.1569830548005418, "epoch": 14.128536569020502, "img/sec/core": 189.60299606589317, "core_hours_Tesla V100-SXM2-32GB": 26.250432126999886, "core_hours": 26.250432126999886, "minival/prec@1": 0.46987199500468313, "minival/loss": 2.3988836302148377, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.925360699999146, "real/prec@1": 0.5075688024425133, "real/loss": 3.356227114781049, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.156287322985008, "train/prec@1": 0.48386215509503183, "train/loss": 2.32714123062082, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.613763685978483, "v2/prec@1": 0.3432, "v2/loss": 3.1394967041015627, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.358661803009454, "val/prec@1": 0.44814, "val/loss": 2.5114396923828126, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.30876318499213}
{"step": 17550, "global_schedule": 0.9864072799682617, "l2_grads": 1.161618947982788, "l2_params": 323.67852783203125, "l2_updates": 1.1330560445785522, "training_loss": 3.6031928062438965, "uptime": 7210.0436470289715, "examples_seen": 17971200.0, "progress": 0.15743157781425765, "epoch": 14.168903816360562, "img/sec/core": 189.31964400562322, "core_hours_Tesla V100-SXM2-32GB": 26.325554929479903, "core_hours": 26.325554929479903}
{"step": 17600, "global_schedule": 0.9862275123596191, "l2_grads": 1.17344069480896, "l2_params": 323.8822326660156, "l2_updates": 1.0664243698120117, "training_loss": 3.4047040939331055, "uptime": 7226.916083688964, "examples_seen": 18022400.0, "progress": 0.1578801008279735, "epoch": 14.20927106370062, "img/sec/core": 189.65843905567755, "core_hours_Tesla V100-SXM2-32GB": 26.40054353685765, "core_hours": 26.40054353685765}
{"step": 17650, "global_schedule": 0.9860464930534363, "l2_grads": 1.0327095985412598, "l2_params": 324.1033935546875, "l2_updates": 1.0140613317489624, "training_loss": 4.903006553649902, "uptime": 7243.78945867595, "examples_seen": 18073600.0, "progress": 0.1583286238416893, "epoch": 14.249638311040679, "img/sec/core": 189.64789216550017, "core_hours_Tesla V100-SXM2-32GB": 26.47553631457759, "core_hours": 26.47553631457759}
{"step": 17700, "global_schedule": 0.9858643412590027, "l2_grads": 1.0508780479431152, "l2_params": 324.2593994140625, "l2_updates": 1.111890435218811, "training_loss": 4.606367588043213, "uptime": 7260.697267254, "examples_seen": 18124800.0, "progress": 0.15877714685540514, "epoch": 14.290005558380738, "img/sec/core": 189.261664823579, "core_hours_Tesla V100-SXM2-32GB": 26.55068213048003, "core_hours": 26.55068213048003}
{"step": 17750, "global_schedule": 0.9856810569763184, "l2_grads": 1.2315764427185059, "l2_params": 324.43182373046875, "l2_updates": 1.0435348749160767, "training_loss": 3.4483256340026855, "uptime": 7277.579750012956, "examples_seen": 18176000.0, "progress": 0.15922566986912098, "epoch": 14.330372805720796, "img/sec/core": 189.54558080637898, "core_hours_Tesla V100-SXM2-32GB": 26.625715387186503, "core_hours": 26.625715387186503}
{"step": 17800, "global_schedule": 0.9854965209960938, "l2_grads": 1.3938324451446533, "l2_params": 324.63275146484375, "l2_updates": 1.0360310077667236, "training_loss": 3.549903392791748, "uptime": 7294.469703917974, "examples_seen": 18227200.0, "progress": 0.15967419288283682, "epoch": 14.370740053060855, "img/sec/core": 189.46173672204472, "core_hours_Tesla V100-SXM2-32GB": 26.700781848986583, "core_hours": 26.700781848986583}
{"step": 17850, "global_schedule": 0.9853109121322632, "l2_grads": 0.8806642293930054, "l2_params": 324.8128662109375, "l2_updates": 1.0285323858261108, "training_loss": 5.519634246826172, "uptime": 7311.37400482496, "examples_seen": 18278400.0, "progress": 0.16012271589655266, "epoch": 14.411107300400912, "img/sec/core": 189.30093693951318, "core_hours_Tesla V100-SXM2-32GB": 26.77591207523985, "core_hours": 26.77591207523985}
{"step": 17900, "global_schedule": 0.9851241111755371, "l2_grads": 0.8617729544639587, "l2_params": 324.9425048828125, "l2_updates": 1.0249332189559937, "training_loss": 5.809337615966797, "uptime": 7328.268415072991, "examples_seen": 18329600.0, "progress": 0.16057123891026848, "epoch": 14.451474547740972, "img/sec/core": 189.41176122871582, "core_hours_Tesla V100-SXM2-32GB": 26.850998343008882, "core_hours": 26.850998343008882}
{"step": 17950, "global_schedule": 0.9849361181259155, "l2_grads": 0.8943889141082764, "l2_params": 325.05010986328125, "l2_updates": 1.0715701580047607, "training_loss": 4.8160080909729, "uptime": 7345.15354073199, "examples_seen": 18380800.0, "progress": 0.16101976192398432, "epoch": 14.49184179508103, "img/sec/core": 189.51591268108788, "core_hours_Tesla V100-SXM2-32GB": 26.926043345937764, "core_hours": 26.926043345937764}
{"step": 18000, "global_schedule": 0.9847469925880432, "l2_grads": 1.1158214807510376, "l2_params": 325.19512939453125, "l2_updates": 1.0527178049087524, "training_loss": 3.381356716156006, "uptime": 7362.060407603974, "examples_seen": 18432000.0, "progress": 0.16146828493770016, "epoch": 14.532209042421089, "img/sec/core": 189.27220662644018, "core_hours_Tesla V100-SXM2-32GB": 27.00118497647992, "core_hours": 27.00118497647992}
{"step": 18050, "global_schedule": 0.9845566749572754, "l2_grads": 1.2309304475784302, "l2_params": 325.3345642089844, "l2_updates": 1.056307315826416, "training_loss": 3.452662467956543, "uptime": 7379.727160983952, "examples_seen": 18483200.0, "progress": 0.161916807951416, "epoch": 14.572576289761148, "img/sec/core": 189.74286952400942, "core_hours_Tesla V100-SXM2-32GB": 27.07614021594636, "core_hours": 27.07614021594636}
{"step": 18100, "global_schedule": 0.9843652248382568, "l2_grads": 1.2665847539901733, "l2_params": 325.52093505859375, "l2_updates": 1.0388352870941162, "training_loss": 3.522251605987549, "uptime": 7396.5834716969985, "examples_seen": 18534400.0, "progress": 0.1623653309651318, "epoch": 14.612943537101206, "img/sec/core": 189.8398798215802, "core_hours_Tesla V100-SXM2-32GB": 27.151057152448793, "core_hours": 27.151057152448793}
{"step": 18150, "global_schedule": 0.9841726422309875, "l2_grads": 1.412811279296875, "l2_params": 325.6016540527344, "l2_updates": 1.033852458000183, "training_loss": 3.418765068054199, "uptime": 7413.46411419299, "examples_seen": 18585600.0, "progress": 0.16281385397884765, "epoch": 14.653310784441265, "img/sec/core": 189.56624433933328, "core_hours_Tesla V100-SXM2-32GB": 27.226082230208753, "core_hours": 27.226082230208753}
{"step": 18200, "global_schedule": 0.9839788675308228, "l2_grads": 1.364783763885498, "l2_params": 325.7098083496094, "l2_updates": 0.9635826349258423, "training_loss": 3.4309334754943848, "uptime": 7430.320561721979, "examples_seen": 18636800.0, "progress": 0.1632623769925635, "epoch": 14.693678031781323, "img/sec/core": 189.8383389795909, "core_hours_Tesla V100-SXM2-32GB": 27.30099977478204, "core_hours": 27.30099977478204}
{"step": 18250, "global_schedule": 0.9837839603424072, "l2_grads": 0.9514800310134888, "l2_params": 325.7717590332031, "l2_updates": 1.0616071224212646, "training_loss": 4.267490386962891, "uptime": 7447.189833790006, "examples_seen": 18688000.0, "progress": 0.16371090000627933, "epoch": 14.734045279121382, "img/sec/core": 189.69401804036264, "core_hours_Tesla V100-SXM2-32GB": 27.3759743173066, "core_hours": 27.3759743173066}
{"step": 18300, "global_schedule": 0.9835878610610962, "l2_grads": 1.1480576992034912, "l2_params": 325.9656066894531, "l2_updates": 1.0541268587112427, "training_loss": 3.5399680137634277, "uptime": 7464.076062528999, "examples_seen": 18739200.0, "progress": 0.16415942301999514, "epoch": 14.77441252646144, "img/sec/core": 189.50353269884945, "core_hours_Tesla V100-SXM2-32GB": 27.45102422281324, "core_hours": 27.45102422281324}
{"step": 18350, "global_schedule": 0.9833905696868896, "l2_grads": 1.2576963901519775, "l2_params": 325.998779296875, "l2_updates": 1.052497386932373, "training_loss": 3.401329278945923, "uptime": 7480.952719381952, "examples_seen": 18790400.0, "progress": 0.16460794603371098, "epoch": 14.814779773801499, "img/sec/core": 189.6110128849343, "core_hours_Tesla V100-SXM2-32GB": 27.52603158660414, "core_hours": 27.52603158660414}
{"step": 18400, "global_schedule": 0.9831922054290771, "l2_grads": 1.2013431787490845, "l2_params": 326.09149169921875, "l2_updates": 1.093232274055481, "training_loss": 3.4944944381713867, "uptime": 7497.8183166899835, "examples_seen": 18841600.0, "progress": 0.16505646904742682, "epoch": 14.855147021141557, "img/sec/core": 189.73534951389962, "core_hours_Tesla V100-SXM2-32GB": 27.60098979686206, "core_hours": 27.60098979686206}
{"step": 18450, "global_schedule": 0.9829926490783691, "l2_grads": 0.917005181312561, "l2_params": 326.3154296875, "l2_updates": 1.0407923460006714, "training_loss": 4.754462242126465, "uptime": 7514.711403946974, "examples_seen": 18892800.0, "progress": 0.16550499206114266, "epoch": 14.895514268481616, "img/sec/core": 189.42659511071602, "core_hours_Tesla V100-SXM2-32GB": 27.676070184670905, "core_hours": 27.676070184670905}
{"step": 18500, "global_schedule": 0.9827919006347656, "l2_grads": 1.2721033096313477, "l2_params": 326.43505859375, "l2_updates": 1.087304711341858, "training_loss": 3.4520797729492188, "uptime": 7531.606679595949, "examples_seen": 18944000.0, "progress": 0.1659535150748585, "epoch": 14.935881515821675, "img/sec/core": 189.4020592788766, "core_hours_Tesla V100-SXM2-32GB": 27.751160298666345, "core_hours": 27.751160298666345}
{"step": 18550, "global_schedule": 0.9825900197029114, "l2_grads": 1.1919636726379395, "l2_params": 326.5813293457031, "l2_updates": 1.0406341552734375, "training_loss": 3.461627960205078, "uptime": 7548.49265157897, "examples_seen": 18995200.0, "progress": 0.16640203808857432, "epoch": 14.976248763161733, "img/sec/core": 189.50641415356588, "core_hours_Tesla V100-SXM2-32GB": 27.826209063035332, "core_hours": 27.826209063035332}
{"step": 18600, "global_schedule": 0.9823869466781616, "l2_grads": 1.221732258796692, "l2_params": 326.81292724609375, "l2_updates": 1.0539720058441162, "training_loss": 3.568726062774658, "uptime": 7565.375360731967, "examples_seen": 19046400.0, "progress": 0.16685056110229016, "epoch": 15.016616010501792, "img/sec/core": 189.54303903482378, "core_hours_Tesla V100-SXM2-32GB": 27.90124332593754, "core_hours": 27.90124332593754}
{"step": 18650, "global_schedule": 0.9821827411651611, "l2_grads": 0.9114201068878174, "l2_params": 326.9483947753906, "l2_updates": 1.0451616048812866, "training_loss": 4.691920757293701, "uptime": 7582.269179441966, "examples_seen": 19097600.0, "progress": 0.167299084116006, "epoch": 15.05698325784185, "img/sec/core": 189.41839349240468, "core_hours_Tesla V100-SXM2-32GB": 27.97632696464865, "core_hours": 27.97632696464865}
{"step": 18700, "global_schedule": 0.9819774627685547, "l2_grads": 1.25361168384552, "l2_params": 327.1581726074219, "l2_updates": 1.0023002624511719, "training_loss": 5.640860557556152, "uptime": 7599.161726958002, "examples_seen": 19148800.0, "progress": 0.16774760712972184, "epoch": 15.09735050518191, "img/sec/core": 189.43264756025027, "core_hours_Tesla V100-SXM2-32GB": 28.05140495360881, "core_hours": 28.05140495360881}
{"step": 18750, "global_schedule": 0.981770932674408, "l2_grads": 1.0784472227096558, "l2_params": 327.228515625, "l2_updates": 1.0207314491271973, "training_loss": 3.933943033218384, "uptime": 7616.044903254951, "examples_seen": 19200000.0, "progress": 0.16819613014343765, "epoch": 15.137717752521967, "img/sec/core": 189.5377945308909, "core_hours_Tesla V100-SXM2-32GB": 28.12644129270636, "core_hours": 28.12644129270636}
{"step": 18800, "global_schedule": 0.9815632700920105, "l2_grads": 0.9752188920974731, "l2_params": 327.3848571777344, "l2_updates": 1.0690652132034302, "training_loss": 5.27346658706665, "uptime": 7632.919606718002, "examples_seen": 19251200.0, "progress": 0.1686446531571535, "epoch": 15.178084999862026, "img/sec/core": 189.63296196622574, "core_hours_Tesla V100-SXM2-32GB": 28.201439974764362, "core_hours": 28.201439974764362}
{"step": 18850, "global_schedule": 0.9813544750213623, "l2_grads": 1.0433443784713745, "l2_params": 327.63543701171875, "l2_updates": 1.0900118350982666, "training_loss": 4.141619682312012, "uptime": 7649.807639645005, "examples_seen": 19302400.0, "progress": 0.16909317617086933, "epoch": 15.218452247202084, "img/sec/core": 189.48328759374579, "core_hours_Tesla V100-SXM2-32GB": 28.276497898884376, "core_hours": 28.276497898884376}
{"step": 18900, "global_schedule": 0.9811444878578186, "l2_grads": 1.2758015394210815, "l2_params": 327.7960510253906, "l2_updates": 0.9752820730209351, "training_loss": 4.358972549438477, "uptime": 7666.713070038997, "examples_seen": 19353600.0, "progress": 0.16954169918458517, "epoch": 15.258819494542143, "img/sec/core": 189.28828934974916, "core_hours_Tesla V100-SXM2-32GB": 28.351633145079898, "core_hours": 28.351633145079898}
{"step": 18950, "global_schedule": 0.9809333682060242, "l2_grads": 1.329959750175476, "l2_params": 327.8914794921875, "l2_updates": 0.973159670829773, "training_loss": 3.3376071453094482, "uptime": 7683.561798398965, "examples_seen": 19404800.0, "progress": 0.16999022219830098, "epoch": 15.299186741882203, "img/sec/core": 189.92531255967674, "core_hours_Tesla V100-SXM2-32GB": 28.42651638223531, "core_hours": 28.42651638223531}
{"step": 19000, "global_schedule": 0.980721116065979, "l2_grads": 1.2815301418304443, "l2_params": 328.0376892089844, "l2_updates": 0.9746617078781128, "training_loss": 3.418236017227173, "uptime": 7700.4516862409655, "examples_seen": 19456000.0, "progress": 0.17043874521201682, "epoch": 15.33955398922226, "img/sec/core": 189.4624777816753, "core_hours_Tesla V100-SXM2-32GB": 28.50158255042198, "core_hours": 28.50158255042198}
{"step": 19050, "global_schedule": 0.9805076718330383, "l2_grads": 1.2139548063278198, "l2_params": 328.1659240722656, "l2_updates": 1.0678930282592773, "training_loss": 3.48307466506958, "uptime": 7718.085885488952, "examples_seen": 19507200.0, "progress": 0.17088726822573266, "epoch": 15.37992123656232, "img/sec/core": 189.361267481139, "core_hours_Tesla V100-SXM2-32GB": 28.57668884016858, "core_hours": 28.57668884016858}
{"step": 19100, "global_schedule": 0.9802930951118469, "l2_grads": 1.2007514238357544, "l2_params": 328.28155517578125, "l2_updates": 1.0245064496994019, "training_loss": 3.496433734893799, "uptime": 7734.950159146974, "examples_seen": 19558400.0, "progress": 0.1713357912394485, "epoch": 15.420288483902377, "img/sec/core": 189.75024153962121, "core_hours_Tesla V100-SXM2-32GB": 28.651641167537566, "core_hours": 28.651641167537566}
{"step": 19150, "global_schedule": 0.9800773859024048, "l2_grads": 1.4016501903533936, "l2_params": 328.3965759277344, "l2_updates": 1.0771080255508423, "training_loss": 3.4766530990600586, "uptime": 7751.83954654797, "examples_seen": 19609600.0, "progress": 0.17178431425316432, "epoch": 15.460655731242436, "img/sec/core": 189.46809164975335, "core_hours_Tesla V100-SXM2-32GB": 28.726705111541992, "core_hours": 28.726705111541992}
{"step": 19200, "global_schedule": 0.9798605442047119, "l2_grads": 1.2341562509536743, "l2_params": 328.55535888671875, "l2_updates": 1.0401240587234497, "training_loss": 3.9447267055511475, "uptime": 7768.724768603977, "examples_seen": 19660800.0, "progress": 0.17223283726688016, "epoch": 15.501022978582494, "img/sec/core": 189.51483074286807, "core_hours_Tesla V100-SXM2-32GB": 28.801750542902024, "core_hours": 28.801750542902024}
{"step": 19250, "global_schedule": 0.9796425104141235, "l2_grads": 1.0604833364486694, "l2_params": 328.652587890625, "l2_updates": 1.0008518695831299, "training_loss": 4.084192752838135, "uptime": 7785.611420233967, "examples_seen": 19712000.0, "progress": 0.172681360280596, "epoch": 15.541390225922553, "img/sec/core": 189.4987869778178, "core_hours_Tesla V100-SXM2-32GB": 28.876802327924203, "core_hours": 28.876802327924203}
{"step": 19300, "global_schedule": 0.9794232845306396, "l2_grads": 1.1630525588989258, "l2_params": 328.7274169921875, "l2_updates": 1.051851511001587, "training_loss": 3.561506986618042, "uptime": 7802.508075556951, "examples_seen": 19763200.0, "progress": 0.17312988329431184, "epoch": 15.581757473262611, "img/sec/core": 189.38659390460342, "core_hours_Tesla V100-SXM2-32GB": 28.951898573804126, "core_hours": 28.951898573804126}
{"step": 19350, "global_schedule": 0.9792029857635498, "l2_grads": 1.1578342914581299, "l2_params": 328.7687072753906, "l2_updates": 1.0275896787643433, "training_loss": 3.478701114654541, "uptime": 7819.415934254997, "examples_seen": 19814400.0, "progress": 0.17357840630802768, "epoch": 15.62212472060267, "img/sec/core": 189.26110379486855, "core_hours_Tesla V100-SXM2-32GB": 29.027044612462117, "core_hours": 29.027044612462117}
{"step": 19400, "global_schedule": 0.9789814949035645, "l2_grads": 1.3601118326187134, "l2_params": 328.8912048339844, "l2_updates": 1.0567176342010498, "training_loss": 3.372523784637451, "uptime": 7836.276398646005, "examples_seen": 19865600.0, "progress": 0.1740269293217435, "epoch": 15.66249196794273, "img/sec/core": 189.79311161243604, "core_hours_Tesla V100-SXM2-32GB": 29.101980009755483, "core_hours": 29.101980009755483}
{"step": 19450, "global_schedule": 0.9787589311599731, "l2_grads": 0.9209449291229248, "l2_params": 329.0270690917969, "l2_updates": 1.030378818511963, "training_loss": 5.306751728057861, "uptime": 7853.167467044957, "examples_seen": 19916800.0, "progress": 0.17447545233545933, "epoch": 15.702859215282787, "img/sec/core": 189.44923579839693, "core_hours_Tesla V100-SXM2-32GB": 29.177051424861936, "core_hours": 29.177051424861936}
{"step": 19500, "global_schedule": 0.9785351753234863, "l2_grads": 1.3496685028076172, "l2_params": 329.0699157714844, "l2_updates": 1.0196655988693237, "training_loss": 3.3211941719055176, "uptime": 7870.0501773949945, "examples_seen": 19968000.0, "progress": 0.17492397534917517, "epoch": 15.743226462622847, "img/sec/core": 189.5430255955893, "core_hours_Tesla V100-SXM2-32GB": 29.252085693084325, "core_hours": 29.252085693084325}
{"step": 19550, "global_schedule": 0.978310227394104, "l2_grads": 1.274251103401184, "l2_params": 329.2392883300781, "l2_updates": 1.056934118270874, "training_loss": 3.409263849258423, "uptime": 7886.941367533, "examples_seen": 20019200.0, "progress": 0.175372498362891, "epoch": 15.783593709962904, "img/sec/core": 189.44787039013897, "core_hours_Tesla V100-SXM2-32GB": 29.327157649253238, "core_hours": 29.327157649253238}
{"step": 19600, "global_schedule": 0.9780842065811157, "l2_grads": 1.1519827842712402, "l2_params": 329.3681640625, "l2_updates": 1.0232577323913574, "training_loss": 3.373744010925293, "uptime": 7903.809224298981, "examples_seen": 20070400.0, "progress": 0.17582102137660682, "epoch": 15.823960957302964, "img/sec/core": 189.70993436781927, "core_hours_Tesla V100-SXM2-32GB": 29.402125901546484, "core_hours": 29.402125901546484}
{"step": 19650, "global_schedule": 0.9778569936752319, "l2_grads": 1.2850303649902344, "l2_params": 329.4212646484375, "l2_updates": 1.0256205797195435, "training_loss": 3.3075990676879883, "uptime": 7920.698219996993, "examples_seen": 20121600.0, "progress": 0.17626954439032266, "epoch": 15.864328204643021, "img/sec/core": 189.47248594399875, "core_hours_Tesla V100-SXM2-32GB": 29.477188104648764, "core_hours": 29.477188104648764}
{"step": 19700, "global_schedule": 0.9776285886764526, "l2_grads": 1.0318905115127563, "l2_params": 329.5209655761719, "l2_updates": 1.0533870458602905, "training_loss": 4.373838424682617, "uptime": 7937.595361112966, "examples_seen": 20172800.0, "progress": 0.1767180674040385, "epoch": 15.90469545198308, "img/sec/core": 189.3811490379907, "core_hours_Tesla V100-SXM2-32GB": 29.552286509608642, "core_hours": 29.552286509608642}
{"step": 19750, "global_schedule": 0.9773991107940674, "l2_grads": 0.9751418828964233, "l2_params": 329.63616943359375, "l2_updates": 1.0295013189315796, "training_loss": 4.5483832359313965, "uptime": 7954.493297241977, "examples_seen": 20224000.0, "progress": 0.17716659041775434, "epoch": 15.94506269932314, "img/sec/core": 189.37223904557678, "core_hours_Tesla V100-SXM2-32GB": 29.627388447959802, "core_hours": 29.627388447959802}
{"step": 19800, "global_schedule": 0.9771684408187866, "l2_grads": 1.3017841577529907, "l2_params": 329.777099609375, "l2_updates": 1.0360815525054932, "training_loss": 3.290113925933838, "uptime": 7971.37920241995, "examples_seen": 20275200.0, "progress": 0.17761511343147016, "epoch": 15.985429946663197, "img/sec/core": 189.50716389040977, "core_hours_Tesla V100-SXM2-32GB": 29.70243691541746, "core_hours": 29.70243691541746}
{"step": 19850, "global_schedule": 0.9769366979598999, "l2_grads": 1.1070131063461304, "l2_params": 329.91973876953125, "l2_updates": 1.0674769878387451, "training_loss": 5.713017463684082, "uptime": 7988.254938858969, "examples_seen": 20326400.0, "progress": 0.178063636445186, "epoch": 16.025797194003257, "img/sec/core": 189.62135439620027, "core_hours_Tesla V100-SXM2-32GB": 29.777440188479765, "core_hours": 29.777440188479765}
{"step": 19900, "global_schedule": 0.9767037630081177, "l2_grads": 1.1174020767211914, "l2_params": 330.0522766113281, "l2_updates": 1.0434781312942505, "training_loss": 5.687281608581543, "uptime": 8005.155398478964, "examples_seen": 20377600.0, "progress": 0.17851215945890184, "epoch": 16.066164441343314, "img/sec/core": 189.34396294251903, "core_hours_Tesla V100-SXM2-32GB": 29.852553342346415, "core_hours": 29.852553342346415}
{"step": 19950, "global_schedule": 0.9764697551727295, "l2_grads": 1.343176007270813, "l2_params": 330.1546630859375, "l2_updates": 1.0847699642181396, "training_loss": 3.532747507095337, "uptime": 8022.041205856949, "examples_seen": 20428800.0, "progress": 0.17896068247261768, "epoch": 16.106531688683372, "img/sec/core": 189.50826148663003, "core_hours_Tesla V100-SXM2-32GB": 29.927601375137456, "core_hours": 29.927601375137456}
{"step": 20000, "global_schedule": 0.976234495639801, "l2_grads": 1.0914877653121948, "l2_params": 330.24725341796875, "l2_updates": 1.0139626264572144, "training_loss": 5.33206844329834, "uptime": 8038.922938144999, "examples_seen": 20480000.0, "progress": 0.17940920548633352, "epoch": 16.146898936023433, "img/sec/core": 189.55400698216607, "core_hours_Tesla V100-SXM2-32GB": 30.002631296417675, "core_hours": 30.002631296417675, "minival/prec@1": 0.5029659694036841, "minival/loss": 2.1898634782851283, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.9156333989812993, "real/prec@1": 0.5401285308623525, "real/loss": 3.13022881695261, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.177209009008948, "train/prec@1": 0.5182843539007923, "train/loss": 2.1010010423069607, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.599448376975488, "v2/prec@1": 0.3678, "v2/loss": 2.985516357421875, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.377918791025877, "val/prec@1": 0.47484, "val/loss": 2.3265645947265625, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.310694893007167}
{"step": 20050, "global_schedule": 0.9759981632232666, "l2_grads": 1.2005317211151123, "l2_params": 330.35272216796875, "l2_updates": 1.076236605644226, "training_loss": 3.628091335296631, "uptime": 8092.740070841974, "examples_seen": 20531200.0, "progress": 0.17985772850004933, "epoch": 16.18726618336349, "img/sec/core": 189.02815697632604, "core_hours_Tesla V100-SXM2-32GB": 30.077869940489116, "core_hours": 30.077869940489116}
{"step": 20100, "global_schedule": 0.9757606983184814, "l2_grads": 1.1431598663330078, "l2_params": 330.4816589355469, "l2_updates": 1.0532926321029663, "training_loss": 3.9803831577301025, "uptime": 8109.610645240988, "examples_seen": 20582400.0, "progress": 0.18030625151376517, "epoch": 16.22763343070355, "img/sec/core": 189.6793745319675, "core_hours_Tesla V100-SXM2-32GB": 30.1528502711514, "core_hours": 30.1528502711514}
{"step": 20150, "global_schedule": 0.9755220413208008, "l2_grads": 0.9761708378791809, "l2_params": 330.57781982421875, "l2_updates": 0.9961594343185425, "training_loss": 5.07719612121582, "uptime": 8126.506242831005, "examples_seen": 20633600.0, "progress": 0.180754774527481, "epoch": 16.268000678043606, "img/sec/core": 189.39845027385948, "core_hours_Tesla V100-SXM2-32GB": 30.22794181599592, "core_hours": 30.22794181599592}
{"step": 20200, "global_schedule": 0.9752823114395142, "l2_grads": 1.0924512147903442, "l2_params": 330.6999206542969, "l2_updates": 1.0524638891220093, "training_loss": 4.532336235046387, "uptime": 8143.394506783981, "examples_seen": 20684800.0, "progress": 0.18120329754119685, "epoch": 16.308367925383667, "img/sec/core": 189.48069552382853, "core_hours_Tesla V100-SXM2-32GB": 30.30300076689804, "core_hours": 30.30300076689804}
{"step": 20250, "global_schedule": 0.975041389465332, "l2_grads": 1.328259825706482, "l2_params": 330.7515869140625, "l2_updates": 1.0003637075424194, "training_loss": 3.281860589981079, "uptime": 8160.273802361975, "examples_seen": 20736000.0, "progress": 0.18165182055491266, "epoch": 16.348735172723725, "img/sec/core": 189.58137116646031, "core_hours_Tesla V100-SXM2-32GB": 30.37801985835579, "core_hours": 30.37801985835579}
{"step": 20300, "global_schedule": 0.9747993350028992, "l2_grads": 1.2248364686965942, "l2_params": 330.83843994140625, "l2_updates": 1.0529168844223022, "training_loss": 3.377711534500122, "uptime": 8177.150361018954, "examples_seen": 20787200.0, "progress": 0.1821003435686285, "epoch": 16.389102420063782, "img/sec/core": 189.61211613344636, "core_hours_Tesla V100-SXM2-32GB": 30.453026785720137, "core_hours": 30.453026785720137}
{"step": 20350, "global_schedule": 0.9745561480522156, "l2_grads": 1.2171329259872437, "l2_params": 330.92041015625, "l2_updates": 1.0684154033660889, "training_loss": 3.3346335887908936, "uptime": 8194.051126523991, "examples_seen": 20838400.0, "progress": 0.18254886658234434, "epoch": 16.429469667403843, "img/sec/core": 189.34053602756873, "core_hours_Tesla V100-SXM2-32GB": 30.52814129907586, "core_hours": 30.52814129907586}
{"step": 20400, "global_schedule": 0.9743118286132812, "l2_grads": 1.1870718002319336, "l2_params": 331.0267028808594, "l2_updates": 1.1008788347244263, "training_loss": 3.288027763366699, "uptime": 8210.926486425975, "examples_seen": 20889600.0, "progress": 0.18299738959606018, "epoch": 16.4698369147439, "img/sec/core": 189.62558538522364, "core_hours_Tesla V100-SXM2-32GB": 30.603142898640233, "core_hours": 30.603142898640233}
{"step": 20450, "global_schedule": 0.9740663766860962, "l2_grads": 1.4467792510986328, "l2_params": 331.0952453613281, "l2_updates": 0.9906981587409973, "training_loss": 3.2712435722351074, "uptime": 8227.79544244497, "examples_seen": 20940800.0, "progress": 0.183445912609776, "epoch": 16.51020416208396, "img/sec/core": 189.69757206056573, "core_hours_Tesla V100-SXM2-32GB": 30.678116036502438, "core_hours": 30.678116036502438}
{"step": 20500, "global_schedule": 0.9738197326660156, "l2_grads": 0.8908922076225281, "l2_params": 331.1385803222656, "l2_updates": 0.9481408596038818, "training_loss": 5.379673480987549, "uptime": 8244.677398148982, "examples_seen": 20992000.0, "progress": 0.18389443562349184, "epoch": 16.550571409424016, "img/sec/core": 189.5514984226393, "core_hours_Tesla V100-SXM2-32GB": 30.753146950742487, "core_hours": 30.753146950742487}
{"step": 20550, "global_schedule": 0.9735720157623291, "l2_grads": 0.9288806915283203, "l2_params": 331.2849426269531, "l2_updates": 0.979770839214325, "training_loss": 4.697421550750732, "uptime": 8261.569332515006, "examples_seen": 21043200.0, "progress": 0.18434295863720768, "epoch": 16.590938656764077, "img/sec/core": 189.43952366026633, "core_hours_Tesla V100-SXM2-32GB": 30.828222214591484, "core_hours": 30.828222214591484}
{"step": 20600, "global_schedule": 0.9733231663703918, "l2_grads": 1.2934011220932007, "l2_params": 331.31500244140625, "l2_updates": 0.9950243830680847, "training_loss": 3.3033127784729004, "uptime": 8278.447392122005, "examples_seen": 21094400.0, "progress": 0.18479148165092352, "epoch": 16.631305904104135, "img/sec/core": 189.5952541056907, "core_hours_Tesla V100-SXM2-32GB": 30.903235812844812, "core_hours": 30.903235812844812}
{"step": 20650, "global_schedule": 0.9730731844902039, "l2_grads": 1.1899892091751099, "l2_params": 331.321533203125, "l2_updates": 1.031489372253418, "training_loss": 3.2144975662231445, "uptime": 8295.305724039965, "examples_seen": 21145600.0, "progress": 0.18524000466463933, "epoch": 16.671673151444192, "img/sec/core": 189.8171192483721, "core_hours_Tesla V100-SXM2-32GB": 30.97816173248019, "core_hours": 30.97816173248019}
{"step": 20700, "global_schedule": 0.9728220701217651, "l2_grads": 1.1803537607192993, "l2_params": 331.4386291503906, "l2_updates": 1.0932191610336304, "training_loss": 3.3262205123901367, "uptime": 8312.188925749972, "examples_seen": 21196800.0, "progress": 0.18568852767835517, "epoch": 16.712040398784254, "img/sec/core": 189.53750923341497, "core_hours_Tesla V100-SXM2-32GB": 31.053198184524664, "core_hours": 31.053198184524664}
{"step": 20750, "global_schedule": 0.9725698232650757, "l2_grads": 1.1021077632904053, "l2_params": 331.5697326660156, "l2_updates": 1.0502829551696777, "training_loss": 3.9798924922943115, "uptime": 8329.06450720696, "examples_seen": 21248000.0, "progress": 0.186137050692071, "epoch": 16.75240764612431, "img/sec/core": 189.6230958415245, "core_hours_Tesla V100-SXM2-32GB": 31.128200768777948, "core_hours": 31.128200768777948}
{"step": 20800, "global_schedule": 0.9723163843154907, "l2_grads": 0.9654091000556946, "l2_params": 331.6658630371094, "l2_updates": 1.019263744354248, "training_loss": 5.179737091064453, "uptime": 8345.959077163949, "examples_seen": 21299200.0, "progress": 0.18658557370578685, "epoch": 16.79277489346437, "img/sec/core": 189.4099706679007, "core_hours_Tesla V100-SXM2-32GB": 31.20328774636456, "core_hours": 31.20328774636456}
{"step": 20850, "global_schedule": 0.9720618724822998, "l2_grads": 1.2254829406738281, "l2_params": 331.7642822265625, "l2_updates": 1.0343778133392334, "training_loss": 3.378053903579712, "uptime": 8362.802873938985, "examples_seen": 21350400.0, "progress": 0.1870340967195027, "epoch": 16.833142140804426, "img/sec/core": 189.98091954794177, "core_hours_Tesla V100-SXM2-32GB": 31.278149065364723, "core_hours": 31.278149065364723}
{"step": 20900, "global_schedule": 0.9718061685562134, "l2_grads": 1.155852198600769, "l2_params": 331.83331298828125, "l2_updates": 1.073850393295288, "training_loss": 3.4327642917633057, "uptime": 8379.678239434958, "examples_seen": 21401600.0, "progress": 0.1874826197332185, "epoch": 16.873509388144488, "img/sec/core": 189.62552252652895, "core_hours_Tesla V100-SXM2-32GB": 31.353150689791267, "core_hours": 31.353150689791267}
{"step": 20950, "global_schedule": 0.971549391746521, "l2_grads": 1.3304646015167236, "l2_params": 331.877197265625, "l2_updates": 0.9961987137794495, "training_loss": 3.351799964904785, "uptime": 8396.862973429961, "examples_seen": 21452800.0, "progress": 0.18793114274693434, "epoch": 16.913876635484545, "img/sec/core": 186.2117854678684, "core_hours_Tesla V100-SXM2-32GB": 31.429527285324617, "core_hours": 31.429527285324617}
{"step": 21000, "global_schedule": 0.9712915420532227, "l2_grads": 1.1354421377182007, "l2_params": 331.89727783203125, "l2_updates": 0.9570313096046448, "training_loss": 4.204392433166504, "uptime": 8413.747416094993, "examples_seen": 21504000.0, "progress": 0.18837966576065018, "epoch": 16.954243882824603, "img/sec/core": 189.5235788047206, "core_hours_Tesla V100-SXM2-32GB": 31.50456925272476, "core_hours": 31.50456925272476}
{"step": 21050, "global_schedule": 0.971032440662384, "l2_grads": 1.268286943435669, "l2_params": 331.9740295410156, "l2_updates": 1.0195941925048828, "training_loss": 3.521914005279541, "uptime": 8431.174124301993, "examples_seen": 21555200.0, "progress": 0.18882818877436602, "epoch": 16.994611130164664, "img/sec/core": 189.6948949027566, "core_hours_Tesla V100-SXM2-32GB": 31.57954344868039, "core_hours": 31.57954344868039}
{"step": 21100, "global_schedule": 0.9707722663879395, "l2_grads": 1.3160128593444824, "l2_params": 332.0320739746094, "l2_updates": 1.0528961420059204, "training_loss": 3.3288776874542236, "uptime": 8448.051571628952, "examples_seen": 21606400.0, "progress": 0.18927671178808184, "epoch": 17.03497837750472, "img/sec/core": 189.60213224239092, "core_hours_Tesla V100-SXM2-32GB": 31.654554325689098, "core_hours": 31.654554325689098}
{"step": 21150, "global_schedule": 0.9705109596252441, "l2_grads": 1.2792729139328003, "l2_params": 332.0718994140625, "l2_updates": 1.08920419216156, "training_loss": 3.2472405433654785, "uptime": 8464.935543621948, "examples_seen": 21657600.0, "progress": 0.18972523480179768, "epoch": 17.07534562484478, "img/sec/core": 189.5288621260069, "core_hours_Tesla V100-SXM2-32GB": 31.729594201213523, "core_hours": 31.729594201213523}
{"step": 21200, "global_schedule": 0.9702485799789429, "l2_grads": 1.2067961692810059, "l2_params": 332.2117919921875, "l2_updates": 1.0248557329177856, "training_loss": 3.1971514225006104, "uptime": 8481.813752753951, "examples_seen": 21708800.0, "progress": 0.19017375781551352, "epoch": 17.115712872184837, "img/sec/core": 189.59357447067651, "core_hours_Tesla V100-SXM2-32GB": 31.804608464022426, "core_hours": 31.804608464022426}
{"step": 21250, "global_schedule": 0.9699850082397461, "l2_grads": 1.1849498748779297, "l2_params": 332.3231201171875, "l2_updates": 1.0520775318145752, "training_loss": 3.348665475845337, "uptime": 8498.692292088002, "examples_seen": 21760000.0, "progress": 0.19062228082922936, "epoch": 17.156080119524898, "img/sec/core": 189.58986537088649, "core_hours_Tesla V100-SXM2-32GB": 31.879624194395987, "core_hours": 31.879624194395987}
{"step": 21300, "global_schedule": 0.9697203040122986, "l2_grads": 1.305057168006897, "l2_params": 332.437255859375, "l2_updates": 1.039494514465332, "training_loss": 3.27629017829895, "uptime": 8515.572114434966, "examples_seen": 21811200.0, "progress": 0.19107080384294517, "epoch": 17.196447366864955, "img/sec/core": 189.57545489663084, "core_hours_Tesla V100-SXM2-32GB": 31.95464562704916, "core_hours": 31.95464562704916}
{"step": 21350, "global_schedule": 0.9694545269012451, "l2_grads": 1.0465291738510132, "l2_params": 332.47393798828125, "l2_updates": 1.0013471841812134, "training_loss": 4.855647087097168, "uptime": 8532.480782155995, "examples_seen": 21862400.0, "progress": 0.191519326856661, "epoch": 17.236814614205013, "img/sec/core": 189.2520482864677, "core_hours_Tesla V100-SXM2-32GB": 32.029795261364846, "core_hours": 32.029795261364846}
{"step": 21400, "global_schedule": 0.9691875576972961, "l2_grads": 1.2026407718658447, "l2_params": 332.5265197753906, "l2_updates": 1.0549973249435425, "training_loss": 3.4848437309265137, "uptime": 8549.341915194003, "examples_seen": 21913600.0, "progress": 0.19196784987037685, "epoch": 17.27718186154507, "img/sec/core": 189.78558515531589, "core_hours_Tesla V100-SXM2-32GB": 32.10473363042266, "core_hours": 32.10473363042266}
{"step": 21450, "global_schedule": 0.9689195156097412, "l2_grads": 1.113244891166687, "l2_params": 332.5435791015625, "l2_updates": 1.0743231773376465, "training_loss": 3.4352498054504395, "uptime": 8566.217082755, "examples_seen": 21964800.0, "progress": 0.1924163728840927, "epoch": 17.31754910888513, "img/sec/core": 189.62774671323254, "core_hours_Tesla V100-SXM2-32GB": 32.1797343751382, "core_hours": 32.1797343751382}
{"step": 21500, "global_schedule": 0.9686503410339355, "l2_grads": 1.2149666547775269, "l2_params": 332.6255187988281, "l2_updates": 1.0821346044540405, "training_loss": 3.2311787605285645, "uptime": 8583.090515193006, "examples_seen": 22016000.0, "progress": 0.19286489589780853, "epoch": 17.35791635622519, "img/sec/core": 189.6472464483471, "core_hours_Tesla V100-SXM2-32GB": 32.254727408196, "core_hours": 32.254727408196}
{"step": 21550, "global_schedule": 0.9683799743652344, "l2_grads": 1.2682154178619385, "l2_params": 332.71038818359375, "l2_updates": 0.9884124994277954, "training_loss": 3.164306402206421, "uptime": 8599.99070059997, "examples_seen": 22067200.0, "progress": 0.19331341891152434, "epoch": 17.398283603565247, "img/sec/core": 189.34703513259964, "core_hours_Tesla V100-SXM2-32GB": 32.329839343338065, "core_hours": 32.329839343338065}
{"step": 21600, "global_schedule": 0.9681085348129272, "l2_grads": 0.9501192569732666, "l2_params": 332.7623291015625, "l2_updates": 1.0490937232971191, "training_loss": 4.429393768310547, "uptime": 8616.858304349997, "examples_seen": 22118400.0, "progress": 0.19376194192524018, "epoch": 17.438650850905308, "img/sec/core": 189.71278003818455, "core_hours_Tesla V100-SXM2-32GB": 32.40480647111596, "core_hours": 32.40480647111596}
{"step": 21650, "global_schedule": 0.9678360223770142, "l2_grads": 1.2054803371429443, "l2_params": 332.8697204589844, "l2_updates": 1.0845893621444702, "training_loss": 3.279372453689575, "uptime": 8633.722558140988, "examples_seen": 22169600.0, "progress": 0.19421046493895602, "epoch": 17.479018098245366, "img/sec/core": 189.75046507598682, "core_hours_Tesla V100-SXM2-32GB": 32.479758710187035, "core_hours": 32.479758710187035}
{"step": 21700, "global_schedule": 0.9675623178482056, "l2_grads": 0.9041563868522644, "l2_params": 332.9295349121094, "l2_updates": 1.0294339656829834, "training_loss": 5.082696437835693, "uptime": 8650.607623132004, "examples_seen": 22220800.0, "progress": 0.19465898795267186, "epoch": 17.519385345585423, "img/sec/core": 189.5165936111315, "core_hours_Tesla V100-SXM2-32GB": 32.55480344348044, "core_hours": 32.55480344348044}
{"step": 21750, "global_schedule": 0.967287540435791, "l2_grads": 0.960595428943634, "l2_params": 332.9870300292969, "l2_updates": 1.0188137292861938, "training_loss": 5.079840183258057, "uptime": 8667.466019604006, "examples_seen": 22272000.0, "progress": 0.19510751096638768, "epoch": 17.55975259292548, "img/sec/core": 189.81639240211817, "core_hours_Tesla V100-SXM2-32GB": 32.62972965002267, "core_hours": 32.62972965002267}
{"step": 21800, "global_schedule": 0.9670116901397705, "l2_grads": 1.2525333166122437, "l2_params": 333.02191162109375, "l2_updates": 1.0702459812164307, "training_loss": 3.2152745723724365, "uptime": 8684.363000675978, "examples_seen": 22323200.0, "progress": 0.19555603398010352, "epoch": 17.600119840265542, "img/sec/core": 189.38294280911865, "core_hours_Tesla V100-SXM2-32GB": 32.70482734367587, "core_hours": 32.70482734367587}
{"step": 21850, "global_schedule": 0.9667346477508545, "l2_grads": 1.2842799425125122, "l2_params": 333.0994873046875, "l2_updates": 1.027325987815857, "training_loss": 3.3211379051208496, "uptime": 8701.233889297, "examples_seen": 22374400.0, "progress": 0.19600455699381936, "epoch": 17.6404870876056, "img/sec/core": 189.67584173441506, "core_hours_Tesla V100-SXM2-32GB": 32.77980907088042, "core_hours": 32.77980907088042}
{"step": 21900, "global_schedule": 0.9664564728736877, "l2_grads": 1.0125759840011597, "l2_params": 333.19305419921875, "l2_updates": 1.0106422901153564, "training_loss": 5.108524322509766, "uptime": 8718.118231592991, "examples_seen": 22425600.0, "progress": 0.1964530800075352, "epoch": 17.680854334945657, "img/sec/core": 189.52470542840416, "core_hours_Tesla V100-SXM2-32GB": 32.85485059219594, "core_hours": 32.85485059219594}
{"step": 21950, "global_schedule": 0.966177225112915, "l2_grads": 1.2603249549865723, "l2_params": 333.2590637207031, "l2_updates": 1.030788540840149, "training_loss": 3.065610885620117, "uptime": 8734.998773317959, "examples_seen": 22476800.0, "progress": 0.196901603021251, "epoch": 17.721221582285718, "img/sec/core": 189.5673759845589, "core_hours_Tesla V100-SXM2-32GB": 32.92987522208468, "core_hours": 32.92987522208468}
{"step": 22000, "global_schedule": 0.9658968448638916, "l2_grads": 1.1935659646987915, "l2_params": 333.3094177246094, "l2_updates": 1.073675513267517, "training_loss": 3.1981167793273926, "uptime": 8751.873945810948, "examples_seen": 22528000.0, "progress": 0.19735012603496685, "epoch": 17.761588829625776, "img/sec/core": 189.6276912920047, "core_hours_Tesla V100-SXM2-32GB": 33.004875988720194, "core_hours": 33.004875988720194}
{"step": 22050, "global_schedule": 0.9656153321266174, "l2_grads": 1.2449969053268433, "l2_params": 333.3214111328125, "l2_updates": 1.0279582738876343, "training_loss": 3.1388132572174072, "uptime": 8769.54958661599, "examples_seen": 22579200.0, "progress": 0.1977986490486827, "epoch": 17.801956076965833, "img/sec/core": 189.63144060642512, "core_hours_Tesla V100-SXM2-32GB": 33.07987527247156, "core_hours": 33.07987527247156}
{"step": 22100, "global_schedule": 0.9653327465057373, "l2_grads": 1.1590608358383179, "l2_params": 333.4339294433594, "l2_updates": 1.064681053161621, "training_loss": 3.205899238586426, "uptime": 8786.428111280955, "examples_seen": 22630400.0, "progress": 0.19824717206239853, "epoch": 17.84232332430589, "img/sec/core": 189.5900301430056, "core_hours_Tesla V100-SXM2-32GB": 33.15489093764918, "core_hours": 33.15489093764918}
{"step": 22150, "global_schedule": 0.9650489687919617, "l2_grads": 1.1841312646865845, "l2_params": 333.5155334472656, "l2_updates": 1.0669727325439453, "training_loss": 3.75819993019104, "uptime": 8803.29195829999, "examples_seen": 22681600.0, "progress": 0.19869569507611434, "epoch": 17.882690571645952, "img/sec/core": 189.75504203685668, "core_hours_Tesla V100-SXM2-32GB": 33.22984136884489, "core_hours": 33.22984136884489}
{"step": 22200, "global_schedule": 0.9647641181945801, "l2_grads": 1.167219877243042, "l2_params": 333.593017578125, "l2_updates": 1.0549342632293701, "training_loss": 3.66621732711792, "uptime": 8820.174402622972, "examples_seen": 22732800.0, "progress": 0.19914421808983018, "epoch": 17.92305781898601, "img/sec/core": 189.5460123415772, "core_hours_Tesla V100-SXM2-32GB": 33.30487445472481, "core_hours": 33.30487445472481}
{"step": 22250, "global_schedule": 0.9644781947135925, "l2_grads": 1.4251798391342163, "l2_params": 333.6697998046875, "l2_updates": 0.9700106382369995, "training_loss": 3.2498364448547363, "uptime": 8837.061638946005, "examples_seen": 22784000.0, "progress": 0.19959274110354602, "epoch": 17.963425066326067, "img/sec/core": 189.49222589106702, "core_hours_Tesla V100-SXM2-32GB": 33.37992883838273, "core_hours": 33.37992883838273}
{"step": 22300, "global_schedule": 0.9641910791397095, "l2_grads": 1.2056230306625366, "l2_params": 333.6922302246094, "l2_updates": 1.0284477472305298, "training_loss": 3.344372034072876, "uptime": 8853.936747336993, "examples_seen": 22835200.0, "progress": 0.20004126411726186, "epoch": 18.003792313666125, "img/sec/core": 189.62841161416605, "core_hours_Tesla V100-SXM2-32GB": 33.454929320120456, "core_hours": 33.454929320120456}
{"step": 22350, "global_schedule": 0.9639029502868652, "l2_grads": 1.127867341041565, "l2_params": 333.7472229003906, "l2_updates": 1.0658477544784546, "training_loss": 3.711822032928467, "uptime": 8870.812377260998, "examples_seen": 22886400.0, "progress": 0.2004897871309777, "epoch": 18.044159561006186, "img/sec/core": 189.62255124166535, "core_hours_Tesla V100-SXM2-32GB": 33.52993211978271, "core_hours": 33.52993211978271}
{"step": 22400, "global_schedule": 0.9636136293411255, "l2_grads": 0.915367066860199, "l2_params": 333.8324279785156, "l2_updates": 0.9751721024513245, "training_loss": 5.270962715148926, "uptime": 8887.691835708974, "examples_seen": 22937600.0, "progress": 0.20093831014469352, "epoch": 18.084526808346244, "img/sec/core": 189.57954189481794, "core_hours_Tesla V100-SXM2-32GB": 33.604951935107046, "core_hours": 33.604951935107046}
{"step": 22450, "global_schedule": 0.9633232355117798, "l2_grads": 1.3552402257919312, "l2_params": 333.8642883300781, "l2_updates": 1.0091255903244019, "training_loss": 3.09431791305542, "uptime": 8904.566301633953, "examples_seen": 22988800.0, "progress": 0.20138683315840936, "epoch": 18.1248940556863, "img/sec/core": 189.63563138689588, "core_hours_Tesla V100-SXM2-32GB": 33.67994956144028, "core_hours": 33.67994956144028}
{"step": 22500, "global_schedule": 0.9630317091941833, "l2_grads": 1.2273756265640259, "l2_params": 333.85443115234375, "l2_updates": 1.0553414821624756, "training_loss": 3.095228672027588, "uptime": 8921.448940592993, "examples_seen": 23040000.0, "progress": 0.2018353561721252, "epoch": 18.165261303026362, "img/sec/core": 189.54382710924614, "core_hours_Tesla V100-SXM2-32GB": 33.75498351236935, "core_hours": 33.75498351236935, "minival/prec@1": 0.5220106150483921, "minival/loss": 2.062638181840633, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.9149747460032813, "real/prec@1": 0.5666460277131328, "real/loss": 2.9676505514220195, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.136142922041472, "train/prec@1": 0.5465011903368068, "train/loss": 1.9613627402624165, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.559256314008962, "v2/prec@1": 0.3948, "v2/loss": 2.8218640380859377, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3544716269825585, "val/prec@1": 0.50144, "val/loss": 2.1795571484375, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.298040964000393}
{"step": 22550, "global_schedule": 0.962739109992981, "l2_grads": 1.282109022140503, "l2_params": 333.9458923339844, "l2_updates": 1.040485143661499, "training_loss": 3.1899588108062744, "uptime": 8974.631007741962, "examples_seen": 23091200.0, "progress": 0.20228387918584104, "epoch": 18.20562855036642, "img/sec/core": 189.1553360374259, "core_hours_Tesla V100-SXM2-32GB": 33.83017156955113, "core_hours": 33.83017156955113}
{"step": 22600, "global_schedule": 0.9624453783035278, "l2_grads": 0.8868632316589355, "l2_params": 334.0148010253906, "l2_updates": 0.971666693687439, "training_loss": 4.934667110443115, "uptime": 8991.494723110984, "examples_seen": 23142400.0, "progress": 0.20273240219955685, "epoch": 18.245995797706478, "img/sec/core": 189.7565233980626, "core_hours_Tesla V100-SXM2-32GB": 33.90512141563567, "core_hours": 33.90512141563567}
{"step": 22650, "global_schedule": 0.962150514125824, "l2_grads": 1.2704124450683594, "l2_params": 334.0224914550781, "l2_updates": 1.0333136320114136, "training_loss": 3.2938480377197266, "uptime": 9008.369356616982, "examples_seen": 23193600.0, "progress": 0.2031809252132727, "epoch": 18.286363045046535, "img/sec/core": 189.63374812628993, "core_hours_Tesla V100-SXM2-32GB": 33.98011978677344, "core_hours": 33.98011978677344}
{"step": 22700, "global_schedule": 0.9618545770645142, "l2_grads": 1.2410136461257935, "l2_params": 334.0605773925781, "l2_updates": 1.0461400747299194, "training_loss": 3.2574901580810547, "uptime": 9025.251512365998, "examples_seen": 23244800.0, "progress": 0.20362944822698853, "epoch": 18.326730292386596, "img/sec/core": 189.54925233328743, "core_hours_Tesla V100-SXM2-32GB": 34.055151590102405, "core_hours": 34.055151590102405}
{"step": 22750, "global_schedule": 0.9615575075149536, "l2_grads": 1.3934540748596191, "l2_params": 334.13128662109375, "l2_updates": 0.9786737561225891, "training_loss": 3.382855176925659, "uptime": 9042.13229671598, "examples_seen": 23296000.0, "progress": 0.20407797124070437, "epoch": 18.367097539726654, "img/sec/core": 189.5646513607331, "core_hours_Tesla V100-SXM2-32GB": 34.13017729832455, "core_hours": 34.13017729832455}
{"step": 22800, "global_schedule": 0.9612593650817871, "l2_grads": 0.9383063912391663, "l2_params": 334.1441650390625, "l2_updates": 1.0014022588729858, "training_loss": 5.37777042388916, "uptime": 9059.00522292999, "examples_seen": 23347200.0, "progress": 0.20452649425442018, "epoch": 18.40746478706671, "img/sec/core": 189.65293627270768, "core_hours_Tesla V100-SXM2-32GB": 34.20516808149793, "core_hours": 34.20516808149793}
{"step": 22850, "global_schedule": 0.9609600901603699, "l2_grads": 0.994763195514679, "l2_params": 334.177490234375, "l2_updates": 0.9926596283912659, "training_loss": 5.513468265533447, "uptime": 9075.892941606988, "examples_seen": 23398400.0, "progress": 0.20497501726813602, "epoch": 18.447832034406773, "img/sec/core": 189.4868135362053, "core_hours_Tesla V100-SXM2-32GB": 34.28022460895125, "core_hours": 34.28022460895125}
{"step": 22900, "global_schedule": 0.9606597423553467, "l2_grads": 1.272021770477295, "l2_params": 334.19171142578125, "l2_updates": 1.0356777906417847, "training_loss": 3.171654224395752, "uptime": 9092.760121594998, "examples_seen": 23449600.0, "progress": 0.20542354028185186, "epoch": 18.48819928174683, "img/sec/core": 189.71754628068547, "core_hours_Tesla V100-SXM2-32GB": 34.3551898533424, "core_hours": 34.3551898533424}
{"step": 22950, "global_schedule": 0.9603582620620728, "l2_grads": 1.3140192031860352, "l2_params": 334.2789306640625, "l2_updates": 1.036217212677002, "training_loss": 3.2939043045043945, "uptime": 9109.64036202099, "examples_seen": 23500800.0, "progress": 0.2058720632955677, "epoch": 18.528566529086888, "img/sec/core": 189.57075961268882, "core_hours_Tesla V100-SXM2-32GB": 34.430213144124586, "core_hours": 34.430213144124586}
{"step": 23000, "global_schedule": 0.9600556492805481, "l2_grads": 1.1447815895080566, "l2_params": 334.3304138183594, "l2_updates": 1.043591022491455, "training_loss": 3.4749929904937744, "uptime": 9126.515944714949, "examples_seen": 23552000.0, "progress": 0.20632058630928352, "epoch": 18.568933776426945, "img/sec/core": 189.62308194225506, "core_hours_Tesla V100-SXM2-32GB": 34.50521573387552, "core_hours": 34.50521573387552}
{"step": 23050, "global_schedule": 0.9597519636154175, "l2_grads": 0.9775564670562744, "l2_params": 334.3683166503906, "l2_updates": 1.0098998546600342, "training_loss": 5.026297569274902, "uptime": 9143.92779796297, "examples_seen": 23603200.0, "progress": 0.20676910932299936, "epoch": 18.609301023767006, "img/sec/core": 189.57038807998137, "core_hours_Tesla V100-SXM2-32GB": 34.580239171693364, "core_hours": 34.580239171693364}
{"step": 23100, "global_schedule": 0.9594472050666809, "l2_grads": 1.2877355813980103, "l2_params": 334.4027404785156, "l2_updates": 1.0323761701583862, "training_loss": 3.3518853187561035, "uptime": 9160.807155169954, "examples_seen": 23654400.0, "progress": 0.2072176323367152, "epoch": 18.649668271107064, "img/sec/core": 189.58067897727102, "core_hours_Tesla V100-SXM2-32GB": 34.65525853705774, "core_hours": 34.65525853705774}
{"step": 23150, "global_schedule": 0.9591413140296936, "l2_grads": 1.2948966026306152, "l2_params": 334.4476623535156, "l2_updates": 1.036719560623169, "training_loss": 3.6528351306915283, "uptime": 9177.693485345982, "examples_seen": 23705600.0, "progress": 0.20766615535043104, "epoch": 18.69003551844712, "img/sec/core": 189.50239434158829, "core_hours_Tesla V100-SXM2-32GB": 34.73030889339564, "core_hours": 34.73030889339564}
{"step": 23200, "global_schedule": 0.9588342905044556, "l2_grads": 1.4633525609970093, "l2_params": 334.4996337890625, "l2_updates": 0.990563154220581, "training_loss": 3.118171453475952, "uptime": 9194.576140586985, "examples_seen": 23756800.0, "progress": 0.20811467836414688, "epoch": 18.730402765787183, "img/sec/core": 189.54364430946745, "core_hours_Tesla V100-SXM2-32GB": 34.805342916688986, "core_hours": 34.805342916688986}
{"step": 23250, "global_schedule": 0.9585262537002563, "l2_grads": 1.3671786785125732, "l2_params": 334.5096435546875, "l2_updates": 1.0328447818756104, "training_loss": 3.0694854259490967, "uptime": 9211.46355997998, "examples_seen": 23808000.0, "progress": 0.2085632013778627, "epoch": 18.77077001312724, "img/sec/core": 189.49017167936063, "core_hours_Tesla V100-SXM2-32GB": 34.880398113991184, "core_hours": 34.880398113991184}
{"step": 23300, "global_schedule": 0.9582170248031616, "l2_grads": 0.9685074687004089, "l2_params": 334.5643310546875, "l2_updates": 1.0412989854812622, "training_loss": 4.217556476593018, "uptime": 9228.339208490972, "examples_seen": 23859200.0, "progress": 0.20901172439157853, "epoch": 18.811137260467298, "img/sec/core": 189.62234238973085, "core_hours_Tesla V100-SXM2-32GB": 34.955400996262256, "core_hours": 34.955400996262256}
{"step": 23350, "global_schedule": 0.9579067826271057, "l2_grads": 1.345914602279663, "l2_params": 334.6919250488281, "l2_updates": 1.0364307165145874, "training_loss": 3.35250186920166, "uptime": 9245.222094583965, "examples_seen": 23910400.0, "progress": 0.20946024740529437, "epoch": 18.851504507807356, "img/sec/core": 189.5410525412496, "core_hours_Tesla V100-SXM2-32GB": 35.03043604556445, "core_hours": 35.03043604556445}
{"step": 23400, "global_schedule": 0.9575954079627991, "l2_grads": 1.0427175760269165, "l2_params": 334.74041748046875, "l2_updates": 0.9865315556526184, "training_loss": 4.151738166809082, "uptime": 9262.104391682951, "examples_seen": 23961600.0, "progress": 0.2099087704190102, "epoch": 18.891871755147417, "img/sec/core": 189.5476652991864, "core_hours_Tesla V100-SXM2-32GB": 35.1054684771155, "core_hours": 35.1054684771155}
{"step": 23450, "global_schedule": 0.9572829008102417, "l2_grads": 0.9924672842025757, "l2_params": 334.7326354980469, "l2_updates": 0.9949367046356201, "training_loss": 5.6110992431640625, "uptime": 9278.988620436983, "examples_seen": 24012800.0, "progress": 0.21035729343272602, "epoch": 18.932239002487474, "img/sec/core": 189.5259799317658, "core_hours_Tesla V100-SXM2-32GB": 35.18050949380009, "core_hours": 35.18050949380009}
{"step": 23500, "global_schedule": 0.9569693803787231, "l2_grads": 1.0126638412475586, "l2_params": 334.71502685546875, "l2_updates": 1.0156519412994385, "training_loss": 5.384921073913574, "uptime": 9295.840216929966, "examples_seen": 24064000.0, "progress": 0.21080581644644186, "epoch": 18.972606249827532, "img/sec/core": 189.89298736962348, "core_hours_Tesla V100-SXM2-32GB": 35.25540547821334, "core_hours": 35.25540547821334}
{"step": 23550, "global_schedule": 0.9566546678543091, "l2_grads": 1.2345914840698242, "l2_params": 334.69525146484375, "l2_updates": 1.0430697202682495, "training_loss": 3.2577455043792725, "uptime": 9312.727294049982, "examples_seen": 24115200.0, "progress": 0.2112543394601577, "epoch": 19.01297349716759, "img/sec/core": 189.49401233011636, "core_hours_Tesla V100-SXM2-32GB": 35.330459154302304, "core_hours": 35.330459154302304}
{"step": 23600, "global_schedule": 0.9563389420509338, "l2_grads": 1.1642587184906006, "l2_params": 334.73590087890625, "l2_updates": 1.03694748878479, "training_loss": 3.222600221633911, "uptime": 9329.59951936896, "examples_seen": 24166400.0, "progress": 0.21170286247387354, "epoch": 19.05334074450765, "img/sec/core": 189.66081471190284, "core_hours_Tesla V100-SXM2-32GB": 35.40544682238665, "core_hours": 35.40544682238665}
{"step": 23650, "global_schedule": 0.9560220837593079, "l2_grads": 1.3159180879592896, "l2_params": 334.8535461425781, "l2_updates": 1.042339563369751, "training_loss": 3.224431037902832, "uptime": 9346.472128094989, "examples_seen": 24217600.0, "progress": 0.21215138548758936, "epoch": 19.093707991847708, "img/sec/core": 189.65650492821402, "core_hours_Tesla V100-SXM2-32GB": 35.48043619450233, "core_hours": 35.48043619450233}
{"step": 23700, "global_schedule": 0.9557041525840759, "l2_grads": 1.3030548095703125, "l2_params": 334.861083984375, "l2_updates": 1.0227015018463135, "training_loss": 3.056699752807617, "uptime": 9363.35882357898, "examples_seen": 24268800.0, "progress": 0.2125999085013052, "epoch": 19.134075239187766, "img/sec/core": 189.49829485785284, "core_hours_Tesla V100-SXM2-32GB": 35.55548817443118, "core_hours": 35.55548817443118}
{"step": 23750, "global_schedule": 0.9553850889205933, "l2_grads": 1.1632834672927856, "l2_params": 334.9471740722656, "l2_updates": 1.0159940719604492, "training_loss": 3.372612476348877, "uptime": 9380.256656133977, "examples_seen": 24320000.0, "progress": 0.21304843151502104, "epoch": 19.174442486527827, "img/sec/core": 189.37339978869272, "core_hours_Tesla V100-SXM2-32GB": 35.630589652453395, "core_hours": 35.630589652453395}
{"step": 23800, "global_schedule": 0.9550650119781494, "l2_grads": 0.8633044958114624, "l2_params": 334.98956298828125, "l2_updates": 0.9864528775215149, "training_loss": 5.239388465881348, "uptime": 9397.121289514005, "examples_seen": 24371200.0, "progress": 0.21349695452873688, "epoch": 19.214809733867884, "img/sec/core": 189.7461941739937, "core_hours_Tesla V100-SXM2-32GB": 35.70554357858685, "core_hours": 35.70554357858685}
{"step": 23850, "global_schedule": 0.9547437429428101, "l2_grads": 1.1120986938476562, "l2_params": 335.02392578125, "l2_updates": 1.0168075561523438, "training_loss": 3.2577743530273438, "uptime": 9414.001485081972, "examples_seen": 24422400.0, "progress": 0.21394547754245272, "epoch": 19.255176981207942, "img/sec/core": 189.57126338468748, "core_hours_Tesla V100-SXM2-32GB": 35.780566670000034, "core_hours": 35.780566670000034}
{"step": 23900, "global_schedule": 0.9544214606285095, "l2_grads": 1.1505526304244995, "l2_params": 335.0934753417969, "l2_updates": 1.0213799476623535, "training_loss": 3.489014148712158, "uptime": 9430.890768549987, "examples_seen": 24473600.0, "progress": 0.21439400055616853, "epoch": 19.295544228548, "img/sec/core": 189.46925759521304, "core_hours_Tesla V100-SXM2-32GB": 35.85563015208011, "core_hours": 35.85563015208011}
{"step": 23950, "global_schedule": 0.954098105430603, "l2_grads": 1.347083330154419, "l2_params": 335.1778259277344, "l2_updates": 1.0061190128326416, "training_loss": 3.1832895278930664, "uptime": 9447.75662184495, "examples_seen": 24524800.0, "progress": 0.21484252356988437, "epoch": 19.33591147588806, "img/sec/core": 189.73246974439647, "core_hours_Tesla V100-SXM2-32GB": 35.93058950005772, "core_hours": 35.93058950005772}
{"step": 24000, "global_schedule": 0.9537736177444458, "l2_grads": 1.0519862174987793, "l2_params": 335.2279968261719, "l2_updates": 1.042533278465271, "training_loss": 3.8619914054870605, "uptime": 9464.639732185984, "examples_seen": 24576000.0, "progress": 0.2152910465836002, "epoch": 19.37627872322812, "img/sec/core": 189.5385349832427, "core_hours_Tesla V100-SXM2-32GB": 36.00562554601787, "core_hours": 36.00562554601787}
{"step": 24050, "global_schedule": 0.9534479975700378, "l2_grads": 1.2375534772872925, "l2_params": 335.2485656738281, "l2_updates": 1.0162968635559082, "training_loss": 3.2757699489593506, "uptime": 9482.063247173966, "examples_seen": 24627200.0, "progress": 0.21573956959731605, "epoch": 19.416645970568176, "img/sec/core": 189.7694602699685, "core_hours_Tesla V100-SXM2-32GB": 36.08057028265773, "core_hours": 36.08057028265773}
{"step": 24100, "global_schedule": 0.9531213641166687, "l2_grads": 1.003920316696167, "l2_params": 335.2620849609375, "l2_updates": 1.0108171701431274, "training_loss": 4.470340728759766, "uptime": 9498.939805884962, "examples_seen": 24678400.0, "progress": 0.21618809261103186, "epoch": 19.457013217908237, "img/sec/core": 189.6121155265559, "core_hours_Tesla V100-SXM2-32GB": 36.15557721026216, "core_hours": 36.15557721026216}
{"step": 24150, "global_schedule": 0.9527935981750488, "l2_grads": 1.2418559789657593, "l2_params": 335.3298034667969, "l2_updates": 1.0108158588409424, "training_loss": 3.080028772354126, "uptime": 9515.827504986955, "examples_seen": 24729600.0, "progress": 0.2166366156247477, "epoch": 19.497380465248295, "img/sec/core": 189.48703317566134, "core_hours_Tesla V100-SXM2-32GB": 36.23063365071547, "core_hours": 36.23063365071547}
{"step": 24200, "global_schedule": 0.9524648189544678, "l2_grads": 1.0803518295288086, "l2_params": 335.3504638671875, "l2_updates": 1.0294708013534546, "training_loss": 4.342265605926514, "uptime": 9532.709782703954, "examples_seen": 24780800.0, "progress": 0.21708513863846354, "epoch": 19.537747712588352, "img/sec/core": 189.5478829126171, "core_hours_Tesla V100-SXM2-32GB": 36.30566599612435, "core_hours": 36.30566599612435}
{"step": 24250, "global_schedule": 0.9521348476409912, "l2_grads": 1.0616477727890015, "l2_params": 335.3358154296875, "l2_updates": 1.0010769367218018, "training_loss": 4.904690742492676, "uptime": 9549.572815916967, "examples_seen": 24832000.0, "progress": 0.21753366165217938, "epoch": 19.57811495992841, "img/sec/core": 189.7641995706155, "core_hours_Tesla V100-SXM2-32GB": 36.3806128104044, "core_hours": 36.3806128104044}
{"step": 24300, "global_schedule": 0.9518038630485535, "l2_grads": 1.1939313411712646, "l2_params": 335.4352111816406, "l2_updates": 1.0065264701843262, "training_loss": 3.5215811729431152, "uptime": 9566.454752585967, "examples_seen": 24883200.0, "progress": 0.2179821846658952, "epoch": 19.61848220726847, "img/sec/core": 189.55171214899903, "core_hours_Tesla V100-SXM2-32GB": 36.45564364004441, "core_hours": 36.45564364004441}
{"step": 24350, "global_schedule": 0.9514718055725098, "l2_grads": 1.2378709316253662, "l2_params": 335.43475341796875, "l2_updates": 1.0306586027145386, "training_loss": 3.3760745525360107, "uptime": 9583.341093077965, "examples_seen": 24934400.0, "progress": 0.21843070767961104, "epoch": 19.65884945460853, "img/sec/core": 189.50227857341167, "core_hours_Tesla V100-SXM2-32GB": 36.53069404223106, "core_hours": 36.53069404223106}
{"step": 24400, "global_schedule": 0.9511386156082153, "l2_grads": 1.319308876991272, "l2_params": 335.4329833984375, "l2_updates": 1.0207682847976685, "training_loss": 3.2639594078063965, "uptime": 9600.228704535984, "examples_seen": 24985600.0, "progress": 0.21887923069332688, "epoch": 19.699216701948586, "img/sec/core": 189.48801658273234, "core_hours_Tesla V100-SXM2-32GB": 36.60575009315559, "core_hours": 36.60575009315559}
{"step": 24450, "global_schedule": 0.9508044123649597, "l2_grads": 1.1978811025619507, "l2_params": 335.48016357421875, "l2_updates": 1.027775764465332, "training_loss": 3.1666488647460938, "uptime": 9617.10201370297, "examples_seen": 25036800.0, "progress": 0.21932775370704272, "epoch": 19.739583949288644, "img/sec/core": 189.64863195069896, "core_hours_Tesla V100-SXM2-32GB": 36.6807425783422, "core_hours": 36.6807425783422}
{"step": 24500, "global_schedule": 0.9504690766334534, "l2_grads": 1.3120042085647583, "l2_params": 335.4898376464844, "l2_updates": 0.9584518074989319, "training_loss": 3.4701108932495117, "uptime": 9633.99663193, "examples_seen": 25088000.0, "progress": 0.21977627672075853, "epoch": 19.779951196628705, "img/sec/core": 189.40942949987675, "core_hours_Tesla V100-SXM2-32GB": 36.75582977046233, "core_hours": 36.75582977046233}
{"step": 24550, "global_schedule": 0.9501326680183411, "l2_grads": 1.3077410459518433, "l2_params": 335.4591064453125, "l2_updates": 1.0319554805755615, "training_loss": 3.0901989936828613, "uptime": 9650.872064488998, "examples_seen": 25139200.0, "progress": 0.22022479973447437, "epoch": 19.820318443968763, "img/sec/core": 189.62476895407082, "core_hours_Tesla V100-SXM2-32GB": 36.83083169294676, "core_hours": 36.83083169294676}
{"step": 24600, "global_schedule": 0.9497952461242676, "l2_grads": 1.3480613231658936, "l2_params": 335.4984436035156, "l2_updates": 0.9800628423690796, "training_loss": 3.083993434906006, "uptime": 9667.770005715953, "examples_seen": 25190400.0, "progress": 0.2206733227481902, "epoch": 19.86068569130882, "img/sec/core": 189.37218191382712, "core_hours_Tesla V100-SXM2-32GB": 36.90593365395545, "core_hours": 36.90593365395545}
{"step": 24650, "global_schedule": 0.9494566917419434, "l2_grads": 1.177432894706726, "l2_params": 335.5299072265625, "l2_updates": 1.0469239950180054, "training_loss": 2.99583101272583, "uptime": 9684.65074428398, "examples_seen": 25241600.0, "progress": 0.22112184576190605, "epoch": 19.90105293864888, "img/sec/core": 189.5651654757007, "core_hours_Tesla V100-SXM2-32GB": 36.98095915870224, "core_hours": 36.98095915870224}
{"step": 24700, "global_schedule": 0.9491170048713684, "l2_grads": 1.2608834505081177, "l2_params": 335.5284118652344, "l2_updates": 0.9972837567329407, "training_loss": 3.205829620361328, "uptime": 9701.549374592956, "examples_seen": 25292800.0, "progress": 0.2215703687756219, "epoch": 19.94142018598894, "img/sec/core": 189.36445981069255, "core_hours_Tesla V100-SXM2-32GB": 37.05606418229768, "core_hours": 37.05606418229768}
{"step": 24750, "global_schedule": 0.9487763047218323, "l2_grads": 0.971989095211029, "l2_params": 335.587890625, "l2_updates": 0.9604839086532593, "training_loss": 4.813544750213623, "uptime": 9718.430800290953, "examples_seen": 25344000.0, "progress": 0.2220188917893377, "epoch": 19.981787433328996, "img/sec/core": 189.55744954525562, "core_hours_Tesla V100-SXM2-32GB": 37.13109274095545, "core_hours": 37.13109274095545}
{"step": 24800, "global_schedule": 0.9484345316886902, "l2_grads": 1.258536458015442, "l2_params": 335.5995788574219, "l2_updates": 0.9801104664802551, "training_loss": 3.0958287715911865, "uptime": 9735.30585048796, "examples_seen": 25395200.0, "progress": 0.22246741480305354, "epoch": 20.022154680669054, "img/sec/core": 189.62906555191825, "core_hours_Tesla V100-SXM2-32GB": 37.206092964053255, "core_hours": 37.206092964053255}
{"step": 24850, "global_schedule": 0.9480916261672974, "l2_grads": 1.2087267637252808, "l2_params": 335.628662109375, "l2_updates": 1.0221844911575317, "training_loss": 3.1709461212158203, "uptime": 9752.167916137958, "examples_seen": 25446400.0, "progress": 0.22291593781676938, "epoch": 20.062521928009115, "img/sec/core": 189.77508843942974, "core_hours_Tesla V100-SXM2-32GB": 37.281035478053255, "core_hours": 37.281035478053255}
{"step": 24900, "global_schedule": 0.9477477073669434, "l2_grads": 1.2542946338653564, "l2_params": 335.5890808105469, "l2_updates": 1.001122236251831, "training_loss": 3.2467594146728516, "uptime": 9769.0517902, "examples_seen": 25497600.0, "progress": 0.22336446083048522, "epoch": 20.102889175349173, "img/sec/core": 189.52996144376093, "core_hours_Tesla V100-SXM2-32GB": 37.35607491832899, "core_hours": 37.35607491832899}
{"step": 24950, "global_schedule": 0.9474027156829834, "l2_grads": 1.216722846031189, "l2_params": 335.6119079589844, "l2_updates": 1.0427520275115967, "training_loss": 3.2847914695739746, "uptime": 9785.91258951195, "examples_seen": 25548800.0, "progress": 0.22381298384420104, "epoch": 20.14325642268923, "img/sec/core": 189.78934158428518, "core_hours_Tesla V100-SXM2-32GB": 37.43101180415989, "core_hours": 37.43101180415989}
{"step": 25000, "global_schedule": 0.9470566511154175, "l2_grads": 1.090158224105835, "l2_params": 335.64605712890625, "l2_updates": 1.0226902961730957, "training_loss": 3.6560072898864746, "uptime": 9802.81159338099, "examples_seen": 25600000.0, "progress": 0.22426150685791688, "epoch": 20.18362367002929, "img/sec/core": 189.3602738243514, "core_hours_Tesla V100-SXM2-32GB": 37.50611848802228, "core_hours": 37.50611848802228, "minival/prec@1": 0.5533093974399, "minival/loss": 1.9446644468900005, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.8896285980008543, "real/prec@1": 0.5902811879496979, "real/loss": 2.848219659862595, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.145757251011673, "train/prec@1": 0.5678491979861843, "train/loss": 1.848510165211375, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.601830661995336, "v2/prec@1": 0.4098, "v2/loss": 2.7585819580078126, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3605064230505377, "val/prec@1": 0.52238, "val/loss": 2.08307994140625, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.306730156007688}
{"step": 25050, "global_schedule": 0.9467095136642456, "l2_grads": 1.127886414527893, "l2_params": 335.7013854980469, "l2_updates": 1.0050708055496216, "training_loss": 4.14879035949707, "uptime": 9856.607697942993, "examples_seen": 25651200.0, "progress": 0.22471002987163272, "epoch": 20.22399091736935, "img/sec/core": 189.07541779270514, "core_hours_Tesla V100-SXM2-32GB": 37.581338325631286, "core_hours": 37.581338325631286}
{"step": 25100, "global_schedule": 0.9463613033294678, "l2_grads": 1.0393569469451904, "l2_params": 335.73199462890625, "l2_updates": 0.9900184273719788, "training_loss": 5.370837211608887, "uptime": 9873.493829962972, "examples_seen": 25702400.0, "progress": 0.22515855288534856, "epoch": 20.264358164709407, "img/sec/core": 189.5046181217705, "core_hours_Tesla V100-SXM2-32GB": 37.65638780127564, "core_hours": 37.65638780127564}
{"step": 25150, "global_schedule": 0.946012020111084, "l2_grads": 1.185085654258728, "l2_params": 335.7388610839844, "l2_updates": 0.9518360495567322, "training_loss": 4.444843769073486, "uptime": 9890.37596032297, "examples_seen": 25753600.0, "progress": 0.22560707589906437, "epoch": 20.304725412049464, "img/sec/core": 189.54953739620242, "core_hours_Tesla V100-SXM2-32GB": 37.73141949176452, "core_hours": 37.73141949176452}
{"step": 25200, "global_schedule": 0.9456616640090942, "l2_grads": 1.3268890380859375, "l2_params": 335.74005126953125, "l2_updates": 1.0436903238296509, "training_loss": 2.9848761558532715, "uptime": 9907.249072713952, "examples_seen": 25804800.0, "progress": 0.2260555989127802, "epoch": 20.345092659389525, "img/sec/core": 189.6508436529039, "core_hours_Tesla V100-SXM2-32GB": 37.8064111023911, "core_hours": 37.8064111023911}
{"step": 25250, "global_schedule": 0.9453102350234985, "l2_grads": 1.0318195819854736, "l2_params": 335.7805480957031, "l2_updates": 0.98984694480896, "training_loss": 5.246224403381348, "uptime": 9924.112265575968, "examples_seen": 25856000.0, "progress": 0.22650412192649605, "epoch": 20.385459906729583, "img/sec/core": 189.7624030149063, "core_hours_Tesla V100-SXM2-32GB": 37.881358626222294, "core_hours": 37.881358626222294}
{"step": 25300, "global_schedule": 0.9449577331542969, "l2_grads": 1.4181926250457764, "l2_params": 335.767578125, "l2_updates": 0.9946083426475525, "training_loss": 3.0623834133148193, "uptime": 9940.986133515951, "examples_seen": 25907200.0, "progress": 0.2269526449402119, "epoch": 20.42582715406964, "img/sec/core": 189.64235179401425, "core_hours_Tesla V100-SXM2-32GB": 37.95635359484444, "core_hours": 37.95635359484444}
{"step": 25350, "global_schedule": 0.9446041584014893, "l2_grads": 1.2776659727096558, "l2_params": 335.7889099121094, "l2_updates": 1.0278934240341187, "training_loss": 2.961350917816162, "uptime": 9957.85305294895, "examples_seen": 25958400.0, "progress": 0.22740116795392773, "epoch": 20.4661944014097, "img/sec/core": 189.72047697929395, "core_hours_Tesla V100-SXM2-32GB": 38.031317681213324, "core_hours": 38.031317681213324}
{"step": 25400, "global_schedule": 0.9442495107650757, "l2_grads": 1.4704320430755615, "l2_params": 335.79876708984375, "l2_updates": 0.9714903831481934, "training_loss": 3.307434558868408, "uptime": 9974.712568685005, "examples_seen": 26009600.0, "progress": 0.22784969096764354, "epoch": 20.50656164874976, "img/sec/core": 189.8037909331395, "core_hours_Tesla V100-SXM2-32GB": 38.106248862262454, "core_hours": 38.106248862262454}
{"step": 25450, "global_schedule": 0.9438937902450562, "l2_grads": 1.3259704113006592, "l2_params": 335.8563232421875, "l2_updates": 0.9994152784347534, "training_loss": 3.127065658569336, "uptime": 9991.59623586398, "examples_seen": 26060800.0, "progress": 0.22829821398135938, "epoch": 20.546928896089817, "img/sec/core": 189.5322838384749, "core_hours_Tesla V100-SXM2-32GB": 38.1812873830579, "core_hours": 38.1812873830579}
{"step": 25500, "global_schedule": 0.9435371160507202, "l2_grads": 0.9381786584854126, "l2_params": 335.8346862792969, "l2_updates": 1.0071715116500854, "training_loss": 4.102085113525391, "uptime": 10008.455152941984, "examples_seen": 26112000.0, "progress": 0.22874673699507522, "epoch": 20.587296143429874, "img/sec/core": 189.8105308421742, "core_hours_Tesla V100-SXM2-32GB": 38.25621590340459, "core_hours": 38.25621590340459}
{"step": 25550, "global_schedule": 0.9431792497634888, "l2_grads": 1.0369826555252075, "l2_params": 335.8863220214844, "l2_updates": 1.039552092552185, "training_loss": 4.535545349121094, "uptime": 10025.338263195998, "examples_seen": 26163200.0, "progress": 0.22919526000879106, "epoch": 20.627663390769936, "img/sec/core": 189.53853596017933, "core_hours_Tesla V100-SXM2-32GB": 38.33125194897798, "core_hours": 38.33125194897798}
{"step": 25600, "global_schedule": 0.9428204298019409, "l2_grads": 1.122283935546875, "l2_params": 335.9165954589844, "l2_updates": 1.0344903469085693, "training_loss": 3.902024507522583, "uptime": 10042.221354259993, "examples_seen": 26214400.0, "progress": 0.22964378302250688, "epoch": 20.668030638109993, "img/sec/core": 189.53875139750153, "core_hours_Tesla V100-SXM2-32GB": 38.406287909262396, "core_hours": 38.406287909262396}
{"step": 25650, "global_schedule": 0.9424604177474976, "l2_grads": 1.302212119102478, "l2_params": 335.9421691894531, "l2_updates": 1.020023226737976, "training_loss": 3.058469772338867, "uptime": 10059.113531466981, "examples_seen": 26265600.0, "progress": 0.23009230603622272, "epoch": 20.70839788545005, "img/sec/core": 189.43680028861047, "core_hours_Tesla V100-SXM2-32GB": 38.48136425240457, "core_hours": 38.48136425240457}
{"step": 25700, "global_schedule": 0.9420994520187378, "l2_grads": 1.1970508098602295, "l2_params": 335.9669189453125, "l2_updates": 1.0051844120025635, "training_loss": 2.955056667327881, "uptime": 10076.000913302996, "examples_seen": 26316800.0, "progress": 0.23054082904993856, "epoch": 20.74876513279011, "img/sec/core": 189.49059309924797, "core_hours_Tesla V100-SXM2-32GB": 38.556419282786855, "core_hours": 38.556419282786855}
{"step": 25750, "global_schedule": 0.9417374134063721, "l2_grads": 1.325107455253601, "l2_params": 335.9363708496094, "l2_updates": 1.0089668035507202, "training_loss": 3.2375104427337646, "uptime": 10092.90836373798, "examples_seen": 26368000.0, "progress": 0.2309893520636544, "epoch": 20.78913238013017, "img/sec/core": 189.2656738699413, "core_hours_Tesla V100-SXM2-32GB": 38.63156350694235, "core_hours": 38.63156350694235}
{"step": 25800, "global_schedule": 0.9413743019104004, "l2_grads": 1.1183282136917114, "l2_params": 335.93035888671875, "l2_updates": 1.0144740343093872, "training_loss": 3.5834789276123047, "uptime": 10109.800104848982, "examples_seen": 26419200.0, "progress": 0.2314378750773702, "epoch": 20.829499627470227, "img/sec/core": 189.4416909998617, "core_hours_Tesla V100-SXM2-32GB": 38.70663791188013, "core_hours": 38.70663791188013}
{"step": 25850, "global_schedule": 0.9410101175308228, "l2_grads": 1.294211745262146, "l2_params": 335.95257568359375, "l2_updates": 1.0051883459091187, "training_loss": 3.0145442485809326, "uptime": 10126.68216370995, "examples_seen": 26470400.0, "progress": 0.23188639809108605, "epoch": 20.869866874810285, "img/sec/core": 189.5503401779229, "core_hours_Tesla V100-SXM2-32GB": 38.78166928459554, "core_hours": 38.78166928459554}
{"step": 25900, "global_schedule": 0.9406448602676392, "l2_grads": 1.3498765230178833, "l2_params": 335.94561767578125, "l2_updates": 1.0223963260650635, "training_loss": 3.116929054260254, "uptime": 10143.584356706997, "examples_seen": 26521600.0, "progress": 0.2323349211048019, "epoch": 20.910234122150346, "img/sec/core": 189.32454507879226, "core_hours_Tesla V100-SXM2-32GB": 38.8567901423602, "core_hours": 38.8567901423602}
{"step": 25950, "global_schedule": 0.9402785897254944, "l2_grads": 1.354471206665039, "l2_params": 335.9509582519531, "l2_updates": 0.9729385375976562, "training_loss": 3.134902000427246, "uptime": 10160.462048542977, "examples_seen": 26572800.0, "progress": 0.23278344411851773, "epoch": 20.950601369490403, "img/sec/core": 189.59938545496055, "core_hours_Tesla V100-SXM2-32GB": 38.931802106075665, "core_hours": 38.931802106075665}
{"step": 26000, "global_schedule": 0.9399112462997437, "l2_grads": 1.2104169130325317, "l2_params": 335.9245300292969, "l2_updates": 1.0273555517196655, "training_loss": 3.4131667613983154, "uptime": 10177.348526665999, "examples_seen": 26624000.0, "progress": 0.23323196713223354, "epoch": 20.99096861683046, "img/sec/core": 189.5007340599499, "core_hours_Tesla V100-SXM2-32GB": 39.00685311995576, "core_hours": 39.00685311995576}
{"step": 26050, "global_schedule": 0.9395428895950317, "l2_grads": 1.348163366317749, "l2_params": 335.9399719238281, "l2_updates": 1.012816071510315, "training_loss": 3.6048285961151123, "uptime": 10195.159258712956, "examples_seen": 26675200.0, "progress": 0.23368049014594938, "epoch": 21.03133586417052, "img/sec/core": 189.2991776553524, "core_hours_Tesla V100-SXM2-32GB": 39.08198404444459, "core_hours": 39.08198404444459}
{"step": 26100, "global_schedule": 0.9391734004020691, "l2_grads": 1.2969143390655518, "l2_params": 335.9765625, "l2_updates": 1.0013171434402466, "training_loss": 3.161694049835205, "uptime": 10212.046888762969, "examples_seen": 26726400.0, "progress": 0.23412901315966522, "epoch": 21.07170311151058, "img/sec/core": 189.48780797087954, "core_hours_Tesla V100-SXM2-32GB": 39.1570401780002, "core_hours": 39.1570401780002}
{"step": 26150, "global_schedule": 0.9388028979301453, "l2_grads": 1.4555916786193848, "l2_params": 335.9682922363281, "l2_updates": 0.9414694309234619, "training_loss": 3.0243470668792725, "uptime": 10228.957272487984, "examples_seen": 26777600.0, "progress": 0.23457753617338106, "epoch": 21.112070358850637, "img/sec/core": 189.2328436797294, "core_hours_Tesla V100-SXM2-32GB": 39.232197439000274, "core_hours": 39.232197439000274}
{"step": 26200, "global_schedule": 0.9384313821792603, "l2_grads": 1.0297726392745972, "l2_params": 335.95257568359375, "l2_updates": 1.0177245140075684, "training_loss": 5.450806617736816, "uptime": 10245.856966699997, "examples_seen": 26828800.0, "progress": 0.2350260591870969, "epoch": 21.152437606190695, "img/sec/core": 189.35253856399046, "core_hours_Tesla V100-SXM2-32GB": 39.30730719105366, "core_hours": 39.30730719105366}
{"step": 26250, "global_schedule": 0.9380587339401245, "l2_grads": 1.1360211372375488, "l2_params": 335.9849853515625, "l2_updates": 1.040415644645691, "training_loss": 3.5900301933288574, "uptime": 10262.740440619993, "examples_seen": 26880000.0, "progress": 0.23547458220081272, "epoch": 21.192804853530756, "img/sec/core": 189.53445334553726, "core_hours_Tesla V100-SXM2-32GB": 39.382344852920305, "core_hours": 39.382344852920305}
{"step": 26300, "global_schedule": 0.9376851320266724, "l2_grads": 1.231819987297058, "l2_params": 336.00640869140625, "l2_updates": 1.0185900926589966, "training_loss": 2.9971673488616943, "uptime": 10279.623346813954, "examples_seen": 26931200.0, "progress": 0.23592310521452856, "epoch": 21.233172100870814, "img/sec/core": 189.54082687165337, "core_hours_Tesla V100-SXM2-32GB": 39.45737999156014, "core_hours": 39.45737999156014}
{"step": 26350, "global_schedule": 0.9373103976249695, "l2_grads": 1.2219820022583008, "l2_params": 336.00421142578125, "l2_updates": 0.9577328562736511, "training_loss": 5.365494251251221, "uptime": 10296.522955383989, "examples_seen": 26982400.0, "progress": 0.2363716282282444, "epoch": 21.27353934821087, "img/sec/core": 189.35349814397773, "core_hours_Tesla V100-SXM2-32GB": 39.53248936298251, "core_hours": 39.53248936298251}
{"step": 26400, "global_schedule": 0.9369346499443054, "l2_grads": 1.3372703790664673, "l2_params": 336.0323791503906, "l2_updates": 1.0180314779281616, "training_loss": 3.0238914489746094, "uptime": 10313.404222477984, "examples_seen": 27033600.0, "progress": 0.23682015124196024, "epoch": 21.31390659555093, "img/sec/core": 189.55923048799343, "core_hours_Tesla V100-SXM2-32GB": 39.607517216733605, "core_hours": 39.607517216733605}
{"step": 26450, "global_schedule": 0.9365578889846802, "l2_grads": 1.1327582597732544, "l2_params": 336.05535888671875, "l2_updates": 1.0073522329330444, "training_loss": 3.104274272918701, "uptime": 10330.284432985005, "examples_seen": 27084800.0, "progress": 0.23726867425567605, "epoch": 21.35427384289099, "img/sec/core": 189.5710956133548, "core_hours_Tesla V100-SXM2-32GB": 39.68254037454258, "core_hours": 39.68254037454258}
{"step": 26500, "global_schedule": 0.9361799955368042, "l2_grads": 1.1428813934326172, "l2_params": 336.08966064453125, "l2_updates": 1.0327413082122803, "training_loss": 3.9426069259643555, "uptime": 10347.175543300982, "examples_seen": 27136000.0, "progress": 0.2377171972693919, "epoch": 21.394641090231048, "img/sec/core": 189.44876566066546, "core_hours_Tesla V100-SXM2-32GB": 39.75761197594693, "core_hours": 39.75761197594693}
{"step": 26550, "global_schedule": 0.9358011484146118, "l2_grads": 1.31242835521698, "l2_params": 336.1376953125, "l2_updates": 0.9929749369621277, "training_loss": 3.0179452896118164, "uptime": 10364.06853147695, "examples_seen": 27187200.0, "progress": 0.23816572028310773, "epoch": 21.435008337571105, "img/sec/core": 189.42770613858627, "core_hours_Tesla V100-SXM2-32GB": 39.83269192339568, "core_hours": 39.83269192339568}
{"step": 26600, "global_schedule": 0.9354212284088135, "l2_grads": 1.0983599424362183, "l2_params": 336.1882019042969, "l2_updates": 0.9971152544021606, "training_loss": 4.26173734664917, "uptime": 10380.954524782952, "examples_seen": 27238400.0, "progress": 0.23861424329682357, "epoch": 21.475375584911163, "img/sec/core": 189.50617485219178, "core_hours_Tesla V100-SXM2-32GB": 39.90774078253346, "core_hours": 39.90774078253346}
{"step": 26650, "global_schedule": 0.9350402355194092, "l2_grads": 1.3725069761276245, "l2_params": 336.17254638671875, "l2_updates": 0.9941755533218384, "training_loss": 3.0120973587036133, "uptime": 10397.840159841988, "examples_seen": 27289600.0, "progress": 0.23906276631053938, "epoch": 21.515742832251224, "img/sec/core": 189.5101954301455, "core_hours_Tesla V100-SXM2-32GB": 39.98278804946251, "core_hours": 39.98278804946251}
{"step": 26700, "global_schedule": 0.9346581697463989, "l2_grads": 1.1208105087280273, "l2_params": 336.1680603027344, "l2_updates": 0.9976984858512878, "training_loss": 3.2878222465515137, "uptime": 10414.716473670967, "examples_seen": 27340800.0, "progress": 0.23951128932425522, "epoch": 21.55611007959128, "img/sec/core": 189.6148668736554, "core_hours_Tesla V100-SXM2-32GB": 40.05779388870242, "core_hours": 40.05779388870242}
{"step": 26750, "global_schedule": 0.9342751502990723, "l2_grads": 1.2988337278366089, "l2_params": 336.1513977050781, "l2_updates": 1.0221441984176636, "training_loss": 3.1418368816375732, "uptime": 10431.591738245974, "examples_seen": 27392000.0, "progress": 0.23995981233797106, "epoch": 21.59647732693134, "img/sec/core": 189.6266565645107, "core_hours_Tesla V100-SXM2-32GB": 40.13279506459134, "core_hours": 40.13279506459134}
{"step": 26800, "global_schedule": 0.9338910579681396, "l2_grads": 1.2582379579544067, "l2_params": 336.1747741699219, "l2_updates": 1.005542516708374, "training_loss": 2.945434093475342, "uptime": 10448.491060551954, "examples_seen": 27443200.0, "progress": 0.2404083353516869, "epoch": 21.6368445742714, "img/sec/core": 189.35670567496854, "core_hours_Tesla V100-SXM2-32GB": 40.20790316372903, "core_hours": 40.20790316372903}
{"step": 26850, "global_schedule": 0.9335058927536011, "l2_grads": 1.3318614959716797, "l2_params": 336.177001953125, "l2_updates": 0.9876315593719482, "training_loss": 3.1111690998077393, "uptime": 10465.358341671992, "examples_seen": 27494400.0, "progress": 0.24085685836540272, "epoch": 21.677211821611458, "img/sec/core": 189.71640878140857, "core_hours_Tesla V100-SXM2-32GB": 40.282868857595865, "core_hours": 40.282868857595865}
{"step": 26900, "global_schedule": 0.9331197142601013, "l2_grads": 1.2496620416641235, "l2_params": 336.1916198730469, "l2_updates": 0.968902587890625, "training_loss": 2.9839529991149902, "uptime": 10482.23660526995, "examples_seen": 27545600.0, "progress": 0.24130538137911856, "epoch": 21.717579068951515, "img/sec/core": 189.59296265446477, "core_hours_Tesla V100-SXM2-32GB": 40.35788336247568, "core_hours": 40.35788336247568}
{"step": 26950, "global_schedule": 0.9327325224876404, "l2_grads": 1.282332420349121, "l2_params": 336.217041015625, "l2_updates": 1.00697922706604, "training_loss": 3.002476215362549, "uptime": 10499.118259060953, "examples_seen": 27596800.0, "progress": 0.2417539043928344, "epoch": 21.757946316291573, "img/sec/core": 189.55488837862123, "core_hours_Tesla V100-SXM2-32GB": 40.432912934880136, "core_hours": 40.432912934880136}
{"step": 27000, "global_schedule": 0.9323442578315735, "l2_grads": 1.110987901687622, "l2_params": 336.20892333984375, "l2_updates": 0.9616453051567078, "training_loss": 4.1463799476623535, "uptime": 10515.995361897978, "examples_seen": 27648000.0, "progress": 0.24220242740655024, "epoch": 21.798313563631634, "img/sec/core": 189.60600233944717, "core_hours_Tesla V100-SXM2-32GB": 40.50792228082246, "core_hours": 40.50792228082246}
{"step": 27050, "global_schedule": 0.9319549798965454, "l2_grads": 1.2517129182815552, "l2_params": 336.2046203613281, "l2_updates": 1.005516767501831, "training_loss": 2.9676742553710938, "uptime": 10533.39906417299, "examples_seen": 27699200.0, "progress": 0.24265095042026608, "epoch": 21.83868081097169, "img/sec/core": 189.4708429920625, "core_hours_Tesla V100-SXM2-32GB": 40.58298513480902, "core_hours": 40.58298513480902}
{"step": 27100, "global_schedule": 0.9315646886825562, "l2_grads": 1.0677040815353394, "l2_params": 336.2264709472656, "l2_updates": 0.9670982360839844, "training_loss": 5.36417293548584, "uptime": 10550.284594960976, "examples_seen": 27750400.0, "progress": 0.2430994734339819, "epoch": 21.87904805831175, "img/sec/core": 189.51136568812115, "core_hours_Tesla V100-SXM2-32GB": 40.658031938311176, "core_hours": 40.658031938311176}
{"step": 27150, "global_schedule": 0.9311733245849609, "l2_grads": 0.9638767838478088, "l2_params": 336.2283935546875, "l2_updates": 0.9583303332328796, "training_loss": 5.463204383850098, "uptime": 10567.166524498956, "examples_seen": 27801600.0, "progress": 0.24354799644769773, "epoch": 21.91941530565181, "img/sec/core": 189.5517922166921, "core_hours_Tesla V100-SXM2-32GB": 40.73306273625776, "core_hours": 40.73306273625776}
{"step": 27200, "global_schedule": 0.9307808876037598, "l2_grads": 1.2649199962615967, "l2_params": 336.24395751953125, "l2_updates": 1.0174484252929688, "training_loss": 2.909984588623047, "uptime": 10584.051523061993, "examples_seen": 27852800.0, "progress": 0.24399651946141357, "epoch": 21.959782552991868, "img/sec/core": 189.5173391962952, "core_hours_Tesla V100-SXM2-32GB": 40.8081071743157, "core_hours": 40.8081071743157}
{"step": 27250, "global_schedule": 0.9303874969482422, "l2_grads": 1.2476859092712402, "l2_params": 336.25311279296875, "l2_updates": 1.0151495933532715, "training_loss": 2.879727840423584, "uptime": 10600.93881250295, "examples_seen": 27904000.0, "progress": 0.2444450424751294, "epoch": 22.000149800331926, "img/sec/core": 189.49162985498631, "core_hours_Tesla V100-SXM2-32GB": 40.88316179405329, "core_hours": 40.88316179405329}
{"step": 27300, "global_schedule": 0.9299930334091187, "l2_grads": 1.1192182302474976, "l2_params": 336.2894287109375, "l2_updates": 1.0390331745147705, "training_loss": 3.982301712036133, "uptime": 10617.810946485959, "examples_seen": 27955200.0, "progress": 0.24489356548884522, "epoch": 22.040517047671983, "img/sec/core": 189.66184142579212, "core_hours_Tesla V100-SXM2-32GB": 40.95814905619999, "core_hours": 40.95814905619999}
{"step": 27350, "global_schedule": 0.9295974969863892, "l2_grads": 1.2677208185195923, "l2_params": 336.3049621582031, "l2_updates": 0.9442909359931946, "training_loss": 3.081342935562134, "uptime": 10634.682432817004, "examples_seen": 28006400.0, "progress": 0.24534208850256106, "epoch": 22.080884295012044, "img/sec/core": 189.66912204478933, "core_hours_Tesla V100-SXM2-32GB": 41.033133439893525, "core_hours": 41.033133439893525}
{"step": 27400, "global_schedule": 0.9292010068893433, "l2_grads": 1.2983239889144897, "l2_params": 336.241455078125, "l2_updates": 1.0010186433792114, "training_loss": 3.1272289752960205, "uptime": 10651.564519832958, "examples_seen": 28057600.0, "progress": 0.2457906115162769, "epoch": 22.121251542352102, "img/sec/core": 189.55002405661455, "core_hours_Tesla V100-SXM2-32GB": 41.10816493774221, "core_hours": 41.10816493774221}
{"step": 27450, "global_schedule": 0.9288034439086914, "l2_grads": 0.9438691735267639, "l2_params": 336.2285461425781, "l2_updates": 0.9690049886703491, "training_loss": 4.866110801696777, "uptime": 10668.440317477973, "examples_seen": 28108800.0, "progress": 0.24623913452999274, "epoch": 22.16161878969216, "img/sec/core": 189.62066666788945, "core_hours_Tesla V100-SXM2-32GB": 41.183168482831164, "core_hours": 41.183168482831164}
{"step": 27500, "global_schedule": 0.9284049272537231, "l2_grads": 1.0063331127166748, "l2_params": 336.24041748046875, "l2_updates": 1.0044794082641602, "training_loss": 4.199045658111572, "uptime": 10685.33565755398, "examples_seen": 28160000.0, "progress": 0.24668765754370856, "epoch": 22.20198603703222, "img/sec/core": 189.40133703163679, "core_hours_Tesla V100-SXM2-32GB": 41.25825888316897, "core_hours": 41.25825888316897, "minival/prec@1": 0.5592413362472682, "minival/loss": 1.9257229397976507, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.8892585479770787, "real/prec@1": 0.607810064692444, "real/loss": 2.8059000506827534, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.171786584949587, "train/prec@1": 0.5830698981383913, "train/loss": 1.827247762105013, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.577194077020977, "v2/prec@1": 0.4201, "v2/loss": 2.714719189453125, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3379534339765087, "val/prec@1": 0.5376, "val/loss": 2.05186537109375, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.369701970019378}
{"step": 27550, "global_schedule": 0.9280053377151489, "l2_grads": 1.2676416635513306, "l2_params": 336.2459411621094, "l2_updates": 1.0148173570632935, "training_loss": 3.4057722091674805, "uptime": 10738.586642275972, "examples_seen": 28211200.0, "progress": 0.2471361805574244, "epoch": 22.242353284372278, "img/sec/core": 189.31443583500752, "core_hours_Tesla V100-SXM2-32GB": 41.33338375232907, "core_hours": 41.33338375232907}
{"step": 27600, "global_schedule": 0.9276046752929688, "l2_grads": 1.4031450748443604, "l2_params": 336.2828674316406, "l2_updates": 0.9846997261047363, "training_loss": 2.9898386001586914, "uptime": 10755.468237271998, "examples_seen": 28262400.0, "progress": 0.24758470357114024, "epoch": 22.282720531712336, "img/sec/core": 189.55554855765976, "core_hours_Tesla V100-SXM2-32GB": 41.408413063422515, "core_hours": 41.408413063422515}
{"step": 27650, "global_schedule": 0.9272030591964722, "l2_grads": 1.3923380374908447, "l2_params": 336.289306640625, "l2_updates": 1.0118238925933838, "training_loss": 2.9453744888305664, "uptime": 10772.34911523998, "examples_seen": 28313600.0, "progress": 0.24803322658485608, "epoch": 22.323087779052393, "img/sec/core": 189.5636000727824, "core_hours_Tesla V100-SXM2-32GB": 41.48343918772466, "core_hours": 41.48343918772466}
{"step": 27700, "global_schedule": 0.9268003702163696, "l2_grads": 1.0206042528152466, "l2_params": 336.28863525390625, "l2_updates": 0.9835546612739563, "training_loss": 5.338540077209473, "uptime": 10789.217986100004, "examples_seen": 28364800.0, "progress": 0.24848174959857192, "epoch": 22.363455026392455, "img/sec/core": 189.69852970914664, "core_hours_Tesla V100-SXM2-32GB": 41.55841194710254, "core_hours": 41.55841194710254}
{"step": 27750, "global_schedule": 0.9263967275619507, "l2_grads": 1.397267460823059, "l2_params": 336.2847595214844, "l2_updates": 1.003521203994751, "training_loss": 2.973937511444092, "uptime": 10806.089590228978, "examples_seen": 28416000.0, "progress": 0.24893027261228773, "epoch": 22.403822273732512, "img/sec/core": 189.66779777061322, "core_hours_Tesla V100-SXM2-32GB": 41.63339685434243, "core_hours": 41.63339685434243}
{"step": 27800, "global_schedule": 0.9259920120239258, "l2_grads": 1.195805549621582, "l2_params": 336.30853271484375, "l2_updates": 0.9906953573226929, "training_loss": 3.3685481548309326, "uptime": 10822.970833336003, "examples_seen": 28467200.0, "progress": 0.24937879562600357, "epoch": 22.44418952107257, "img/sec/core": 189.55949983732225, "core_hours_Tesla V100-SXM2-32GB": 41.708424601484765, "core_hours": 41.708424601484765}
{"step": 27850, "global_schedule": 0.9255862236022949, "l2_grads": 1.067880392074585, "l2_params": 336.3125915527344, "l2_updates": 1.0124026536941528, "training_loss": 3.7982728481292725, "uptime": 10839.853275093948, "examples_seen": 28518400.0, "progress": 0.2498273186397194, "epoch": 22.484556768412627, "img/sec/core": 189.54604114028658, "core_hours_Tesla V100-SXM2-32GB": 41.78345767596452, "core_hours": 41.78345767596452}
{"step": 27900, "global_schedule": 0.9251794815063477, "l2_grads": 1.2786203622817993, "l2_params": 336.35595703125, "l2_updates": 0.9837791919708252, "training_loss": 3.304074287414551, "uptime": 10856.721137232962, "examples_seen": 28569600.0, "progress": 0.25027584165343525, "epoch": 22.52492401575269, "img/sec/core": 189.70987393824709, "core_hours_Tesla V100-SXM2-32GB": 41.858425952137914, "core_hours": 41.858425952137914}
{"step": 27950, "global_schedule": 0.9247717261314392, "l2_grads": 1.3998953104019165, "l2_params": 336.37799072265625, "l2_updates": 0.9666997194290161, "training_loss": 3.1254515647888184, "uptime": 10873.608242112969, "examples_seen": 28620800.0, "progress": 0.2507243646671511, "epoch": 22.565291263092746, "img/sec/core": 189.49370082900586, "core_hours_Tesla V100-SXM2-32GB": 41.93347975160461, "core_hours": 41.93347975160461}
{"step": 28000, "global_schedule": 0.9243628978729248, "l2_grads": 1.2505038976669312, "l2_params": 336.3306884765625, "l2_updates": 1.0216305255889893, "training_loss": 3.003368616104126, "uptime": 10890.480277817987, "examples_seen": 28672000.0, "progress": 0.25117288768086693, "epoch": 22.605658510432804, "img/sec/core": 189.6629461878226, "core_hours_Tesla V100-SXM2-32GB": 42.008466576960245, "core_hours": 42.008466576960245}
{"step": 28050, "global_schedule": 0.923953115940094, "l2_grads": 1.3089030981063843, "l2_params": 336.3390808105469, "l2_updates": 0.9885534048080444, "training_loss": 2.884641647338867, "uptime": 10907.921546522994, "examples_seen": 28723200.0, "progress": 0.2516214106945827, "epoch": 22.646025757772865, "img/sec/core": 189.8895688241474, "core_hours_Tesla V100-SXM2-32GB": 42.083363909711544, "core_hours": 42.083363909711544}
{"step": 28100, "global_schedule": 0.9235422611236572, "l2_grads": 1.3508636951446533, "l2_params": 336.33154296875, "l2_updates": 0.9998010396957397, "training_loss": 3.2274718284606934, "uptime": 10924.809449241962, "examples_seen": 28774400.0, "progress": 0.25206993370829855, "epoch": 22.686393005112922, "img/sec/core": 189.48474853575055, "core_hours_Tesla V100-SXM2-32GB": 42.158421255129184, "core_hours": 42.158421255129184}
{"step": 28150, "global_schedule": 0.923130452632904, "l2_grads": 1.1847848892211914, "l2_params": 336.3546447753906, "l2_updates": 1.0203514099121094, "training_loss": 3.080820083618164, "uptime": 10941.67302461696, "examples_seen": 28825600.0, "progress": 0.2525184567220144, "epoch": 22.72676025245298, "img/sec/core": 189.75809867367835, "core_hours_Tesla V100-SXM2-32GB": 42.23337047901806, "core_hours": 42.23337047901806}
{"step": 28200, "global_schedule": 0.9227175712585449, "l2_grads": 1.2614686489105225, "l2_params": 336.32720947265625, "l2_updates": 0.9938231706619263, "training_loss": 2.9348926544189453, "uptime": 10958.551815523999, "examples_seen": 28876800.0, "progress": 0.25296697973573024, "epoch": 22.767127499793038, "img/sec/core": 189.58703959450693, "core_hours_Tesla V100-SXM2-32GB": 42.30838732749378, "core_hours": 42.30838732749378}
{"step": 28250, "global_schedule": 0.9223037362098694, "l2_grads": 1.2323254346847534, "l2_params": 336.3328552246094, "l2_updates": 0.956457257270813, "training_loss": 3.0905110836029053, "uptime": 10975.423800435965, "examples_seen": 28928000.0, "progress": 0.2534155027494461, "epoch": 22.8074947471331, "img/sec/core": 189.66351716747093, "core_hours_Tesla V100-SXM2-32GB": 42.383373927102525, "core_hours": 42.383373927102525}
{"step": 28300, "global_schedule": 0.9218888282775879, "l2_grads": 1.3096901178359985, "l2_params": 336.3421936035156, "l2_updates": 0.999258816242218, "training_loss": 2.925769567489624, "uptime": 10992.294248130987, "examples_seen": 28979200.0, "progress": 0.2538640257631619, "epoch": 22.847861994473156, "img/sec/core": 189.68079910197912, "core_hours_Tesla V100-SXM2-32GB": 42.45835369463596, "core_hours": 42.45835369463596}
{"step": 28350, "global_schedule": 0.92147296667099, "l2_grads": 1.3073163032531738, "l2_params": 336.2939758300781, "l2_updates": 0.9839484095573425, "training_loss": 2.972416639328003, "uptime": 11009.149934795976, "examples_seen": 29030400.0, "progress": 0.25431254877687776, "epoch": 22.888229241813214, "img/sec/core": 189.84690826311913, "core_hours_Tesla V100-SXM2-32GB": 42.53326785759147, "core_hours": 42.53326785759147}
{"step": 28400, "global_schedule": 0.9210560321807861, "l2_grads": 1.2317830324172974, "l2_params": 336.2733154296875, "l2_updates": 0.9824320673942566, "training_loss": 3.421602249145508, "uptime": 11026.027748170949, "examples_seen": 29081600.0, "progress": 0.2547610717905936, "epoch": 22.928596489153275, "img/sec/core": 189.59802012890415, "core_hours_Tesla V100-SXM2-32GB": 42.60828036148023, "core_hours": 42.60828036148023}
{"step": 28450, "global_schedule": 0.9206382036209106, "l2_grads": 1.2536637783050537, "l2_params": 336.2695617675781, "l2_updates": 0.9557976126670837, "training_loss": 2.944704532623291, "uptime": 11042.889668355987, "examples_seen": 29132800.0, "progress": 0.25520959480430944, "epoch": 22.968963736493333, "img/sec/core": 189.7767255973291, "core_hours_Tesla V100-SXM2-32GB": 42.68322222896929, "core_hours": 42.68322222896929}
{"step": 28500, "global_schedule": 0.9202193021774292, "l2_grads": 1.4106054306030273, "l2_params": 336.2292785644531, "l2_updates": 0.9671323299407959, "training_loss": 2.90960955619812, "uptime": 11059.750964284001, "examples_seen": 29184000.0, "progress": 0.2556581178180252, "epoch": 23.00933098383339, "img/sec/core": 189.78375171527082, "core_hours_Tesla V100-SXM2-32GB": 42.75816132198269, "core_hours": 42.75816132198269}
{"step": 28550, "global_schedule": 0.9197993278503418, "l2_grads": 1.2730846405029297, "l2_params": 336.2340087890625, "l2_updates": 0.9638745784759521, "training_loss": 2.8818554878234863, "uptime": 11076.623691895977, "examples_seen": 29235200.0, "progress": 0.25610664083174106, "epoch": 23.049698231173448, "img/sec/core": 189.65516860053063, "core_hours_Tesla V100-SXM2-32GB": 42.83315122248036, "core_hours": 42.83315122248036}
{"step": 28600, "global_schedule": 0.919378399848938, "l2_grads": 1.2516746520996094, "l2_params": 336.2475891113281, "l2_updates": 0.961674690246582, "training_loss": 2.863913059234619, "uptime": 11093.479414950998, "examples_seen": 29286400.0, "progress": 0.2565551638454569, "epoch": 23.09006547851351, "img/sec/core": 189.8464984002398, "core_hours_Tesla V100-SXM2-32GB": 42.90806554716934, "core_hours": 42.90806554716934}
{"step": 28650, "global_schedule": 0.9189565181732178, "l2_grads": 1.3520958423614502, "l2_params": 336.2648620605469, "l2_updates": 1.0005487203598022, "training_loss": 5.525637149810791, "uptime": 11110.348962245975, "examples_seen": 29337600.0, "progress": 0.25700368685917274, "epoch": 23.130432725853566, "img/sec/core": 189.69092317924162, "core_hours_Tesla V100-SXM2-32GB": 42.98304131292479, "core_hours": 42.98304131292479}
{"step": 28700, "global_schedule": 0.9185335636138916, "l2_grads": 1.3526124954223633, "l2_params": 336.28204345703125, "l2_updates": 0.978929340839386, "training_loss": 3.0810227394104004, "uptime": 11127.237270817976, "examples_seen": 29388800.0, "progress": 0.2574522098728886, "epoch": 23.170799973193624, "img/sec/core": 189.48019491456293, "core_hours_Tesla V100-SXM2-32GB": 43.05810046213369, "core_hours": 43.05810046213369}
{"step": 28750, "global_schedule": 0.918109655380249, "l2_grads": 1.3085498809814453, "l2_params": 336.2683410644531, "l2_updates": 0.9578112959861755, "training_loss": 2.9705581665039062, "uptime": 11144.099020356953, "examples_seen": 29440000.0, "progress": 0.2579007328866044, "epoch": 23.21116722053368, "img/sec/core": 189.77864619581536, "core_hours_Tesla V100-SXM2-32GB": 43.133041571195804, "core_hours": 43.133041571195804}
{"step": 28800, "global_schedule": 0.9176846742630005, "l2_grads": 1.2853822708129883, "l2_params": 336.2271728515625, "l2_updates": 0.9591904282569885, "training_loss": 2.841057300567627, "uptime": 11160.964324334986, "examples_seen": 29491200.0, "progress": 0.25834925590032026, "epoch": 23.251534467873743, "img/sec/core": 189.7386494882042, "core_hours_Tesla V100-SXM2-32GB": 43.20799847776484, "core_hours": 43.20799847776484}
{"step": 28850, "global_schedule": 0.9172587394714355, "l2_grads": 1.2636826038360596, "l2_params": 336.2313232421875, "l2_updates": 1.0284810066223145, "training_loss": 2.8042032718658447, "uptime": 11177.848981854971, "examples_seen": 29542400.0, "progress": 0.2587977789140361, "epoch": 23.2919017152138, "img/sec/core": 189.52116714314428, "core_hours_Tesla V100-SXM2-32GB": 43.283041400075895, "core_hours": 43.283041400075895}
{"step": 28900, "global_schedule": 0.9168317914009094, "l2_grads": 1.096181035041809, "l2_params": 336.2259826660156, "l2_updates": 0.980649471282959, "training_loss": 4.954096794128418, "uptime": 11194.708820685977, "examples_seen": 29593600.0, "progress": 0.2592463019277519, "epoch": 23.332268962553858, "img/sec/core": 189.8001536120932, "core_hours_Tesla V100-SXM2-32GB": 43.357974017102585, "core_hours": 43.357974017102585}
{"step": 28950, "global_schedule": 0.9164038896560669, "l2_grads": 1.4134334325790405, "l2_params": 336.21881103515625, "l2_updates": 0.9529528021812439, "training_loss": 2.9470834732055664, "uptime": 11211.577663053991, "examples_seen": 29644800.0, "progress": 0.25969482494146773, "epoch": 23.37263620989392, "img/sec/core": 189.69885011597935, "core_hours_Tesla V100-SXM2-32GB": 43.43294664984931, "core_hours": 43.43294664984931}
{"step": 29001, "global_schedule": 0.9159749150276184, "l2_grads": 1.216170310974121, "l2_params": 336.2150573730469, "l2_updates": 0.9964128732681274, "training_loss": 3.3464395999908447, "uptime": 11228.45835404098, "examples_seen": 29696000.0, "progress": 0.26014334795518357, "epoch": 23.413003457233977, "img/sec/core": 189.5656997966746, "core_hours_Tesla V100-SXM2-32GB": 43.50797194312482, "core_hours": 43.50797194312482}
{"step": 29050, "global_schedule": 0.9155449867248535, "l2_grads": 1.06230890750885, "l2_params": 336.2230224609375, "l2_updates": 0.944781482219696, "training_loss": 4.054617881774902, "uptime": 11245.83909629198, "examples_seen": 29747200.0, "progress": 0.2605918709688994, "epoch": 23.453370704574034, "img/sec/core": 189.85370737361467, "core_hours_Tesla V100-SXM2-32GB": 43.58288342322689, "core_hours": 43.58288342322689}
{"step": 29100, "global_schedule": 0.9151140451431274, "l2_grads": 1.3400479555130005, "l2_params": 336.2098083496094, "l2_updates": 0.9920304417610168, "training_loss": 2.9072535037994385, "uptime": 11262.723592721974, "examples_seen": 29798400.0, "progress": 0.26104039398261525, "epoch": 23.493737951914092, "img/sec/core": 189.52297530861387, "core_hours_Tesla V100-SXM2-32GB": 43.657925629582415, "core_hours": 43.657925629582415}
{"step": 29151, "global_schedule": 0.914682149887085, "l2_grads": 0.9952394366264343, "l2_params": 336.2507629394531, "l2_updates": 0.9719365239143372, "training_loss": 5.363710403442383, "uptime": 11279.588083098002, "examples_seen": 29849600.0, "progress": 0.2614889169963311, "epoch": 23.534105199254153, "img/sec/core": 189.74780314432164, "core_hours_Tesla V100-SXM2-32GB": 43.73287892014254, "core_hours": 43.73287892014254}
{"step": 29200, "global_schedule": 0.9142491817474365, "l2_grads": 1.1057039499282837, "l2_params": 336.2059631347656, "l2_updates": 0.9701423645019531, "training_loss": 3.5698015689849854, "uptime": 11296.450903374003, "examples_seen": 29900800.0, "progress": 0.26193744001004693, "epoch": 23.57447244659421, "img/sec/core": 189.76659583772044, "core_hours_Tesla V100-SXM2-32GB": 43.80782478803587, "core_hours": 43.80782478803587}
{"step": 29250, "global_schedule": 0.9138152599334717, "l2_grads": 1.2023929357528687, "l2_params": 336.16021728515625, "l2_updates": 0.9714272618293762, "training_loss": 3.1821932792663574, "uptime": 11313.30262250296, "examples_seen": 29952000.0, "progress": 0.26238596302376277, "epoch": 23.614839693934268, "img/sec/core": 189.8916054505808, "core_hours_Tesla V100-SXM2-32GB": 43.88272131749791, "core_hours": 43.88272131749791}
{"step": 29300, "global_schedule": 0.9133803844451904, "l2_grads": 1.070082426071167, "l2_params": 336.1243896484375, "l2_updates": 1.0213756561279297, "training_loss": 3.4986789226531982, "uptime": 11330.170680369949, "examples_seen": 30003200.0, "progress": 0.2628344860374786, "epoch": 23.65520694127433, "img/sec/core": 189.70767264573976, "core_hours_Tesla V100-SXM2-32GB": 43.957690463573414, "core_hours": 43.957690463573414}
{"step": 29350, "global_schedule": 0.912944495677948, "l2_grads": 1.3521653413772583, "l2_params": 336.0963439941406, "l2_updates": 0.9367990493774414, "training_loss": 3.017799139022827, "uptime": 11347.032042549981, "examples_seen": 30054400.0, "progress": 0.2632830090511944, "epoch": 23.695574188614387, "img/sec/core": 189.78300601297383, "core_hours_Tesla V100-SXM2-32GB": 44.03262985104023, "core_hours": 44.03262985104023}
{"step": 29400, "global_schedule": 0.9125075936317444, "l2_grads": 1.233331322669983, "l2_params": 336.06103515625, "l2_updates": 0.9883700013160706, "training_loss": 3.09346079826355, "uptime": 11363.895214541, "examples_seen": 30105600.0, "progress": 0.26373153206491023, "epoch": 23.735941435954445, "img/sec/core": 189.76263787763358, "core_hours_Tesla V100-SXM2-32GB": 44.107577282111414, "core_hours": 44.107577282111414}
{"step": 29450, "global_schedule": 0.9120697379112244, "l2_grads": 1.0139453411102295, "l2_params": 336.0216064453125, "l2_updates": 0.9649657607078552, "training_loss": 4.545544147491455, "uptime": 11380.76750571496, "examples_seen": 30156800.0, "progress": 0.2641800550786261, "epoch": 23.776308683294502, "img/sec/core": 189.66007443841679, "core_hours_Tesla V100-SXM2-32GB": 44.18256524288458, "core_hours": 44.18256524288458}
{"step": 29500, "global_schedule": 0.9116308689117432, "l2_grads": 1.2596900463104248, "l2_params": 336.0413513183594, "l2_updates": 0.9786876440048218, "training_loss": 2.873087167739868, "uptime": 11397.622016633977, "examples_seen": 30208000.0, "progress": 0.2646285780923419, "epoch": 23.816675930634563, "img/sec/core": 189.86015170511763, "core_hours_Tesla V100-SXM2-32GB": 44.25747418030243, "core_hours": 44.25747418030243}
{"step": 29550, "global_schedule": 0.9111909866333008, "l2_grads": 1.343068242073059, "l2_params": 336.0152587890625, "l2_updates": 0.9558709859848022, "training_loss": 2.9207663536071777, "uptime": 11414.499519829988, "examples_seen": 30259200.0, "progress": 0.26507710110605776, "epoch": 23.85704317797462, "img/sec/core": 189.6015046085988, "core_hours_Tesla V100-SXM2-32GB": 44.33248530561803, "core_hours": 44.33248530561803}
{"step": 29600, "global_schedule": 0.9107502102851868, "l2_grads": 1.0765178203582764, "l2_params": 335.9999084472656, "l2_updates": 0.9921698570251465, "training_loss": 3.784130573272705, "uptime": 11431.377980402962, "examples_seen": 30310400.0, "progress": 0.2655256241197736, "epoch": 23.89741042531468, "img/sec/core": 189.59075006661593, "core_hours_Tesla V100-SXM2-32GB": 44.40750068594236, "core_hours": 44.40750068594236}
{"step": 29650, "global_schedule": 0.9103083610534668, "l2_grads": 1.3392740488052368, "l2_params": 335.9700012207031, "l2_updates": 0.9928121566772461, "training_loss": 2.931246042251587, "uptime": 11448.235381920997, "examples_seen": 30361600.0, "progress": 0.26597414713348944, "epoch": 23.93777767265474, "img/sec/core": 189.82759570486039, "core_hours_Tesla V100-SXM2-32GB": 44.48242247046696, "core_hours": 44.48242247046696}
{"step": 29700, "global_schedule": 0.9098656177520752, "l2_grads": 1.2361750602722168, "l2_params": 335.9540100097656, "l2_updates": 0.9935777187347412, "training_loss": 3.247670888900757, "uptime": 11465.103588394995, "examples_seen": 30412800.0, "progress": 0.2664226701472053, "epoch": 23.978144919994797, "img/sec/core": 189.70600134238325, "core_hours_Tesla V100-SXM2-32GB": 44.55739227701806, "core_hours": 44.55739227701806}
{"step": 29750, "global_schedule": 0.9094218015670776, "l2_grads": 1.2507414817810059, "l2_params": 335.9088134765625, "l2_updates": 0.9709226489067078, "training_loss": 2.995008945465088, "uptime": 11481.970820789982, "examples_seen": 30464000.0, "progress": 0.26687119316092106, "epoch": 24.018512167334855, "img/sec/core": 189.7169568228094, "core_hours_Tesla V100-SXM2-32GB": 44.632357754329114, "core_hours": 44.632357754329114}
{"step": 29800, "global_schedule": 0.9089770317077637, "l2_grads": 1.1792643070220947, "l2_params": 335.8914489746094, "l2_updates": 1.0314068794250488, "training_loss": 2.8807449340820312, "uptime": 11498.834293484979, "examples_seen": 30515200.0, "progress": 0.2673197161746369, "epoch": 24.058879414674912, "img/sec/core": 189.7592540917989, "core_hours_Tesla V100-SXM2-32GB": 44.707306521862435, "core_hours": 44.707306521862435}
{"step": 29850, "global_schedule": 0.9085313081741333, "l2_grads": 1.1611533164978027, "l2_params": 335.89910888671875, "l2_updates": 0.9395066499710083, "training_loss": 4.537858486175537, "uptime": 11515.699971909984, "examples_seen": 30566400.0, "progress": 0.26776823918835274, "epoch": 24.099246662014973, "img/sec/core": 189.73443696493453, "core_hours_Tesla V100-SXM2-32GB": 44.78226509264024, "core_hours": 44.78226509264024}
{"step": 29900, "global_schedule": 0.9080846309661865, "l2_grads": 1.3901149034500122, "l2_params": 335.8778381347656, "l2_updates": 0.9753915071487427, "training_loss": 2.7599306106567383, "uptime": 11532.567975212005, "examples_seen": 30617600.0, "progress": 0.2682167622020686, "epoch": 24.13961390935503, "img/sec/core": 189.70828631605784, "core_hours_Tesla V100-SXM2-32GB": 44.85723399620477, "core_hours": 44.85723399620477}
{"step": 29951, "global_schedule": 0.9076368808746338, "l2_grads": 1.3176372051239014, "l2_params": 335.86248779296875, "l2_updates": 0.9720853567123413, "training_loss": 2.9227781295776367, "uptime": 11549.427854059963, "examples_seen": 30668800.0, "progress": 0.2686652852157844, "epoch": 24.17998115669509, "img/sec/core": 189.7997031210962, "core_hours_Tesla V100-SXM2-32GB": 44.93216679108458, "core_hours": 44.93216679108458}
{"step": 30000, "global_schedule": 0.9071882367134094, "l2_grads": 1.264219880104065, "l2_params": 335.8351135253906, "l2_updates": 0.9941408634185791, "training_loss": 3.2385711669921875, "uptime": 11566.300602999981, "examples_seen": 30720000.0, "progress": 0.26911380822950026, "epoch": 24.220348404035146, "img/sec/core": 189.6549288664049, "core_hours_Tesla V100-SXM2-32GB": 45.00715678637356, "core_hours": 45.00715678637356, "minival/prec@1": 0.5842959725257572, "minival/loss": 1.7724235503702583, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.8851467040367424, "real/prec@1": 0.6316373807032901, "real/loss": 2.639518175651061, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.159317878016736, "train/prec@1": 0.608554814034266, "train/loss": 1.6626657683150632, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.59123775199987, "v2/prec@1": 0.4352, "v2/loss": 2.5748888427734373, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.379902643035166, "val/prec@1": 0.56018, "val/loss": 1.9053686694335938, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.350850605987944}
{"step": 30050, "global_schedule": 0.9067385792732239, "l2_grads": 1.264573097229004, "l2_params": 335.83465576171875, "l2_updates": 0.9841334819793701, "training_loss": 2.8867311477661133, "uptime": 11620.115993945976, "examples_seen": 30771200.0, "progress": 0.2695623312432161, "epoch": 24.260715651375207, "img/sec/core": 189.23997732898096, "core_hours_Tesla V100-SXM2-32GB": 45.08231121422205, "core_hours": 45.08231121422205}
{"step": 30100, "global_schedule": 0.9062879681587219, "l2_grads": 0.9694892764091492, "l2_params": 335.8138122558594, "l2_updates": 0.9557669758796692, "training_loss": 5.296966552734375, "uptime": 11636.981370263966, "examples_seen": 30822400.0, "progress": 0.27001085425693194, "epoch": 24.301082898715265, "img/sec/core": 189.73783565010726, "core_hours_Tesla V100-SXM2-32GB": 45.15726844230201, "core_hours": 45.15726844230201}
{"step": 30150, "global_schedule": 0.9058363437652588, "l2_grads": 1.088555932044983, "l2_params": 335.8127136230469, "l2_updates": 0.9811594486236572, "training_loss": 4.286255836486816, "uptime": 11653.82585736597, "examples_seen": 30873600.0, "progress": 0.2704593772706478, "epoch": 24.341450146055323, "img/sec/core": 189.97313368000013, "core_hours_Tesla V100-SXM2-32GB": 45.23213282942202, "core_hours": 45.23213282942202}
{"step": 30200, "global_schedule": 0.905383825302124, "l2_grads": 1.3436803817749023, "l2_params": 335.82965087890625, "l2_updates": 0.9975744485855103, "training_loss": 2.766568422317505, "uptime": 11670.695284629997, "examples_seen": 30924800.0, "progress": 0.27090790028436357, "epoch": 24.381817393395384, "img/sec/core": 189.69227288608994, "core_hours_Tesla V100-SXM2-32GB": 45.30710806170659, "core_hours": 45.30710806170659}
{"step": 30250, "global_schedule": 0.9049302339553833, "l2_grads": 1.1202774047851562, "l2_params": 335.7928466796875, "l2_updates": 0.998361349105835, "training_loss": 3.7472400665283203, "uptime": 11687.550453924981, "examples_seen": 30976000.0, "progress": 0.2713564232980794, "epoch": 24.42218464073544, "img/sec/core": 189.85273562053666, "core_hours_Tesla V100-SXM2-32GB": 45.38201992523986, "core_hours": 45.38201992523986}
{"step": 30300, "global_schedule": 0.904475748538971, "l2_grads": 1.277775764465332, "l2_params": 335.7989196777344, "l2_updates": 0.9707107543945312, "training_loss": 3.313749313354492, "uptime": 11704.428004580957, "examples_seen": 31027200.0, "progress": 0.27180494631179525, "epoch": 24.4625518880755, "img/sec/core": 189.60097144587485, "core_hours_Tesla V100-SXM2-32GB": 45.45703126148864, "core_hours": 45.45703126148864}
{"step": 30350, "global_schedule": 0.9040203094482422, "l2_grads": 1.056535005569458, "l2_params": 335.7893981933594, "l2_updates": 0.9634227156639099, "training_loss": 4.5734543800354, "uptime": 11721.318185741955, "examples_seen": 31078400.0, "progress": 0.2722534693255111, "epoch": 24.502919135415556, "img/sec/core": 189.45918753017068, "core_hours_Tesla V100-SXM2-32GB": 45.532098733315294, "core_hours": 45.532098733315294}
{"step": 30400, "global_schedule": 0.9035637974739075, "l2_grads": 1.1825748682022095, "l2_params": 335.8198547363281, "l2_updates": 0.9527472853660583, "training_loss": 3.5732548236846924, "uptime": 11738.183069209976, "examples_seen": 31129600.0, "progress": 0.27270199233922693, "epoch": 24.543286382755618, "img/sec/core": 189.7433804430288, "core_hours_Tesla V100-SXM2-32GB": 45.60705377095095, "core_hours": 45.60705377095095}
{"step": 30451, "global_schedule": 0.9031063914299011, "l2_grads": 1.1781014204025269, "l2_params": 335.771240234375, "l2_updates": 0.9526155591011047, "training_loss": 3.3147878646850586, "uptime": 11755.048685767979, "examples_seen": 31180800.0, "progress": 0.27315051535294277, "epoch": 24.583653630095675, "img/sec/core": 189.73513295495292, "core_hours_Tesla V100-SXM2-32GB": 45.682012066764294, "core_hours": 45.682012066764294}
{"step": 30500, "global_schedule": 0.9026479721069336, "l2_grads": 1.1649219989776611, "l2_params": 335.76177978515625, "l2_updates": 1.0006155967712402, "training_loss": 3.2041335105895996, "uptime": 11771.909832581994, "examples_seen": 31232000.0, "progress": 0.2735990383666586, "epoch": 24.624020877435733, "img/sec/core": 189.78543009542588, "core_hours_Tesla V100-SXM2-32GB": 45.756950497048805, "core_hours": 45.756950497048805}
{"step": 30550, "global_schedule": 0.9021886587142944, "l2_grads": 0.9407814145088196, "l2_params": 335.7673645019531, "l2_updates": 0.9448367953300476, "training_loss": 4.825942039489746, "uptime": 11788.764852811, "examples_seen": 31283200.0, "progress": 0.27404756138037445, "epoch": 24.664388124775794, "img/sec/core": 189.8544146801466, "core_hours_Tesla V100-SXM2-32GB": 45.83186169806661, "core_hours": 45.83186169806661}
{"step": 30600, "global_schedule": 0.9017283916473389, "l2_grads": 1.4593510627746582, "l2_params": 335.7604064941406, "l2_updates": 0.9815872311592102, "training_loss": 2.86958646774292, "uptime": 11805.626119706954, "examples_seen": 31334400.0, "progress": 0.27449608439409023, "epoch": 24.70475537211585, "img/sec/core": 189.78407848866092, "core_hours_Tesla V100-SXM2-32GB": 45.90680066204863, "core_hours": 45.90680066204863}
{"step": 30650, "global_schedule": 0.9012670516967773, "l2_grads": 1.2335764169692993, "l2_params": 335.7691650390625, "l2_updates": 0.9498962163925171, "training_loss": 2.8182458877563477, "uptime": 11822.492396173999, "examples_seen": 31385600.0, "progress": 0.2749446074078061, "epoch": 24.74512261945591, "img/sec/core": 189.72770938817442, "core_hours_Tesla V100-SXM2-32GB": 45.98176189079105, "core_hours": 45.98176189079105}
{"step": 30700, "global_schedule": 0.900804877281189, "l2_grads": 1.334084391593933, "l2_params": 335.7322692871094, "l2_updates": 0.9830753207206726, "training_loss": 3.044755697250366, "uptime": 11839.343977732991, "examples_seen": 31436800.0, "progress": 0.2753931304215219, "epoch": 24.785489866795967, "img/sec/core": 189.8931556541269, "core_hours_Tesla V100-SXM2-32GB": 46.05665780883101, "core_hours": 46.05665780883101}
{"step": 30750, "global_schedule": 0.9003416299819946, "l2_grads": 1.206514596939087, "l2_params": 335.74688720703125, "l2_updates": 0.9738892316818237, "training_loss": 3.1219449043273926, "uptime": 11856.212681411998, "examples_seen": 31488000.0, "progress": 0.27584165343523775, "epoch": 24.825857114136028, "img/sec/core": 189.70040975836088, "core_hours_Tesla V100-SXM2-32GB": 46.13162982518215, "core_hours": 46.13162982518215}
{"step": 30800, "global_schedule": 0.8998774886131287, "l2_grads": 1.2683039903640747, "l2_params": 335.7225646972656, "l2_updates": 0.9689886569976807, "training_loss": 2.9210712909698486, "uptime": 11873.064953289984, "examples_seen": 31539200.0, "progress": 0.2762901764489536, "epoch": 24.866224361476085, "img/sec/core": 189.88537706777404, "core_hours_Tesla V100-SXM2-32GB": 46.206528811306534, "core_hours": 46.206528811306534}
{"step": 30850, "global_schedule": 0.8994123935699463, "l2_grads": 1.1656196117401123, "l2_params": 335.686279296875, "l2_updates": 0.9302693009376526, "training_loss": 3.6080198287963867, "uptime": 11889.915438433993, "examples_seen": 31590400.0, "progress": 0.27673869946266944, "epoch": 24.906591608816143, "img/sec/core": 189.9055114824296, "core_hours_Tesla V100-SXM2-32GB": 46.28141985639102, "core_hours": 46.28141985639102}
{"step": 30900, "global_schedule": 0.8989462852478027, "l2_grads": 1.2201892137527466, "l2_params": 335.6322937011719, "l2_updates": 0.8854105472564697, "training_loss": 5.256954669952393, "uptime": 11906.786195006978, "examples_seen": 31641600.0, "progress": 0.2771872224763853, "epoch": 24.9469588561562, "img/sec/core": 189.67732633425743, "core_hours_Tesla V100-SXM2-32GB": 46.3564009967154, "core_hours": 46.3564009967154}
{"step": 30950, "global_schedule": 0.8984792828559875, "l2_grads": 1.3046679496765137, "l2_params": 335.578125, "l2_updates": 0.960054337978363, "training_loss": 2.9120192527770996, "uptime": 11923.632927019964, "examples_seen": 31692800.0, "progress": 0.2776357454901011, "epoch": 24.98732610349626, "img/sec/core": 189.94781881336908, "core_hours_Tesla V100-SXM2-32GB": 46.43127536121756, "core_hours": 46.43127536121756}
{"step": 31000, "global_schedule": 0.898011326789856, "l2_grads": 1.3777804374694824, "l2_params": 335.5478210449219, "l2_updates": 0.9683310389518738, "training_loss": 2.9706552028656006, "uptime": 11940.502282036003, "examples_seen": 31744000.0, "progress": 0.27808426850381696, "epoch": 25.02769335083632, "img/sec/core": 189.69308529920434, "core_hours_Tesla V100-SXM2-32GB": 46.50625027239995, "core_hours": 46.50625027239995}
{"step": 31050, "global_schedule": 0.8975423574447632, "l2_grads": 0.967025101184845, "l2_params": 335.54620361328125, "l2_updates": 0.9703755378723145, "training_loss": 4.6343994140625, "uptime": 11957.981118939992, "examples_seen": 31795200.0, "progress": 0.27853279151753274, "epoch": 25.068060598176377, "img/sec/core": 189.8498891507087, "core_hours_Tesla V100-SXM2-32GB": 46.58116325910669, "core_hours": 46.58116325910669}
{"step": 31100, "global_schedule": 0.8970724940299988, "l2_grads": 1.3421719074249268, "l2_params": 335.52142333984375, "l2_updates": 0.9692977666854858, "training_loss": 2.844660997390747, "uptime": 11974.854982021963, "examples_seen": 31846400.0, "progress": 0.2789813145312486, "epoch": 25.108427845516438, "img/sec/core": 189.64240639234177, "core_hours_Tesla V100-SXM2-32GB": 46.656158206137675, "core_hours": 46.656158206137675}
{"step": 31150, "global_schedule": 0.896601676940918, "l2_grads": 1.5108259916305542, "l2_params": 335.5326232910156, "l2_updates": 0.9557756185531616, "training_loss": 2.940141201019287, "uptime": 11991.720878137974, "examples_seen": 31897600.0, "progress": 0.2794298375449644, "epoch": 25.148795092856496, "img/sec/core": 189.73198803010715, "core_hours_Tesla V100-SXM2-32GB": 46.73111774443105, "core_hours": 46.73111774443105}
{"step": 31200, "global_schedule": 0.896129846572876, "l2_grads": 1.2161155939102173, "l2_params": 335.531982421875, "l2_updates": 0.9640301465988159, "training_loss": 2.8537566661834717, "uptime": 12008.599277756002, "examples_seen": 31948800.0, "progress": 0.27987836055868026, "epoch": 25.189162340196553, "img/sec/core": 189.59143475794994, "core_hours_Tesla V100-SXM2-32GB": 46.80613285384451, "core_hours": 46.80613285384451}
{"step": 31250, "global_schedule": 0.8956571817398071, "l2_grads": 1.050104022026062, "l2_params": 335.4757080078125, "l2_updates": 0.9327606558799744, "training_loss": 4.2772040367126465, "uptime": 12025.459602146992, "examples_seen": 32000000.0, "progress": 0.2803268835723961, "epoch": 25.22952958753661, "img/sec/core": 189.79468756308094, "core_hours_Tesla V100-SXM2-32GB": 46.88106762891558, "core_hours": 46.88106762891558}
{"step": 31300, "global_schedule": 0.8951834440231323, "l2_grads": 1.2870904207229614, "l2_params": 335.4629821777344, "l2_updates": 0.9587193727493286, "training_loss": 2.902132272720337, "uptime": 12042.316290255985, "examples_seen": 32051200.0, "progress": 0.28077540658611194, "epoch": 25.269896834876672, "img/sec/core": 189.83562959159673, "core_hours_Tesla V100-SXM2-32GB": 46.955986242733324, "core_hours": 46.955986242733324}
{"step": 31350, "global_schedule": 0.8947088122367859, "l2_grads": 1.1901376247406006, "l2_params": 335.46551513671875, "l2_updates": 0.979808509349823, "training_loss": 3.2171359062194824, "uptime": 12059.206739177986, "examples_seen": 32102400.0, "progress": 0.2812239295998278, "epoch": 25.31026408221673, "img/sec/core": 189.4561840705072, "core_hours_Tesla V100-SXM2-32GB": 47.03105490460889, "core_hours": 47.03105490460889}
{"step": 31400, "global_schedule": 0.894233226776123, "l2_grads": 1.116856575012207, "l2_params": 335.4261169433594, "l2_updates": 0.9146690368652344, "training_loss": 5.117556571960449, "uptime": 12076.07410296495, "examples_seen": 32153600.0, "progress": 0.2816724526135436, "epoch": 25.350631329556787, "img/sec/core": 189.7154789815415, "core_hours_Tesla V100-SXM2-32GB": 47.10602096588429, "core_hours": 47.10602096588429}
{"step": 31450, "global_schedule": 0.8937567472457886, "l2_grads": 1.2827541828155518, "l2_params": 335.3642883300781, "l2_updates": 0.9592208862304688, "training_loss": 2.8028461933135986, "uptime": 12092.970933554985, "examples_seen": 32204800.0, "progress": 0.2821209756272594, "epoch": 25.39099857689685, "img/sec/core": 189.38462943975642, "core_hours_Tesla V100-SXM2-32GB": 47.181117990728886, "core_hours": 47.181117990728886}
{"step": 31500, "global_schedule": 0.8932792544364929, "l2_grads": 1.4104171991348267, "l2_params": 335.3673400878906, "l2_updates": 0.953591525554657, "training_loss": 2.981626510620117, "uptime": 12109.845099331986, "examples_seen": 32256000.0, "progress": 0.28256949864097525, "epoch": 25.431365824236906, "img/sec/core": 189.63900451669045, "core_hours_Tesla V100-SXM2-32GB": 47.256114283071106, "core_hours": 47.256114283071106}
{"step": 31550, "global_schedule": 0.8928008079528809, "l2_grads": 1.1604748964309692, "l2_params": 335.38031005859375, "l2_updates": 0.9680977463722229, "training_loss": 3.365471124649048, "uptime": 12126.72190258, "examples_seen": 32307200.0, "progress": 0.2830180216546911, "epoch": 25.471733071576963, "img/sec/core": 189.6093681353084, "core_hours_Tesla V100-SXM2-32GB": 47.331122297506724, "core_hours": 47.331122297506724}
{"step": 31600, "global_schedule": 0.8923214673995972, "l2_grads": 1.3587888479232788, "l2_params": 335.3822937011719, "l2_updates": 0.9661991000175476, "training_loss": 2.94970965385437, "uptime": 12143.60186227999, "examples_seen": 32358400.0, "progress": 0.28346654466840693, "epoch": 25.51210031891702, "img/sec/core": 189.5739123122502, "core_hours_Tesla V100-SXM2-32GB": 47.406144340617786, "core_hours": 47.406144340617786}
{"step": 31650, "global_schedule": 0.8918411731719971, "l2_grads": 1.2837120294570923, "l2_params": 335.4000244140625, "l2_updates": 0.9772435426712036, "training_loss": 3.0694336891174316, "uptime": 12160.488675635948, "examples_seen": 32409600.0, "progress": 0.28391506768212277, "epoch": 25.552467566257082, "img/sec/core": 189.4969721371844, "core_hours_Tesla V100-SXM2-32GB": 47.48119684442205, "core_hours": 47.48119684442205}
{"step": 31700, "global_schedule": 0.8913599848747253, "l2_grads": 1.182002067565918, "l2_params": 335.38458251953125, "l2_updates": 0.9453338980674744, "training_loss": 3.991947650909424, "uptime": 12177.366641736997, "examples_seen": 32460800.0, "progress": 0.2843635906958386, "epoch": 25.59283481359714, "img/sec/core": 189.59630448607226, "core_hours_Tesla V100-SXM2-32GB": 47.55621002709338, "core_hours": 47.55621002709338}
{"step": 31750, "global_schedule": 0.8908778429031372, "l2_grads": 1.0393515825271606, "l2_params": 335.37371826171875, "l2_updates": 0.96127849817276, "training_loss": 5.305665016174316, "uptime": 12194.252279758977, "examples_seen": 32512000.0, "progress": 0.28481211370955445, "epoch": 25.633202060937197, "img/sec/core": 189.51016217654842, "core_hours_Tesla V100-SXM2-32GB": 47.63125730719107, "core_hours": 47.63125730719107}
{"step": 31800, "global_schedule": 0.8903946876525879, "l2_grads": 1.3427133560180664, "l2_params": 335.3192443847656, "l2_updates": 0.943195641040802, "training_loss": 2.663160800933838, "uptime": 12211.127521928982, "examples_seen": 32563200.0, "progress": 0.2852606367232703, "epoch": 25.67356930827726, "img/sec/core": 189.62690832893216, "core_hours_Tesla V100-SXM2-32GB": 47.7062583835022, "core_hours": 47.7062583835022}
{"step": 31850, "global_schedule": 0.8899106979370117, "l2_grads": 1.0550882816314697, "l2_params": 335.2739562988281, "l2_updates": 0.9597238898277283, "training_loss": 4.486408233642578, "uptime": 12228.011776033964, "examples_seen": 32614400.0, "progress": 0.28570915973698613, "epoch": 25.713936555617316, "img/sec/core": 189.52569536701338, "core_hours_Tesla V100-SXM2-32GB": 47.78129951285768, "core_hours": 47.78129951285768}
{"step": 31900, "global_schedule": 0.8894257545471191, "l2_grads": 1.2360159158706665, "l2_params": 335.24310302734375, "l2_updates": 0.937818169593811, "training_loss": 3.1217141151428223, "uptime": 12244.905280022998, "examples_seen": 32665600.0, "progress": 0.2861576827507019, "epoch": 25.754303802957374, "img/sec/core": 189.4219223008471, "core_hours_Tesla V100-SXM2-32GB": 47.85638175280894, "core_hours": 47.85638175280894}
{"step": 31950, "global_schedule": 0.8889397978782654, "l2_grads": 1.1975138187408447, "l2_params": 335.2139587402344, "l2_updates": 0.9780257940292358, "training_loss": 2.7996115684509277, "uptime": 12261.782319222984, "examples_seen": 32716800.0, "progress": 0.28660620576441775, "epoch": 25.79467105029743, "img/sec/core": 189.60671727317248, "core_hours_Tesla V100-SXM2-32GB": 47.93139081591999, "core_hours": 47.93139081591999}
{"step": 32000, "global_schedule": 0.8884530067443848, "l2_grads": 1.0580248832702637, "l2_params": 335.1484680175781, "l2_updates": 0.9300531148910522, "training_loss": 5.294328689575195, "uptime": 12278.659146358958, "examples_seen": 32768000.0, "progress": 0.2870547287781336, "epoch": 25.835038297637492, "img/sec/core": 189.6090997566222, "core_hours_Tesla V100-SXM2-32GB": 48.00639893652431, "core_hours": 48.00639893652431}
{"step": 32050, "global_schedule": 0.887965202331543, "l2_grads": 1.1355143785476685, "l2_params": 335.1298828125, "l2_updates": 0.9701444506645203, "training_loss": 3.542635440826416, "uptime": 12296.116940774955, "examples_seen": 32819200.0, "progress": 0.28750325179184943, "epoch": 25.87540554497755, "img/sec/core": 189.4293522783838, "core_hours_Tesla V100-SXM2-32GB": 48.08147823152883, "core_hours": 48.08147823152883}
{"step": 32100, "global_schedule": 0.8874765038490295, "l2_grads": 1.2737387418746948, "l2_params": 335.08868408203125, "l2_updates": 0.9552923440933228, "training_loss": 2.946524143218994, "uptime": 12312.997120415966, "examples_seen": 32870400.0, "progress": 0.2879517748055653, "epoch": 25.915772792317608, "img/sec/core": 189.57144225084932, "core_hours_Tesla V100-SXM2-32GB": 48.15650125215554, "core_hours": 48.15650125215554}
{"step": 32150, "global_schedule": 0.8869868516921997, "l2_grads": 1.3302940130233765, "l2_params": 335.06640625, "l2_updates": 0.9571489691734314, "training_loss": 2.8143625259399414, "uptime": 12329.891363223956, "examples_seen": 32921600.0, "progress": 0.2884002978192811, "epoch": 25.956140039657665, "img/sec/core": 189.41363850214088, "core_hours_Tesla V100-SXM2-32GB": 48.23158677574661, "core_hours": 48.23158677574661}
{"step": 32200, "global_schedule": 0.8864963054656982, "l2_grads": 1.3439279794692993, "l2_params": 335.0374755859375, "l2_updates": 0.9868236184120178, "training_loss": 2.805602550506592, "uptime": 12346.775240879972, "examples_seen": 32972800.0, "progress": 0.28884882083299696, "epoch": 25.996507286997726, "img/sec/core": 189.52992109960937, "core_hours_Tesla V100-SXM2-32GB": 48.306626231995565, "core_hours": 48.306626231995565}
{"step": 32250, "global_schedule": 0.8860048055648804, "l2_grads": 0.9580655097961426, "l2_params": 335.06341552734375, "l2_updates": 0.9401438236236572, "training_loss": 5.162426948547363, "uptime": 12363.665745263977, "examples_seen": 33024000.0, "progress": 0.2892973438467128, "epoch": 26.036874534337784, "img/sec/core": 189.45556196830745, "core_hours_Tesla V100-SXM2-32GB": 48.381695140368926, "core_hours": 48.381695140368926}
{"step": 32300, "global_schedule": 0.8855124711990356, "l2_grads": 1.293140172958374, "l2_params": 335.0130920410156, "l2_updates": 0.9664849638938904, "training_loss": 3.033461570739746, "uptime": 12380.529356581974, "examples_seen": 33075200.0, "progress": 0.28974586686042864, "epoch": 26.07724178167784, "img/sec/core": 189.7576942244301, "core_hours_Tesla V100-SXM2-32GB": 48.45664452400447, "core_hours": 48.45664452400447}
{"step": 32350, "global_schedule": 0.8850191235542297, "l2_grads": 1.2940258979797363, "l2_params": 334.99053955078125, "l2_updates": 0.9094258546829224, "training_loss": 3.025188446044922, "uptime": 12397.431209741975, "examples_seen": 33126400.0, "progress": 0.2901943898741444, "epoch": 26.117609029017903, "img/sec/core": 189.32835173203853, "core_hours_Tesla V100-SXM2-32GB": 48.53176387138225, "core_hours": 48.53176387138225}
{"step": 32400, "global_schedule": 0.8845248818397522, "l2_grads": 1.107415795326233, "l2_params": 334.96600341796875, "l2_updates": 0.9721260666847229, "training_loss": 4.2992048263549805, "uptime": 12414.309768188978, "examples_seen": 33177600.0, "progress": 0.29064291288786026, "epoch": 26.15797627635796, "img/sec/core": 189.58965068301242, "core_hours_Tesla V100-SXM2-32GB": 48.60677968670226, "core_hours": 48.60677968670226}
{"step": 32450, "global_schedule": 0.8840296864509583, "l2_grads": 1.329656958580017, "l2_params": 334.93548583984375, "l2_updates": 0.9413738250732422, "training_loss": 2.801754951477051, "uptime": 12431.175604749995, "examples_seen": 33228800.0, "progress": 0.2910914359015761, "epoch": 26.198343523698018, "img/sec/core": 189.73265799315934, "core_hours_Tesla V100-SXM2-32GB": 48.68173896030678, "core_hours": 48.68173896030678}
{"step": 32500, "global_schedule": 0.8835335969924927, "l2_grads": 1.2655216455459595, "l2_params": 334.8773193359375, "l2_updates": 0.9750601053237915, "training_loss": 2.7535877227783203, "uptime": 12448.048116300954, "examples_seen": 33280000.0, "progress": 0.29153995891529194, "epoch": 26.238710771038075, "img/sec/core": 189.6575972305776, "core_hours_Tesla V100-SXM2-32GB": 48.756727900533264, "core_hours": 48.756727900533264, "minival/prec@1": 0.5995941305026538, "minival/loss": 1.6814034873159684, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.9337831439916044, "real/prec@1": 0.6434442855007793, "real/loss": 2.5503764113941703, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.166058312985115, "train/prec@1": 0.6214338680092105, "train/loss": 1.5808779175283478, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.565490281966049, "v2/prec@1": 0.4482, "v2/loss": 2.505152587890625, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3700247909873724, "val/prec@1": 0.57168, "val/loss": 1.8209069702148437, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.362513130996376}
{"step": 32550, "global_schedule": 0.8830366134643555, "l2_grads": 1.0541439056396484, "l2_params": 334.8542785644531, "l2_updates": 0.9391403794288635, "training_loss": 4.615114212036133, "uptime": 12501.377083900967, "examples_seen": 33331200.0, "progress": 0.2919884819290078, "epoch": 26.279078018378137, "img/sec/core": 189.02342539897444, "core_hours_Tesla V100-SXM2-32GB": 48.83196842795574, "core_hours": 48.83196842795574}
{"step": 32600, "global_schedule": 0.8825386762619019, "l2_grads": 1.271302580833435, "l2_params": 334.7897644042969, "l2_updates": 0.9582049250602722, "training_loss": 2.7864413261413574, "uptime": 12518.254936695972, "examples_seen": 33382400.0, "progress": 0.2924370049427236, "epoch": 26.319445265718194, "img/sec/core": 189.59757730242683, "core_hours_Tesla V100-SXM2-32GB": 48.90698110704466, "core_hours": 48.90698110704466}
{"step": 32650, "global_schedule": 0.8820397853851318, "l2_grads": 1.0568768978118896, "l2_params": 334.7682189941406, "l2_updates": 0.9404269456863403, "training_loss": 4.7040205001831055, "uptime": 12535.142823349976, "examples_seen": 33433600.0, "progress": 0.29288552795643946, "epoch": 26.35981251305825, "img/sec/core": 189.48492878719034, "core_hours_Tesla V100-SXM2-32GB": 48.98203838106245, "core_hours": 48.98203838106245}
{"step": 32700, "global_schedule": 0.881540060043335, "l2_grads": 1.3117822408676147, "l2_params": 334.7448425292969, "l2_updates": 0.9524955749511719, "training_loss": 2.8788528442382812, "uptime": 12552.022366696969, "examples_seen": 33484800.0, "progress": 0.2933340509701553, "epoch": 26.400179760398313, "img/sec/core": 189.57858836684895, "core_hours_Tesla V100-SXM2-32GB": 49.05705857371575, "core_hours": 49.05705857371575}
{"step": 32750, "global_schedule": 0.8810393810272217, "l2_grads": 1.2146358489990234, "l2_params": 334.7248229980469, "l2_updates": 0.9628119468688965, "training_loss": 2.7338778972625732, "uptime": 12568.875304113957, "examples_seen": 33536000.0, "progress": 0.2937825739838711, "epoch": 26.44054700773837, "img/sec/core": 189.87787830828077, "core_hours_Tesla V100-SXM2-32GB": 49.131960517791256, "core_hours": 49.131960517791256}
{"step": 32800, "global_schedule": 0.880537748336792, "l2_grads": 1.2285867929458618, "l2_params": 334.6791076660156, "l2_updates": 0.9770669937133789, "training_loss": 2.8466293811798096, "uptime": 12585.76007050398, "examples_seen": 33587200.0, "progress": 0.2942310969975869, "epoch": 26.480914255078428, "img/sec/core": 189.51994514361692, "core_hours_Tesla V100-SXM2-32GB": 49.20700392396914, "core_hours": 49.20700392396914}
{"step": 32850, "global_schedule": 0.8800352811813354, "l2_grads": 1.349402666091919, "l2_params": 334.6607971191406, "l2_updates": 0.9245405197143555, "training_loss": 2.8179574012756348, "uptime": 12602.628612484958, "examples_seen": 33638400.0, "progress": 0.29467962001130277, "epoch": 26.521281502418486, "img/sec/core": 189.70222818360196, "core_hours_Tesla V100-SXM2-32GB": 49.28197522166237, "core_hours": 49.28197522166237}
{"step": 32900, "global_schedule": 0.8795318603515625, "l2_grads": 1.2795772552490234, "l2_params": 334.6426696777344, "l2_updates": 0.9770141243934631, "training_loss": 2.820138692855835, "uptime": 12619.512850187952, "examples_seen": 33689600.0, "progress": 0.2951281430250186, "epoch": 26.561648749758547, "img/sec/core": 189.52587947944684, "core_hours_Tesla V100-SXM2-32GB": 49.35701627812012, "core_hours": 49.35701627812012}
{"step": 32950, "global_schedule": 0.8790275454521179, "l2_grads": 1.050257921218872, "l2_params": 334.6525573730469, "l2_updates": 0.9294047951698303, "training_loss": 5.430239677429199, "uptime": 12636.40230336797, "examples_seen": 33740800.0, "progress": 0.29557666603873445, "epoch": 26.602015997098604, "img/sec/core": 189.4673537320888, "core_hours_Tesla V100-SXM2-32GB": 49.43208051447575, "core_hours": 49.43208051447575}
{"step": 33000, "global_schedule": 0.8785223364830017, "l2_grads": 1.2347395420074463, "l2_params": 334.61737060546875, "l2_updates": 0.9605688452720642, "training_loss": 2.774350166320801, "uptime": 12653.271230444952, "examples_seen": 33792000.0, "progress": 0.2960251890524503, "epoch": 26.642383244438662, "img/sec/core": 189.6978975246336, "core_hours_Tesla V100-SXM2-32GB": 49.50705352370679, "core_hours": 49.50705352370679}
{"step": 33050, "global_schedule": 0.8780162334442139, "l2_grads": 1.3218728303909302, "l2_params": 334.59075927734375, "l2_updates": 0.9145033359527588, "training_loss": 3.1165473461151123, "uptime": 12670.94598578097, "examples_seen": 33843200.0, "progress": 0.29647371206616613, "epoch": 26.68275049177872, "img/sec/core": 189.5545128206357, "core_hours_Tesla V100-SXM2-32GB": 49.58208324476482, "core_hours": 49.58208324476482}
{"step": 33100, "global_schedule": 0.8775091767311096, "l2_grads": 1.0070035457611084, "l2_params": 334.5179748535156, "l2_updates": 0.9144812822341919, "training_loss": 5.053844451904297, "uptime": 12687.821054675966, "examples_seen": 33894400.0, "progress": 0.29692223507988197, "epoch": 26.72311773911878, "img/sec/core": 189.6288554382797, "core_hours_Tesla V100-SXM2-32GB": 49.65708355096479, "core_hours": 49.65708355096479}
{"step": 33150, "global_schedule": 0.8770012259483337, "l2_grads": 1.058276891708374, "l2_params": 334.522705078125, "l2_updates": 0.9255990982055664, "training_loss": 4.979879379272461, "uptime": 12704.688990123977, "examples_seen": 33945600.0, "progress": 0.2973707580935978, "epoch": 26.763484986458838, "img/sec/core": 189.70904944844156, "core_hours_Tesla V100-SXM2-32GB": 49.73205215295595, "core_hours": 49.73205215295595}
{"step": 33200, "global_schedule": 0.8764923810958862, "l2_grads": 1.2496576309204102, "l2_params": 334.49359130859375, "l2_updates": 0.9336262941360474, "training_loss": 2.7299935817718506, "uptime": 12721.576844226976, "examples_seen": 33996800.0, "progress": 0.2978192811073136, "epoch": 26.803852233798896, "img/sec/core": 189.48529401564045, "core_hours_Tesla V100-SXM2-32GB": 49.80710928230262, "core_hours": 49.80710928230262}
{"step": 33250, "global_schedule": 0.8759826421737671, "l2_grads": 1.2162257432937622, "l2_params": 334.4635009765625, "l2_updates": 0.9623005390167236, "training_loss": 2.869959831237793, "uptime": 12738.448207206966, "examples_seen": 34048000.0, "progress": 0.29826780412102943, "epoch": 26.844219481138957, "img/sec/core": 189.6705087665651, "core_hours_Tesla V100-SXM2-32GB": 49.88209311776924, "core_hours": 49.88209311776924}
{"step": 33300, "global_schedule": 0.8754719495773315, "l2_grads": 1.3520339727401733, "l2_params": 334.4427795410156, "l2_updates": 0.9428043365478516, "training_loss": 2.8550500869750977, "uptime": 12755.327010783949, "examples_seen": 34099200.0, "progress": 0.2987163271347453, "epoch": 26.884586728479015, "img/sec/core": 189.58689728244204, "core_hours_Tesla V100-SXM2-32GB": 49.95711002255583, "core_hours": 49.95711002255583}
{"step": 33350, "global_schedule": 0.8749604225158691, "l2_grads": 1.377443790435791, "l2_params": 334.4151306152344, "l2_updates": 0.9284054636955261, "training_loss": 3.2987163066864014, "uptime": 12772.226362650981, "examples_seen": 34150400.0, "progress": 0.2991648501484611, "epoch": 26.924953975819072, "img/sec/core": 189.35637444431558, "core_hours_Tesla V100-SXM2-32GB": 50.03221825307597, "core_hours": 50.03221825307597}
{"step": 33400, "global_schedule": 0.8744479417800903, "l2_grads": 1.3114300966262817, "l2_params": 334.3870849609375, "l2_updates": 0.9395676255226135, "training_loss": 2.8017678260803223, "uptime": 12789.114425279957, "examples_seen": 34201600.0, "progress": 0.29961337316217695, "epoch": 26.96532122315913, "img/sec/core": 189.48295433897889, "core_hours_Tesla V100-SXM2-32GB": 50.10727630920475, "core_hours": 50.10727630920475}
{"step": 33450, "global_schedule": 0.8739346265792847, "l2_grads": 1.300555944442749, "l2_params": 334.3712463378906, "l2_updates": 0.9387809038162231, "training_loss": 2.7308926582336426, "uptime": 12805.971481051005, "examples_seen": 34252800.0, "progress": 0.3000618961758928, "epoch": 27.00568847049919, "img/sec/core": 189.83148916763787, "core_hours_Tesla V100-SXM2-32GB": 50.182196557076075, "core_hours": 50.182196557076075}
{"step": 33500, "global_schedule": 0.8734203577041626, "l2_grads": 1.3359277248382568, "l2_params": 334.3485107421875, "l2_updates": 0.9475963711738586, "training_loss": 2.773178815841675, "uptime": 12822.869335897965, "examples_seen": 34304000.0, "progress": 0.30051041918960864, "epoch": 27.04605571783925, "img/sec/core": 189.37314996380258, "core_hours_Tesla V100-SXM2-32GB": 50.25729813417368, "core_hours": 50.25729813417368}
{"step": 33550, "global_schedule": 0.8729052543640137, "l2_grads": 1.2820179462432861, "l2_params": 334.3125, "l2_updates": 0.9138476252555847, "training_loss": 2.808742046356201, "uptime": 12839.769487922953, "examples_seen": 34355200.0, "progress": 0.3009589422033245, "epoch": 27.086422965179306, "img/sec/core": 189.3474091397911, "core_hours_Tesla V100-SXM2-32GB": 50.3324099209514, "core_hours": 50.3324099209514}
{"step": 33600, "global_schedule": 0.8723891973495483, "l2_grads": 1.1693445444107056, "l2_params": 334.26727294921875, "l2_updates": 0.9106389880180359, "training_loss": 3.871471405029297, "uptime": 12856.63654777396, "examples_seen": 34406400.0, "progress": 0.30140746521704026, "epoch": 27.126790212519367, "img/sec/core": 189.71889755931232, "core_hours_Tesla V100-SXM2-32GB": 50.40737463140032, "core_hours": 50.40737463140032}
{"step": 33650, "global_schedule": 0.8718723058700562, "l2_grads": 1.2022645473480225, "l2_params": 334.2095642089844, "l2_updates": 0.9345275163650513, "training_loss": 2.930172920227051, "uptime": 12873.518537833006, "examples_seen": 34457600.0, "progress": 0.3018559882307561, "epoch": 27.167157459859425, "img/sec/core": 189.55111268326488, "core_hours_Tesla V100-SXM2-32GB": 50.482405698329416, "core_hours": 50.482405698329416}
{"step": 33700, "global_schedule": 0.8713544607162476, "l2_grads": 1.2699083089828491, "l2_params": 334.1938171386719, "l2_updates": 0.9438815712928772, "training_loss": 2.9132137298583984, "uptime": 12890.402876562963, "examples_seen": 34508800.0, "progress": 0.30230451124447194, "epoch": 27.207524707199482, "img/sec/core": 189.52474545671564, "core_hours_Tesla V100-SXM2-32GB": 50.55744720379589, "core_hours": 50.55744720379589}
{"step": 33750, "global_schedule": 0.8708357810974121, "l2_grads": 1.193650245666504, "l2_params": 334.1719055175781, "l2_updates": 0.950763463973999, "training_loss": 4.134700298309326, "uptime": 12907.277939849999, "examples_seen": 34560000.0, "progress": 0.3027530342581878, "epoch": 27.24789195453954, "img/sec/core": 189.62891845616628, "core_hours_Tesla V100-SXM2-32GB": 50.6324474850716, "core_hours": 50.6324474850716}
{"step": 33800, "global_schedule": 0.8703161478042603, "l2_grads": 1.42751944065094, "l2_params": 334.1666564941406, "l2_updates": 0.9491329789161682, "training_loss": 2.854513645172119, "uptime": 12924.164110657992, "examples_seen": 34611200.0, "progress": 0.3032015572719036, "epoch": 27.2882592018796, "img/sec/core": 189.504182824284, "core_hours_Tesla V100-SXM2-32GB": 50.70749713310713, "core_hours": 50.70749713310713}
{"step": 33850, "global_schedule": 0.8697956800460815, "l2_grads": 1.2722234725952148, "l2_params": 334.1574401855469, "l2_updates": 0.9421367645263672, "training_loss": 3.1812291145324707, "uptime": 12941.038514686981, "examples_seen": 34662400.0, "progress": 0.30365008028561946, "epoch": 27.32862644921966, "img/sec/core": 189.63632697798164, "core_hours_Tesla V100-SXM2-32GB": 50.78249448434709, "core_hours": 50.78249448434709}
{"step": 33900, "global_schedule": 0.8692743182182312, "l2_grads": 1.0437027215957642, "l2_params": 334.1293029785156, "l2_updates": 0.901251494884491, "training_loss": 4.959499835968018, "uptime": 12957.895722582994, "examples_seen": 34713600.0, "progress": 0.3040986032993353, "epoch": 27.368993696559716, "img/sec/core": 189.82977606610632, "core_hours_Tesla V100-SXM2-32GB": 50.857415408329366, "core_hours": 50.857415408329366}
{"step": 33950, "global_schedule": 0.8687520623207092, "l2_grads": 1.1705952882766724, "l2_params": 334.1079406738281, "l2_updates": 0.9202594757080078, "training_loss": 5.2735161781311035, "uptime": 12974.791225150984, "examples_seen": 34764800.0, "progress": 0.30454712631305114, "epoch": 27.409360943899777, "img/sec/core": 189.39951547003554, "core_hours_Tesla V100-SXM2-32GB": 50.932506530853765, "core_hours": 50.932506530853765}
{"step": 34000, "global_schedule": 0.8682289123535156, "l2_grads": 1.2874363660812378, "l2_params": 334.1109619140625, "l2_updates": 0.9332945346832275, "training_loss": 2.7644543647766113, "uptime": 12991.669475663977, "examples_seen": 34816000.0, "progress": 0.304995649326767, "epoch": 27.449728191239835, "img/sec/core": 189.59310963755536, "core_hours_Tesla V100-SXM2-32GB": 51.00752097757818, "core_hours": 51.00752097757818}
{"step": 34050, "global_schedule": 0.8677049279212952, "l2_grads": 1.3068681955337524, "l2_params": 334.04718017578125, "l2_updates": 0.927302360534668, "training_loss": 2.7958128452301025, "uptime": 13009.136176889006, "examples_seen": 34867200.0, "progress": 0.30544417234048277, "epoch": 27.490095438579893, "img/sec/core": 189.88686589463626, "core_hours_Tesla V100-SXM2-32GB": 51.08241937644961, "core_hours": 51.08241937644961}
{"step": 34100, "global_schedule": 0.8671799898147583, "l2_grads": 1.0403594970703125, "l2_params": 333.9754638671875, "l2_updates": 0.9483596682548523, "training_loss": 4.401976585388184, "uptime": 13026.038718998956, "examples_seen": 34918400.0, "progress": 0.3058926953541986, "epoch": 27.53046268591995, "img/sec/core": 189.32063468229288, "core_hours_Tesla V100-SXM2-32GB": 51.15754178582717, "core_hours": 51.15754178582717}
{"step": 34150, "global_schedule": 0.8666542768478394, "l2_grads": 1.0685713291168213, "l2_params": 333.9342041015625, "l2_updates": 0.9047484993934631, "training_loss": 5.03382682800293, "uptime": 13042.898218088958, "examples_seen": 34969600.0, "progress": 0.30634121836791445, "epoch": 27.57082993326001, "img/sec/core": 189.80397833395156, "core_hours_Tesla V100-SXM2-32GB": 51.23247289289384, "core_hours": 51.23247289289384}
{"step": 34200, "global_schedule": 0.866127610206604, "l2_grads": 1.1445521116256714, "l2_params": 333.9111328125, "l2_updates": 0.9359675645828247, "training_loss": 3.9265522956848145, "uptime": 13059.761371573957, "examples_seen": 35020800.0, "progress": 0.3067897413816303, "epoch": 27.61119718060007, "img/sec/core": 189.7628461275997, "core_hours_Tesla V100-SXM2-32GB": 51.30742024171606, "core_hours": 51.30742024171606}
{"step": 34250, "global_schedule": 0.865600049495697, "l2_grads": 1.4376013278961182, "l2_params": 333.8721618652344, "l2_updates": 0.9063348174095154, "training_loss": 2.8487040996551514, "uptime": 13076.639973260986, "examples_seen": 35072000.0, "progress": 0.30723826439534613, "epoch": 27.651564427940126, "img/sec/core": 189.58916498747408, "core_hours_Tesla V100-SXM2-32GB": 51.38243624921396, "core_hours": 51.38243624921396}
{"step": 34300, "global_schedule": 0.8650716543197632, "l2_grads": 1.2727832794189453, "l2_params": 333.86920166015625, "l2_updates": 0.9205164313316345, "training_loss": 2.6991095542907715, "uptime": 13093.517296014994, "examples_seen": 35123200.0, "progress": 0.30768678740906197, "epoch": 27.691931675280184, "img/sec/core": 189.60353171181217, "core_hours_Tesla V100-SXM2-32GB": 51.45744657256511, "core_hours": 51.45744657256511}
{"step": 34350, "global_schedule": 0.8645423650741577, "l2_grads": 1.448014736175537, "l2_params": 333.83123779296875, "l2_updates": 0.906139612197876, "training_loss": 2.9610843658447266, "uptime": 13110.390721970994, "examples_seen": 35174400.0, "progress": 0.3081353104227778, "epoch": 27.732298922620245, "img/sec/core": 189.64731930221956, "core_hours_Tesla V100-SXM2-32GB": 51.532439576814, "core_hours": 51.532439576814}
{"step": 34400, "global_schedule": 0.8640122413635254, "l2_grads": 1.0567238330841064, "l2_params": 333.7742919921875, "l2_updates": 0.9336071610450745, "training_loss": 5.044434547424316, "uptime": 13127.250438558985, "examples_seen": 35225600.0, "progress": 0.30858383343649365, "epoch": 27.772666169960303, "img/sec/core": 189.8015297765639, "core_hours_Tesla V100-SXM2-32GB": 51.60737165053841, "core_hours": 51.60737165053841}
{"step": 34451, "global_schedule": 0.8634811639785767, "l2_grads": 1.204088568687439, "l2_params": 333.751708984375, "l2_updates": 0.8998978734016418, "training_loss": 3.553016185760498, "uptime": 13144.129102712963, "examples_seen": 35276800.0, "progress": 0.30903235645020943, "epoch": 27.81303341730036, "img/sec/core": 189.5884633290692, "core_hours_Tesla V100-SXM2-32GB": 51.682387935667194, "core_hours": 51.682387935667194}
{"step": 34500, "global_schedule": 0.8629492521286011, "l2_grads": 1.2974696159362793, "l2_params": 333.7332763671875, "l2_updates": 0.9302000403404236, "training_loss": 2.870969533920288, "uptime": 13160.982282362005, "examples_seen": 35328000.0, "progress": 0.3094808794639253, "epoch": 27.85340066464042, "img/sec/core": 189.8751491788565, "core_hours_Tesla V100-SXM2-32GB": 51.757290956329605, "core_hours": 51.757290956329605}
{"step": 34550, "global_schedule": 0.8624165058135986, "l2_grads": 1.3337332010269165, "l2_params": 333.6829528808594, "l2_updates": 0.9136942625045776, "training_loss": 2.867530345916748, "uptime": 13177.868163909996, "examples_seen": 35379200.0, "progress": 0.3099294024776411, "epoch": 27.89376791198048, "img/sec/core": 189.5074290853813, "core_hours_Tesla V100-SXM2-32GB": 51.83233931876512, "core_hours": 51.83233931876512}
{"step": 34600, "global_schedule": 0.8618828654289246, "l2_grads": 1.0319737195968628, "l2_params": 333.61273193359375, "l2_updates": 0.9348747134208679, "training_loss": 5.27267599105835, "uptime": 13194.74098837399, "examples_seen": 35430400.0, "progress": 0.31037792549135695, "epoch": 27.934135159320537, "img/sec/core": 189.65407995731925, "core_hours_Tesla V100-SXM2-32GB": 51.9073296497162, "core_hours": 51.9073296497162}
{"step": 34650, "global_schedule": 0.8613483905792236, "l2_grads": 1.3511408567428589, "l2_params": 333.5768127441406, "l2_updates": 0.9255204200744629, "training_loss": 2.8846960067749023, "uptime": 13211.58565980097, "examples_seen": 35481600.0, "progress": 0.3108264485050728, "epoch": 27.974502406660594, "img/sec/core": 189.9710548746204, "core_hours_Tesla V100-SXM2-32GB": 51.982194856058335, "core_hours": 51.982194856058335}
{"step": 34700, "global_schedule": 0.8608130216598511, "l2_grads": 1.3939001560211182, "l2_params": 333.5478820800781, "l2_updates": 0.9062973856925964, "training_loss": 2.844719886779785, "uptime": 13228.478840934986, "examples_seen": 35532800.0, "progress": 0.31127497151878863, "epoch": 28.014869654000655, "img/sec/core": 189.42554244899614, "core_hours_Tesla V100-SXM2-32GB": 52.05727566109841, "core_hours": 52.05727566109841}
{"step": 34750, "global_schedule": 0.8602767586708069, "l2_grads": 1.2329423427581787, "l2_params": 333.5196838378906, "l2_updates": 0.8695608377456665, "training_loss": 5.371077537536621, "uptime": 13245.34053114499, "examples_seen": 35584000.0, "progress": 0.3117234945325045, "epoch": 28.055236901340713, "img/sec/core": 189.77931394454586, "core_hours_Tesla V100-SXM2-32GB": 52.132216506476205, "core_hours": 52.132216506476205}
{"step": 34800, "global_schedule": 0.8597396612167358, "l2_grads": 1.0642327070236206, "l2_params": 333.4735412597656, "l2_updates": 0.8897727727890015, "training_loss": 5.304316520690918, "uptime": 13262.215102645976, "examples_seen": 35635200.0, "progress": 0.3121720175462203, "epoch": 28.09560414868077, "img/sec/core": 189.63444492874703, "core_hours_Tesla V100-SXM2-32GB": 52.207214602036146, "core_hours": 52.207214602036146}
{"step": 34850, "global_schedule": 0.8592016696929932, "l2_grads": 1.1383475065231323, "l2_params": 333.40948486328125, "l2_updates": 0.9122152328491211, "training_loss": 4.320186614990234, "uptime": 13279.080052096979, "examples_seen": 35686400.0, "progress": 0.31262054055993616, "epoch": 28.13597139602083, "img/sec/core": 189.74263808479628, "core_hours_Tesla V100-SXM2-32GB": 52.28216993292949, "core_hours": 52.28216993292949}
{"step": 34900, "global_schedule": 0.8586628437042236, "l2_grads": 1.2377818822860718, "l2_params": 333.3738098144531, "l2_updates": 0.9251813292503357, "training_loss": 5.380395889282227, "uptime": 13295.944183926971, "examples_seen": 35737600.0, "progress": 0.31306906357365194, "epoch": 28.17633864336089, "img/sec/core": 189.75183734681713, "core_hours_Tesla V100-SXM2-32GB": 52.35712162995167, "core_hours": 52.35712162995167}
{"step": 34950, "global_schedule": 0.8581231832504272, "l2_grads": 1.0467276573181152, "l2_params": 333.32647705078125, "l2_updates": 0.900854766368866, "training_loss": 4.625739574432373, "uptime": 13312.808018023963, "examples_seen": 35788800.0, "progress": 0.3135175865873678, "epoch": 28.216705890700947, "img/sec/core": 189.75518743811637, "core_hours_Tesla V100-SXM2-32GB": 52.43207200371608, "core_hours": 52.43207200371608}
{"step": 35000, "global_schedule": 0.857582688331604, "l2_grads": 1.1151572465896606, "l2_params": 333.3091125488281, "l2_updates": 0.9260320067405701, "training_loss": 4.610676288604736, "uptime": 13329.687874130963, "examples_seen": 35840000.0, "progress": 0.3139661096010836, "epoch": 28.257073138041005, "img/sec/core": 189.57507574208606, "core_hours_Tesla V100-SXM2-32GB": 52.50709358641386, "core_hours": 52.50709358641386, "minival/prec@1": 0.601311270683734, "minival/loss": 1.6660257530629243, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.9384110489627346, "real/prec@1": 0.6467322843051434, "real/loss": 2.539115761927669, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.118649407988414, "train/prec@1": 0.6252195293291184, "train/loss": 1.554523554143417, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.613006127008703, "v2/prec@1": 0.4521, "v2/loss": 2.4956722412109373, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.33062736899592, "val/prec@1": 0.57452, "val/loss": 1.8070985278320313, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.27317323902389}
{"step": 35050, "global_schedule": 0.8570412397384644, "l2_grads": 1.3684974908828735, "l2_params": 333.29010009765625, "l2_updates": 0.9281620979309082, "training_loss": 2.764735698699951, "uptime": 13383.409261421999, "examples_seen": 35891200.0, "progress": 0.31441463261479946, "epoch": 28.297440385381066, "img/sec/core": 189.2325398850846, "core_hours_Tesla V100-SXM2-32GB": 52.58225096807168, "core_hours": 52.58225096807168}
{"step": 35100, "global_schedule": 0.8564990162849426, "l2_grads": 1.3217650651931763, "l2_params": 333.2260437011719, "l2_updates": 0.886804461479187, "training_loss": 2.75142502784729, "uptime": 13400.261204112961, "examples_seen": 35942400.0, "progress": 0.3148631556285153, "epoch": 28.337807632721123, "img/sec/core": 189.88908630196863, "core_hours_Tesla V100-SXM2-32GB": 52.65714849114263, "core_hours": 52.65714849114263}
{"step": 35151, "global_schedule": 0.8559558987617493, "l2_grads": 1.4545389413833618, "l2_params": 333.1733093261719, "l2_updates": 0.8931984901428223, "training_loss": 2.79874849319458, "uptime": 13417.138582835963, "examples_seen": 35993600.0, "progress": 0.31531167864223114, "epoch": 28.37817488006118, "img/sec/core": 189.60290294598573, "core_hours_Tesla V100-SXM2-32GB": 52.73215906324486, "core_hours": 52.73215906324486}
{"step": 35200, "global_schedule": 0.855411946773529, "l2_grads": 1.1158071756362915, "l2_params": 333.10382080078125, "l2_updates": 0.9197524785995483, "training_loss": 3.789405584335327, "uptime": 13433.997504330997, "examples_seen": 36044800.0, "progress": 0.315760201655947, "epoch": 28.41854212740124, "img/sec/core": 189.8104811118972, "core_hours_Tesla V100-SXM2-32GB": 52.80708760322279, "core_hours": 52.80708760322279}
{"step": 35250, "global_schedule": 0.8548671007156372, "l2_grads": 1.3004226684570312, "l2_params": 333.0921325683594, "l2_updates": 0.930529773235321, "training_loss": 3.153702735900879, "uptime": 13450.861669462989, "examples_seen": 36096000.0, "progress": 0.3162087246696628, "epoch": 28.4589093747413, "img/sec/core": 189.75146264011815, "core_hours_Tesla V100-SXM2-32GB": 52.88203944825386, "core_hours": 52.88203944825386}
{"step": 35300, "global_schedule": 0.8543214797973633, "l2_grads": 1.311585545539856, "l2_params": 333.0611572265625, "l2_updates": 0.9179847240447998, "training_loss": 2.851846218109131, "uptime": 13467.738950872968, "examples_seen": 36147200.0, "progress": 0.3166572476833786, "epoch": 28.499276622081357, "img/sec/core": 189.60399618079953, "core_hours_Tesla V100-SXM2-32GB": 52.957049587853774, "core_hours": 52.957049587853774}
{"step": 35350, "global_schedule": 0.8537749648094177, "l2_grads": 1.3560476303100586, "l2_params": 333.01617431640625, "l2_updates": 0.8973658680915833, "training_loss": 2.7331204414367676, "uptime": 13484.627176790964, "examples_seen": 36198400.0, "progress": 0.31710577069709445, "epoch": 28.539643869421415, "img/sec/core": 189.48112226460705, "core_hours_Tesla V100-SXM2-32GB": 53.03210836971153, "core_hours": 53.03210836971153}
{"step": 35400, "global_schedule": 0.8532276153564453, "l2_grads": 1.152038812637329, "l2_params": 332.9967041015625, "l2_updates": 0.9077299237251282, "training_loss": 3.6493098735809326, "uptime": 13501.49365867197, "examples_seen": 36249600.0, "progress": 0.3175542937108103, "epoch": 28.580011116761476, "img/sec/core": 189.72539872725483, "core_hours_Tesla V100-SXM2-32GB": 53.10707051140489, "core_hours": 53.10707051140489}
{"step": 35450, "global_schedule": 0.8526793718338013, "l2_grads": 1.0824713706970215, "l2_params": 332.9464111328125, "l2_updates": 0.9154216051101685, "training_loss": 4.759881973266602, "uptime": 13518.365912534995, "examples_seen": 36300800.0, "progress": 0.3180028167245261, "epoch": 28.620378364101533, "img/sec/core": 189.6604938485893, "core_hours_Tesla V100-SXM2-32GB": 53.182058306351664, "core_hours": 53.182058306351664}
{"step": 35500, "global_schedule": 0.8521303534507751, "l2_grads": 1.3639191389083862, "l2_params": 332.919921875, "l2_updates": 0.9272521138191223, "training_loss": 2.6955130100250244, "uptime": 13535.227950925997, "examples_seen": 36352000.0, "progress": 0.31845133973824197, "epoch": 28.66074561144159, "img/sec/core": 189.77539522787478, "core_hours_Tesla V100-SXM2-32GB": 53.25700069920057, "core_hours": 53.25700069920057}
{"step": 35550, "global_schedule": 0.8515805006027222, "l2_grads": 1.0205241441726685, "l2_params": 332.8822021484375, "l2_updates": 0.9124081134796143, "training_loss": 5.026346683502197, "uptime": 13552.105262003955, "examples_seen": 36403200.0, "progress": 0.3188998627519578, "epoch": 28.70111285878165, "img/sec/core": 189.60366288319238, "core_hours_Tesla V100-SXM2-32GB": 53.33201097065816, "core_hours": 53.33201097065816}
{"step": 35600, "global_schedule": 0.8510297536849976, "l2_grads": 1.1473584175109863, "l2_params": 332.8260192871094, "l2_updates": 0.9057573080062866, "training_loss": 3.3063106536865234, "uptime": 13568.975014514988, "examples_seen": 36454400.0, "progress": 0.31934838576567365, "epoch": 28.74148010612171, "img/sec/core": 189.68861563957103, "core_hours_Tesla V100-SXM2-32GB": 53.406987648484964, "core_hours": 53.406987648484964}
{"step": 35650, "global_schedule": 0.8504781723022461, "l2_grads": 1.0558823347091675, "l2_params": 332.8185729980469, "l2_updates": 0.9009233117103577, "training_loss": 5.1687331199646, "uptime": 13585.835061096994, "examples_seen": 36505600.0, "progress": 0.3197969087793895, "epoch": 28.781847353461767, "img/sec/core": 189.79781487764842, "core_hours_Tesla V100-SXM2-32GB": 53.48192118884944, "core_hours": 53.48192118884944}
{"step": 35700, "global_schedule": 0.8499257564544678, "l2_grads": 1.257375955581665, "l2_params": 332.7896728515625, "l2_updates": 0.8983722925186157, "training_loss": 3.2595322132110596, "uptime": 13602.726625414973, "examples_seen": 36556800.0, "progress": 0.32024543179310533, "epoch": 28.822214600801825, "img/sec/core": 189.44367376288574, "core_hours_Tesla V100-SXM2-32GB": 53.55699480804046, "core_hours": 53.55699480804046}
{"step": 35750, "global_schedule": 0.8493725061416626, "l2_grads": 1.4552958011627197, "l2_params": 332.7403869628906, "l2_updates": 0.8918507695198059, "training_loss": 3.285705089569092, "uptime": 13619.588377873995, "examples_seen": 36608000.0, "progress": 0.3206939548068211, "epoch": 28.862581848141886, "img/sec/core": 189.77861333076848, "core_hours_Tesla V100-SXM2-32GB": 53.63193593008056, "core_hours": 53.63193593008056}
{"step": 35800, "global_schedule": 0.8488184213638306, "l2_grads": 1.2891244888305664, "l2_params": 332.695068359375, "l2_updates": 0.9255093336105347, "training_loss": 2.9279353618621826, "uptime": 13636.464567290968, "examples_seen": 36659200.0, "progress": 0.32114247782053695, "epoch": 28.902949095481944, "img/sec/core": 189.61626472274946, "core_hours_Tesla V100-SXM2-32GB": 53.70694121637822, "core_hours": 53.70694121637822}
{"step": 35850, "global_schedule": 0.8482635021209717, "l2_grads": 1.3842400312423706, "l2_params": 332.6694641113281, "l2_updates": 0.9430692791938782, "training_loss": 2.932666778564453, "uptime": 13653.341278618958, "examples_seen": 36710400.0, "progress": 0.3215910008342528, "epoch": 28.943316342822, "img/sec/core": 189.61040085415192, "core_hours_Tesla V100-SXM2-32GB": 53.78194882228039, "core_hours": 53.78194882228039}
{"step": 35900, "global_schedule": 0.8477076888084412, "l2_grads": 1.3248201608657837, "l2_params": 332.6400451660156, "l2_updates": 0.9195579290390015, "training_loss": 2.7034008502960205, "uptime": 13670.210487817996, "examples_seen": 36761600.0, "progress": 0.32203952384796863, "epoch": 28.98368359016206, "img/sec/core": 189.69472500124732, "core_hours_Tesla V100-SXM2-32GB": 53.85692308538723, "core_hours": 53.85692308538723}
{"step": 35950, "global_schedule": 0.8471511006355286, "l2_grads": 1.33177649974823, "l2_params": 332.5896301269531, "l2_updates": 0.8931276798248291, "training_loss": 2.687859058380127, "uptime": 13687.07518172497, "examples_seen": 36812800.0, "progress": 0.3224880468616845, "epoch": 29.02405083750212, "img/sec/core": 189.7455131798676, "core_hours_Tesla V100-SXM2-32GB": 53.93187728052933, "core_hours": 53.93187728052933}
{"step": 36000, "global_schedule": 0.8465936779975891, "l2_grads": 1.403427004814148, "l2_params": 332.5655517578125, "l2_updates": 0.9217345714569092, "training_loss": 2.803316593170166, "uptime": 13703.937004131963, "examples_seen": 36864000.0, "progress": 0.3229365698754003, "epoch": 29.064418084842178, "img/sec/core": 189.77782607131837, "core_hours_Tesla V100-SXM2-32GB": 54.006818713449306, "core_hours": 54.006818713449306}
{"step": 36050, "global_schedule": 0.8460354208946228, "l2_grads": 1.3212724924087524, "l2_params": 332.5353088378906, "l2_updates": 0.9122871160507202, "training_loss": 2.6320881843566895, "uptime": 13721.612328476971, "examples_seen": 36915200.0, "progress": 0.32338509288911615, "epoch": 29.104785332182235, "img/sec/core": 189.6520939226771, "core_hours_Tesla V100-SXM2-32GB": 54.0818098296983, "core_hours": 54.0818098296983}
{"step": 36100, "global_schedule": 0.8454763293266296, "l2_grads": 1.224621057510376, "l2_params": 332.49920654296875, "l2_updates": 0.9258031249046326, "training_loss": 2.845064163208008, "uptime": 13738.512101039, "examples_seen": 36966400.0, "progress": 0.323833615902832, "epoch": 29.145152579522296, "img/sec/core": 189.3516606957179, "core_hours_Tesla V100-SXM2-32GB": 54.15691992997399, "core_hours": 54.15691992997399}
{"step": 36150, "global_schedule": 0.8449164628982544, "l2_grads": 1.2826989889144897, "l2_params": 332.43524169921875, "l2_updates": 0.9111965298652649, "training_loss": 2.791914463043213, "uptime": 13755.423802735982, "examples_seen": 37017600.0, "progress": 0.32428213891654784, "epoch": 29.185519826862354, "img/sec/core": 189.21809628246086, "core_hours_Tesla V100-SXM2-32GB": 54.232083048627246, "core_hours": 54.232083048627246}
{"step": 36200, "global_schedule": 0.8443557024002075, "l2_grads": 1.3271676301956177, "l2_params": 332.3805847167969, "l2_updates": 0.9119611978530884, "training_loss": 2.7581229209899902, "uptime": 13772.33336887299, "examples_seen": 37068800.0, "progress": 0.3247306619302636, "epoch": 29.22588707420241, "img/sec/core": 189.2419932050452, "core_hours_Tesla V100-SXM2-32GB": 54.307236675902836, "core_hours": 54.307236675902836}
{"step": 36250, "global_schedule": 0.8437941074371338, "l2_grads": 1.3346123695373535, "l2_params": 332.3351745605469, "l2_updates": 0.9022786021232605, "training_loss": 2.740001916885376, "uptime": 13789.250660583959, "examples_seen": 37120000.0, "progress": 0.32517918494397946, "epoch": 29.26625432154247, "img/sec/core": 189.15557257461708, "core_hours_Tesla V100-SXM2-32GB": 54.3824246390627, "core_hours": 54.3824246390627}
{"step": 36300, "global_schedule": 0.843231737613678, "l2_grads": 1.2244969606399536, "l2_params": 332.2819519042969, "l2_updates": 0.8951017260551453, "training_loss": 3.6269917488098145, "uptime": 13806.156821015, "examples_seen": 37171200.0, "progress": 0.3256277079576953, "epoch": 29.30662156888253, "img/sec/core": 189.28011555625437, "core_hours_Tesla V100-SXM2-32GB": 54.457563129867324, "core_hours": 54.457563129867324}
{"step": 36350, "global_schedule": 0.8426685333251953, "l2_grads": 1.1487101316452026, "l2_params": 332.2162780761719, "l2_updates": 0.8861491680145264, "training_loss": 5.26767635345459, "uptime": 13823.049926701991, "examples_seen": 37222400.0, "progress": 0.32607623097141114, "epoch": 29.346988816222588, "img/sec/core": 189.42638845053565, "core_hours_Tesla V100-SXM2-32GB": 54.53264359958728, "core_hours": 54.53264359958728}
{"step": 36400, "global_schedule": 0.842104434967041, "l2_grads": 1.3630813360214233, "l2_params": 332.1636047363281, "l2_updates": 0.9200595021247864, "training_loss": 2.864384889602661, "uptime": 13839.942979755986, "examples_seen": 37273600.0, "progress": 0.326524753985127, "epoch": 29.387356063562645, "img/sec/core": 189.4269786386128, "core_hours_Tesla V100-SXM2-32GB": 54.607723835382814, "core_hours": 54.607723835382814}
{"step": 36450, "global_schedule": 0.8415396213531494, "l2_grads": 1.1944191455841064, "l2_params": 332.1613464355469, "l2_updates": 0.9130608439445496, "training_loss": 5.149999618530273, "uptime": 13856.866132092953, "examples_seen": 37324800.0, "progress": 0.3269732769988428, "epoch": 29.427723310902703, "img/sec/core": 189.0900664535102, "core_hours_Tesla V100-SXM2-32GB": 54.68293784576934, "core_hours": 54.68293784576934}
{"step": 36500, "global_schedule": 0.840973973274231, "l2_grads": 1.3294789791107178, "l2_params": 332.135498046875, "l2_updates": 0.9148823022842407, "training_loss": 2.89396071434021, "uptime": 13873.77894407796, "examples_seen": 37376000.0, "progress": 0.32742180001255866, "epoch": 29.468090558242764, "img/sec/core": 189.20567454051076, "core_hours_Tesla V100-SXM2-32GB": 54.75810589903604, "core_hours": 54.75810589903604}
{"step": 36550, "global_schedule": 0.8404074907302856, "l2_grads": 1.150739312171936, "l2_params": 332.1100158691406, "l2_updates": 0.9232209920883179, "training_loss": 3.369813919067383, "uptime": 13890.691562096996, "examples_seen": 37427200.0, "progress": 0.3278703230262745, "epoch": 29.50845780558282, "img/sec/core": 189.207844486184, "core_hours_Tesla V100-SXM2-32GB": 54.83327309023175, "core_hours": 54.83327309023175}
{"step": 36600, "global_schedule": 0.8398401737213135, "l2_grads": 1.3648289442062378, "l2_params": 332.1015625, "l2_updates": 0.8933337926864624, "training_loss": 2.7998745441436768, "uptime": 13907.602371436951, "examples_seen": 37478400.0, "progress": 0.3283188460399903, "epoch": 29.54882505292288, "img/sec/core": 189.22808102621718, "core_hours_Tesla V100-SXM2-32GB": 54.90843224285378, "core_hours": 54.90843224285378}
{"step": 36650, "global_schedule": 0.8392720222473145, "l2_grads": 1.3347136974334717, "l2_params": 332.05511474609375, "l2_updates": 0.8853026032447815, "training_loss": 2.938445568084717, "uptime": 13924.495815025002, "examples_seen": 37529600.0, "progress": 0.3287673690537061, "epoch": 29.58919230026294, "img/sec/core": 189.4225995618447, "core_hours_Tesla V100-SXM2-32GB": 54.98351421435622, "core_hours": 54.98351421435622}
{"step": 36700, "global_schedule": 0.8387030959129333, "l2_grads": 1.4210482835769653, "l2_params": 331.97271728515625, "l2_updates": 0.8813541531562805, "training_loss": 2.9157259464263916, "uptime": 13941.391691978963, "examples_seen": 37580800.0, "progress": 0.32921589206742197, "epoch": 29.629559547602998, "img/sec/core": 189.39531867565591, "core_hours_Tesla V100-SXM2-32GB": 55.05860700081827, "core_hours": 55.05860700081827}
{"step": 36750, "global_schedule": 0.8381333351135254, "l2_grads": 1.3222728967666626, "l2_params": 331.9195861816406, "l2_updates": 0.8987774848937988, "training_loss": 2.6630616188049316, "uptime": 13958.310628163978, "examples_seen": 37632000.0, "progress": 0.3296644150811378, "epoch": 29.669926794943056, "img/sec/core": 189.13718717340157, "core_hours_Tesla V100-SXM2-32GB": 55.13380227275167, "core_hours": 55.13380227275167}
{"step": 36800, "global_schedule": 0.8375627994537354, "l2_grads": 1.1012178659439087, "l2_params": 331.9072570800781, "l2_updates": 0.8743176460266113, "training_loss": 5.2556562423706055, "uptime": 13975.19972121995, "examples_seen": 37683200.0, "progress": 0.33011293809485365, "epoch": 29.710294042283113, "img/sec/core": 189.47139372107944, "core_hours_Tesla V100-SXM2-32GB": 55.20886490855599, "core_hours": 55.20886490855599}
{"step": 36850, "global_schedule": 0.8369914293289185, "l2_grads": 1.183165431022644, "l2_params": 331.8417053222656, "l2_updates": 0.8456599116325378, "training_loss": 5.206022262573242, "uptime": 13992.122522357968, "examples_seen": 37734400.0, "progress": 0.3305614611085695, "epoch": 29.750661289623174, "img/sec/core": 189.09399064029512, "core_hours_Tesla V100-SXM2-32GB": 55.28407735805829, "core_hours": 55.28407735805829}
{"step": 36900, "global_schedule": 0.8364192843437195, "l2_grads": 1.3381667137145996, "l2_params": 331.776123046875, "l2_updates": 0.9112467765808105, "training_loss": 2.847719430923462, "uptime": 14009.025966667978, "examples_seen": 37785600.0, "progress": 0.33100998412228533, "epoch": 29.791028536963232, "img/sec/core": 189.3105299317614, "core_hours_Tesla V100-SXM2-32GB": 55.35920377721389, "core_hours": 55.35920377721389}
{"step": 36950, "global_schedule": 0.8358463048934937, "l2_grads": 1.3964855670928955, "l2_params": 331.7584533691406, "l2_updates": 0.8980711698532104, "training_loss": 2.809662342071533, "uptime": 14025.935942069977, "examples_seen": 37836800.0, "progress": 0.33145850713600117, "epoch": 29.83139578430329, "img/sec/core": 189.23741306103386, "core_hours_Tesla V100-SXM2-32GB": 55.43435922344499, "core_hours": 55.43435922344499}
{"step": 37000, "global_schedule": 0.8352725505828857, "l2_grads": 1.302534580230713, "l2_params": 331.7004699707031, "l2_updates": 0.887507975101471, "training_loss": 2.769867181777954, "uptime": 14042.848016200995, "examples_seen": 37888000.0, "progress": 0.331907030149717, "epoch": 29.87176303164335, "img/sec/core": 189.21392936251144, "core_hours_Tesla V100-SXM2-32GB": 55.50952399736063, "core_hours": 55.50952399736063}
{"step": 37050, "global_schedule": 0.834697961807251, "l2_grads": 1.4178881645202637, "l2_params": 331.6567687988281, "l2_updates": 0.8892791867256165, "training_loss": 2.7789530754089355, "uptime": 14060.234802058956, "examples_seen": 37939200.0, "progress": 0.3323555531634328, "epoch": 29.91213027898341, "img/sec/core": 189.6257474317871, "core_hours_Tesla V100-SXM2-32GB": 55.58452553283165, "core_hours": 55.58452553283165}
{"step": 37100, "global_schedule": 0.8341225385665894, "l2_grads": 1.3624643087387085, "l2_params": 331.5822448730469, "l2_updates": 0.8939524292945862, "training_loss": 2.814027786254883, "uptime": 14077.113495220954, "examples_seen": 37990400.0, "progress": 0.33280407617714863, "epoch": 29.952497526323466, "img/sec/core": 189.58813749898238, "core_hours_Tesla V100-SXM2-32GB": 55.659541946884964, "core_hours": 55.659541946884964}
{"step": 37150, "global_schedule": 0.8335464000701904, "l2_grads": 1.2636171579360962, "l2_params": 331.52264404296875, "l2_updates": 0.9026963114738464, "training_loss": 3.320547580718994, "uptime": 14093.98896832799, "examples_seen": 38041600.0, "progress": 0.3332525991908645, "epoch": 29.992864773663523, "img/sec/core": 189.62431332758763, "core_hours_Tesla V100-SXM2-32GB": 55.734544049582915, "core_hours": 55.734544049582915}
{"step": 37200, "global_schedule": 0.8329693675041199, "l2_grads": 1.310965657234192, "l2_params": 331.4909362792969, "l2_updates": 0.8911045789718628, "training_loss": 2.759708881378174, "uptime": 14110.879861972993, "examples_seen": 38092800.0, "progress": 0.3337011222045803, "epoch": 30.033232021003585, "img/sec/core": 189.45119584876323, "core_hours_Tesla V100-SXM2-32GB": 55.80961468800514, "core_hours": 55.80961468800514}
{"step": 37250, "global_schedule": 0.832391619682312, "l2_grads": 1.2901182174682617, "l2_params": 331.4480285644531, "l2_updates": 0.9063751697540283, "training_loss": 2.6569035053253174, "uptime": 14127.746915237978, "examples_seen": 38144000.0, "progress": 0.33414964521829615, "epoch": 30.073599268343642, "img/sec/core": 189.71897163821947, "core_hours_Tesla V100-SXM2-32GB": 55.88457936918285, "core_hours": 55.88457936918285}
{"step": 37300, "global_schedule": 0.8318129777908325, "l2_grads": 1.2385015487670898, "l2_params": 331.4114685058594, "l2_updates": 0.8853996992111206, "training_loss": 3.9446630477905273, "uptime": 14144.634477120999, "examples_seen": 38195200.0, "progress": 0.334598168232012, "epoch": 30.1139665156837, "img/sec/core": 189.4885728423229, "core_hours_Tesla V100-SXM2-32GB": 55.959635199774056, "core_hours": 55.959635199774056}
{"step": 37350, "global_schedule": 0.8312336206436157, "l2_grads": 1.3301935195922852, "l2_params": 331.3743591308594, "l2_updates": 0.8972116112709045, "training_loss": 2.690673589706421, "uptime": 14161.508745533996, "examples_seen": 38246400.0, "progress": 0.33504669124572783, "epoch": 30.15433376302376, "img/sec/core": 189.63785105700853, "core_hours_Tesla V100-SXM2-32GB": 56.034631948276264, "core_hours": 56.034631948276264}
{"step": 37400, "global_schedule": 0.8306534886360168, "l2_grads": 1.1096951961517334, "l2_params": 331.29833984375, "l2_updates": 0.9065558910369873, "training_loss": 3.382768154144287, "uptime": 14178.380519654951, "examples_seen": 38297600.0, "progress": 0.3354952142594437, "epoch": 30.19470101036382, "img/sec/core": 189.6658867679831, "core_hours_Tesla V100-SXM2-32GB": 56.109617611036064, "core_hours": 56.109617611036064}
{"step": 37450, "global_schedule": 0.8300725221633911, "l2_grads": 1.1188225746154785, "l2_params": 331.270263671875, "l2_updates": 0.8795729875564575, "training_loss": 4.952387809753418, "uptime": 14195.26427270897, "examples_seen": 38348800.0, "progress": 0.33594373727315946, "epoch": 30.235068257703876, "img/sec/core": 189.53131982929293, "core_hours_Tesla V100-SXM2-32GB": 56.18465651349837, "core_hours": 56.18465651349837}
{"step": 37500, "global_schedule": 0.8294907808303833, "l2_grads": 1.3559592962265015, "l2_params": 331.2540283203125, "l2_updates": 0.8944805860519409, "training_loss": 2.897911787033081, "uptime": 14212.140297646984, "examples_seen": 38400000.0, "progress": 0.3363922602868753, "epoch": 30.275435505043934, "img/sec/core": 189.61811278151654, "core_hours_Tesla V100-SXM2-32GB": 56.259661068778435, "core_hours": 56.259661068778435, "minival/prec@1": 0.6180924133624727, "minival/loss": 1.6669723887090715, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.935794460994657, "real/prec@1": 0.6621474475307983, "real/loss": 2.5067530890875536, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.15557910403004, "train/prec@1": 0.6410646684619288, "train/loss": 1.5596389504016452, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.584750227048062, "v2/prec@1": 0.4692, "v2/loss": 2.4540976440429687, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.39485376898665, "val/prec@1": 0.58752, "val/loss": 1.8039443237304686, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.25361597497249}
{"step": 37550, "global_schedule": 0.8289082050323486, "l2_grads": 1.3102880716323853, "l2_params": 331.2154846191406, "l2_updates": 0.8875637054443359, "training_loss": 2.667922258377075, "uptime": 14265.364851281978, "examples_seen": 38451200.0, "progress": 0.33684078330059114, "epoch": 30.315802752383995, "img/sec/core": 189.3707380273123, "core_hours_Tesla V100-SXM2-32GB": 56.33476360241365, "core_hours": 56.33476360241365}
{"step": 37600, "global_schedule": 0.8283249139785767, "l2_grads": 1.3189893960952759, "l2_params": 331.1562805175781, "l2_updates": 0.8906012177467346, "training_loss": 2.828674793243408, "uptime": 14282.232676215994, "examples_seen": 38502400.0, "progress": 0.337289306314307, "epoch": 30.356169999724052, "img/sec/core": 189.71029237722917, "core_hours_Tesla V100-SXM2-32GB": 56.4097317132315, "core_hours": 56.4097317132315}
{"step": 37650, "global_schedule": 0.8277407884597778, "l2_grads": 1.2834794521331787, "l2_params": 331.1200256347656, "l2_updates": 0.8832756876945496, "training_loss": 2.562587261199951, "uptime": 14299.101023519004, "examples_seen": 38553600.0, "progress": 0.3377378293280228, "epoch": 30.39653724706411, "img/sec/core": 189.7044175411832, "core_hours_Tesla V100-SXM2-32GB": 56.48470214568932, "core_hours": 56.48470214568932}
{"step": 37700, "global_schedule": 0.8271559476852417, "l2_grads": 1.1537808179855347, "l2_params": 331.0791320800781, "l2_updates": 0.8605014085769653, "training_loss": 5.22415828704834, "uptime": 14315.941831859003, "examples_seen": 38604800.0, "progress": 0.33818635234173866, "epoch": 30.436904494404168, "img/sec/core": 190.0146320411232, "core_hours_Tesla V100-SXM2-32GB": 56.559550182755984, "core_hours": 56.559550182755984}
{"step": 37750, "global_schedule": 0.8265702128410339, "l2_grads": 1.1543257236480713, "l2_params": 331.03240966796875, "l2_updates": 0.8856131434440613, "training_loss": 4.4966139793396, "uptime": 14332.813728098, "examples_seen": 38656000.0, "progress": 0.3386348753554545, "epoch": 30.47727174174423, "img/sec/core": 189.66451397463808, "core_hours_Tesla V100-SXM2-32GB": 56.63453638826264, "core_hours": 56.63453638826264}
{"step": 37800, "global_schedule": 0.8259837627410889, "l2_grads": 1.6054397821426392, "l2_params": 331.00823974609375, "l2_updates": 0.8510372042655945, "training_loss": 2.7968337535858154, "uptime": 14349.671104367997, "examples_seen": 38707200.0, "progress": 0.33908339836917034, "epoch": 30.517638989084286, "img/sec/core": 189.82788001805264, "core_hours_Tesla V100-SXM2-32GB": 56.70945806057374, "core_hours": 56.70945806057374}
{"step": 37850, "global_schedule": 0.8253965377807617, "l2_grads": 1.324654459953308, "l2_params": 330.93780517578125, "l2_updates": 0.9002436399459839, "training_loss": 2.918762683868408, "uptime": 14366.545166597003, "examples_seen": 38758400.0, "progress": 0.3395319213828862, "epoch": 30.558006236424344, "img/sec/core": 189.64016823994407, "core_hours_Tesla V100-SXM2-32GB": 56.78445389270265, "core_hours": 56.78445389270265}
{"step": 37900, "global_schedule": 0.8248084783554077, "l2_grads": 1.361767053604126, "l2_params": 330.8916931152344, "l2_updates": 0.8960312604904175, "training_loss": 2.664393901824951, "uptime": 14383.42795572296, "examples_seen": 38809600.0, "progress": 0.33998044439660197, "epoch": 30.598373483764405, "img/sec/core": 189.54214117855938, "core_hours_Tesla V100-SXM2-32GB": 56.85948851104024, "core_hours": 56.85948851104024}
{"step": 37950, "global_schedule": 0.8242197036743164, "l2_grads": 1.2924487590789795, "l2_params": 330.872802734375, "l2_updates": 0.8840457201004028, "training_loss": 5.006996154785156, "uptime": 14400.28912339796, "examples_seen": 38860800.0, "progress": 0.3404289674103178, "epoch": 30.638740731104463, "img/sec/core": 189.78519528896643, "core_hours_Tesla V100-SXM2-32GB": 56.93442703404024, "core_hours": 56.93442703404024}
{"step": 38000, "global_schedule": 0.8236300945281982, "l2_grads": 1.2942183017730713, "l2_params": 330.8389892578125, "l2_updates": 0.8522926568984985, "training_loss": 3.610104560852051, "uptime": 14417.15976409195, "examples_seen": 38912000.0, "progress": 0.34087749042403365, "epoch": 30.67910797844452, "img/sec/core": 189.67862916671186, "core_hours_Tesla V100-SXM2-32GB": 57.009407659346856, "core_hours": 57.009407659346856}
{"step": 38050, "global_schedule": 0.8230397701263428, "l2_grads": 1.1078100204467773, "l2_params": 330.7674865722656, "l2_updates": 0.8829504251480103, "training_loss": 3.727153778076172, "uptime": 14434.527549146966, "examples_seen": 38963200.0, "progress": 0.3413260134377495, "epoch": 30.719475225784578, "img/sec/core": 189.7893841886668, "core_hours_Tesla V100-SXM2-32GB": 57.084344528355736, "core_hours": 57.084344528355736}
{"step": 38100, "global_schedule": 0.8224486112594604, "l2_grads": 1.3185120820999146, "l2_params": 330.7107849121094, "l2_updates": 0.8803793787956238, "training_loss": 2.6181421279907227, "uptime": 14451.378114921972, "examples_seen": 39014400.0, "progress": 0.3417745364514653, "epoch": 30.75984247312464, "img/sec/core": 189.9046027728263, "core_hours_Tesla V100-SXM2-32GB": 57.15923593180022, "core_hours": 57.15923593180022}
{"step": 38150, "global_schedule": 0.8218567371368408, "l2_grads": 1.45357346534729, "l2_params": 330.6632995605469, "l2_updates": 0.8747252225875854, "training_loss": 2.854543447494507, "uptime": 14468.24450064596, "examples_seen": 39065600.0, "progress": 0.34222305946518117, "epoch": 30.800209720464697, "img/sec/core": 189.72648037147815, "core_hours_Tesla V100-SXM2-32GB": 57.23419764612905, "core_hours": 57.23419764612905}
{"step": 38200, "global_schedule": 0.8212640285491943, "l2_grads": 1.3657623529434204, "l2_params": 330.6037292480469, "l2_updates": 0.8540794849395752, "training_loss": 2.7064149379730225, "uptime": 14485.108913464996, "examples_seen": 39116800.0, "progress": 0.342671582478897, "epoch": 30.840576967804754, "img/sec/core": 189.74867576700134, "core_hours_Tesla V100-SXM2-32GB": 57.309150591991425, "core_hours": 57.309150591991425}
{"step": 38250, "global_schedule": 0.8206706047058105, "l2_grads": 1.1601225137710571, "l2_params": 330.55267333984375, "l2_updates": 0.9069470167160034, "training_loss": 3.426513671875, "uptime": 14501.999327773985, "examples_seen": 39168000.0, "progress": 0.34312010549261285, "epoch": 30.880944215144815, "img/sec/core": 189.4565723172874, "core_hours_Tesla V100-SXM2-32GB": 57.38421910003138, "core_hours": 57.38421910003138}
{"step": 38300, "global_schedule": 0.8200763463973999, "l2_grads": 1.2749028205871582, "l2_params": 330.52264404296875, "l2_updates": 0.9041992425918579, "training_loss": 2.722012996673584, "uptime": 14518.867485619965, "examples_seen": 39219200.0, "progress": 0.34356862850632863, "epoch": 30.921311462484873, "img/sec/core": 189.70654823239138, "core_hours_Tesla V100-SXM2-32GB": 57.45918869045796, "core_hours": 57.45918869045796}
{"step": 38350, "global_schedule": 0.819481372833252, "l2_grads": 1.3052853345870972, "l2_params": 330.4791259765625, "l2_updates": 0.8832526803016663, "training_loss": 2.849329948425293, "uptime": 14535.737390849972, "examples_seen": 39270400.0, "progress": 0.3440171515200445, "epoch": 30.96167870982493, "img/sec/core": 189.68689843663375, "core_hours_Tesla V100-SXM2-32GB": 57.53416604703577, "core_hours": 57.53416604703577}
{"step": 38400, "global_schedule": 0.8188856244087219, "l2_grads": 1.1767778396606445, "l2_params": 330.42431640625, "l2_updates": 0.8936707377433777, "training_loss": 3.4941158294677734, "uptime": 14552.606514393992, "examples_seen": 39321600.0, "progress": 0.3444656745337603, "epoch": 31.002045957164988, "img/sec/core": 189.69568819918678, "core_hours_Tesla V100-SXM2-32GB": 57.60913992945363, "core_hours": 57.60913992945363}
{"step": 38450, "global_schedule": 0.8182891607284546, "l2_grads": 1.1377671957015991, "l2_params": 330.3656921386719, "l2_updates": 0.8659805655479431, "training_loss": 4.538954734802246, "uptime": 14569.47660737997, "examples_seen": 39372800.0, "progress": 0.34491419754747615, "epoch": 31.04241320450505, "img/sec/core": 189.68478731326252, "core_hours_Tesla V100-SXM2-32GB": 57.68411812050242, "core_hours": 57.68411812050242}
{"step": 38500, "global_schedule": 0.8176918625831604, "l2_grads": 1.4298672676086426, "l2_params": 330.35272216796875, "l2_updates": 0.8730778694152832, "training_loss": 2.907156467437744, "uptime": 14586.358478203998, "examples_seen": 39424000.0, "progress": 0.345362720561192, "epoch": 31.082780451845107, "img/sec/core": 189.55245146440132, "core_hours_Tesla V100-SXM2-32GB": 57.75914865749811, "core_hours": 57.75914865749811}
{"step": 38550, "global_schedule": 0.8170937299728394, "l2_grads": 1.3265457153320312, "l2_params": 330.2950744628906, "l2_updates": 0.8774410486221313, "training_loss": 2.8224358558654785, "uptime": 14603.207405130961, "examples_seen": 39475200.0, "progress": 0.34581124357490783, "epoch": 31.123147699185164, "img/sec/core": 189.92307426291333, "core_hours_Tesla V100-SXM2-32GB": 57.8340327771735, "core_hours": 57.8340327771735}
{"step": 38600, "global_schedule": 0.8164949417114258, "l2_grads": 1.2569929361343384, "l2_params": 330.2086181640625, "l2_updates": 0.8524842262268066, "training_loss": 4.632964134216309, "uptime": 14620.096124731994, "examples_seen": 39526400.0, "progress": 0.3462597665886237, "epoch": 31.163514946525222, "img/sec/core": 189.47558344235352, "core_hours_Tesla V100-SXM2-32GB": 57.90909375317809, "core_hours": 57.90909375317809}
{"step": 38650, "global_schedule": 0.8158954381942749, "l2_grads": 1.401296854019165, "l2_params": 330.15570068359375, "l2_updates": 0.8902603387832642, "training_loss": 2.67935848236084, "uptime": 14636.960493933992, "examples_seen": 39577600.0, "progress": 0.3467082896023395, "epoch": 31.203882193865283, "img/sec/core": 189.74916652209717, "core_hours_Tesla V100-SXM2-32GB": 57.98404650518697, "core_hours": 57.98404650518697}
{"step": 38700, "global_schedule": 0.8152951002120972, "l2_grads": 1.0741937160491943, "l2_params": 330.1109313964844, "l2_updates": 0.8636539578437805, "training_loss": 4.0752458572387695, "uptime": 14653.833762720984, "examples_seen": 39628800.0, "progress": 0.34715681261605535, "epoch": 31.24424944120534, "img/sec/core": 189.6490858052873, "core_hours_Tesla V100-SXM2-32GB": 58.059038810906934, "core_hours": 58.059038810906934}
{"step": 38750, "global_schedule": 0.8146940469741821, "l2_grads": 1.1582998037338257, "l2_params": 330.076904296875, "l2_updates": 0.8795880079269409, "training_loss": 5.116110801696777, "uptime": 14670.708110736974, "examples_seen": 39680000.0, "progress": 0.34760533562977114, "epoch": 31.2846166885454, "img/sec/core": 189.6369564600472, "core_hours_Tesla V100-SXM2-32GB": 58.13403591320022, "core_hours": 58.13403591320022}
{"step": 38801, "global_schedule": 0.8140922784805298, "l2_grads": 1.348652720451355, "l2_params": 330.03314208984375, "l2_updates": 0.8746715188026428, "training_loss": 2.6895103454589844, "uptime": 14687.589733714005, "examples_seen": 39731200.0, "progress": 0.348053858643487, "epoch": 31.32498393588546, "img/sec/core": 189.5552343725427, "core_hours_Tesla V100-SXM2-32GB": 58.20906534865369, "core_hours": 58.20906534865369}
{"step": 38851, "global_schedule": 0.8134896755218506, "l2_grads": 1.2296072244644165, "l2_params": 329.9488830566406, "l2_updates": 0.8343518376350403, "training_loss": 5.099783420562744, "uptime": 14704.463961915986, "examples_seen": 39782400.0, "progress": 0.3485023816572028, "epoch": 31.365351183225517, "img/sec/core": 189.63830296097896, "core_hours_Tesla V100-SXM2-32GB": 58.28406191844028, "core_hours": 58.28406191844028}
{"step": 38900, "global_schedule": 0.8128863573074341, "l2_grads": 1.0908396244049072, "l2_params": 329.9168395996094, "l2_updates": 0.8700147271156311, "training_loss": 4.113882064819336, "uptime": 14721.347033548984, "examples_seen": 39833600.0, "progress": 0.34895090467091866, "epoch": 31.405718430565575, "img/sec/core": 189.53896954068887, "core_hours_Tesla V100-SXM2-32GB": 58.359097792364715, "core_hours": 58.359097792364715}
{"step": 38950, "global_schedule": 0.8122823238372803, "l2_grads": 1.3709869384765625, "l2_params": 329.8739013671875, "l2_updates": 0.8576440811157227, "training_loss": 3.1600492000579834, "uptime": 14738.229690720967, "examples_seen": 39884800.0, "progress": 0.3493994276846345, "epoch": 31.446085677905632, "img/sec/core": 189.54362263010967, "core_hours_Tesla V100-SXM2-32GB": 58.4341318242402, "core_hours": 58.4341318242402}
{"step": 39000, "global_schedule": 0.8116774559020996, "l2_grads": 1.4084360599517822, "l2_params": 329.78826904296875, "l2_updates": 0.8551872968673706, "training_loss": 2.676300287246704, "uptime": 14755.089860812994, "examples_seen": 39936000.0, "progress": 0.34984795069835034, "epoch": 31.486452925245693, "img/sec/core": 189.79642450424575, "core_hours_Tesla V100-SXM2-32GB": 58.50906591353809, "core_hours": 58.50906591353809}
{"step": 39050, "global_schedule": 0.8110718727111816, "l2_grads": 1.340925693511963, "l2_params": 329.7518005371094, "l2_updates": 0.8801060318946838, "training_loss": 2.7394790649414062, "uptime": 14772.522277269978, "examples_seen": 39987200.0, "progress": 0.3502964737120662, "epoch": 31.52682017258575, "img/sec/core": 189.67123492266774, "core_hours_Tesla V100-SXM2-32GB": 58.58404946192918, "core_hours": 58.58404946192918}
{"step": 39100, "global_schedule": 0.8104655742645264, "l2_grads": 1.2147583961486816, "l2_params": 329.6763610839844, "l2_updates": 0.8624186515808105, "training_loss": 3.2186779975891113, "uptime": 14789.412811909977, "examples_seen": 40038400.0, "progress": 0.350744996725782, "epoch": 31.56718741992581, "img/sec/core": 189.45522259680388, "core_hours_Tesla V100-SXM2-32GB": 58.659118504773616, "core_hours": 58.659118504773616}
{"step": 39150, "global_schedule": 0.8098585605621338, "l2_grads": 1.311597228050232, "l2_params": 329.613525390625, "l2_updates": 0.8896142244338989, "training_loss": 3.041043758392334, "uptime": 14806.282248114992, "examples_seen": 40089600.0, "progress": 0.35119351973949786, "epoch": 31.60755466726587, "img/sec/core": 189.69217234708742, "core_hours_Tesla V100-SXM2-32GB": 58.73409377679591, "core_hours": 58.73409377679591}
{"step": 39201, "global_schedule": 0.8092507123947144, "l2_grads": 1.2636643648147583, "l2_params": 329.5960693359375, "l2_updates": 0.8751349449157715, "training_loss": 2.6402392387390137, "uptime": 14823.179532333976, "examples_seen": 40140800.0, "progress": 0.35164204275321365, "epoch": 31.647921914605927, "img/sec/core": 189.37954517004331, "core_hours_Tesla V100-SXM2-32GB": 58.809192817769166, "core_hours": 58.809192817769166}
{"step": 39250, "global_schedule": 0.8086421489715576, "l2_grads": 1.3800384998321533, "l2_params": 329.55035400390625, "l2_updates": 0.8535280227661133, "training_loss": 2.756124496459961, "uptime": 14840.065646973962, "examples_seen": 40192000.0, "progress": 0.3520905657669295, "epoch": 31.688289161945985, "img/sec/core": 189.50481316894025, "core_hours_Tesla V100-SXM2-32GB": 58.88424221616911, "core_hours": 58.88424221616911}
{"step": 39300, "global_schedule": 0.8080328702926636, "l2_grads": 1.2868928909301758, "l2_params": 329.4920654296875, "l2_updates": 0.8836904168128967, "training_loss": 4.435753345489502, "uptime": 14856.943688809988, "examples_seen": 40243200.0, "progress": 0.3525390887806453, "epoch": 31.728656409286042, "img/sec/core": 189.59545373146895, "core_hours_Tesla V100-SXM2-32GB": 58.95925573544034, "core_hours": 58.95925573544034}
{"step": 39350, "global_schedule": 0.8074228763580322, "l2_grads": 1.1744093894958496, "l2_params": 329.4613952636719, "l2_updates": 0.8699439764022827, "training_loss": 3.8953537940979004, "uptime": 14873.834635484964, "examples_seen": 40294400.0, "progress": 0.35298761179436117, "epoch": 31.769023656626104, "img/sec/core": 189.4506010572453, "core_hours_Tesla V100-SXM2-32GB": 59.03432660955134, "core_hours": 59.03432660955134}
{"step": 39400, "global_schedule": 0.8068121671676636, "l2_grads": 1.2620035409927368, "l2_params": 329.42547607421875, "l2_updates": 0.9012504816055298, "training_loss": 2.729684591293335, "uptime": 14890.723119720991, "examples_seen": 40345600.0, "progress": 0.353436134808077, "epoch": 31.80939090396616, "img/sec/core": 189.47822405361626, "core_hours_Tesla V100-SXM2-32GB": 59.109386539489236, "core_hours": 59.109386539489236}
{"step": 39450, "global_schedule": 0.8062006235122681, "l2_grads": 1.4602471590042114, "l2_params": 329.366943359375, "l2_updates": 0.8549063801765442, "training_loss": 2.6930079460144043, "uptime": 14907.609231305949, "examples_seen": 40396800.0, "progress": 0.35388465782179285, "epoch": 31.84975815130622, "img/sec/core": 189.5048474540812, "core_hours_Tesla V100-SXM2-32GB": 59.18443592431127, "core_hours": 59.18443592431127}
{"step": 39500, "global_schedule": 0.80558842420578, "l2_grads": 1.221256136894226, "l2_params": 329.30987548828125, "l2_updates": 0.8777482509613037, "training_loss": 3.262638807296753, "uptime": 14924.491515117988, "examples_seen": 40448000.0, "progress": 0.3543331808355087, "epoch": 31.89012539864628, "img/sec/core": 189.54781447981185, "core_hours_Tesla V100-SXM2-32GB": 59.259468296809224, "core_hours": 59.259468296809224}
{"step": 39550, "global_schedule": 0.8049754500389099, "l2_grads": 1.3977652788162231, "l2_params": 329.2573547363281, "l2_updates": 0.8613956570625305, "training_loss": 2.8400304317474365, "uptime": 14941.370332484948, "examples_seen": 40499200.0, "progress": 0.35478170384922453, "epoch": 31.930492645986337, "img/sec/core": 189.58674239013612, "core_hours_Tesla V100-SXM2-32GB": 59.334485262884606, "core_hours": 59.334485262884606}
{"step": 39600, "global_schedule": 0.8043618202209473, "l2_grads": 1.4353976249694824, "l2_params": 329.2289123535156, "l2_updates": 0.8570398092269897, "training_loss": 2.7845096588134766, "uptime": 14958.25606648199, "examples_seen": 40550400.0, "progress": 0.3552302268629403, "epoch": 31.970859893326395, "img/sec/core": 189.5090850395133, "core_hours_Tesla V100-SXM2-32GB": 59.40953296953812, "core_hours": 59.40953296953812}
{"step": 39650, "global_schedule": 0.8037473559379578, "l2_grads": 1.3276907205581665, "l2_params": 329.15435791015625, "l2_updates": 0.8655616044998169, "training_loss": 2.9261388778686523, "uptime": 14975.15617534495, "examples_seen": 40601600.0, "progress": 0.35567874987665615, "epoch": 32.011227140666456, "img/sec/core": 189.34789272355374, "core_hours_Tesla V100-SXM2-32GB": 59.484644564484604, "core_hours": 59.484644564484604}
{"step": 39700, "global_schedule": 0.803132176399231, "l2_grads": 1.2103543281555176, "l2_params": 329.1150207519531, "l2_updates": 0.8729232549667358, "training_loss": 4.676544189453125, "uptime": 14992.03030583798, "examples_seen": 40652800.0, "progress": 0.356127272890372, "epoch": 32.051594388006514, "img/sec/core": 189.6394010536896, "core_hours_Tesla V100-SXM2-32GB": 59.55964070000918, "core_hours": 59.55964070000918}
{"step": 39750, "global_schedule": 0.8025163412094116, "l2_grads": 1.2937859296798706, "l2_params": 329.0769348144531, "l2_updates": 0.8330951929092407, "training_loss": 3.1191985607147217, "uptime": 15008.90696525696, "examples_seen": 40704000.0, "progress": 0.35657579590408783, "epoch": 32.09196163534657, "img/sec/core": 189.6109840553611, "core_hours_Tesla V100-SXM2-32GB": 59.63464807520465, "core_hours": 59.63464807520465}
{"step": 39800, "global_schedule": 0.801899790763855, "l2_grads": 1.4541430473327637, "l2_params": 329.02911376953125, "l2_updates": 0.8434576392173767, "training_loss": 2.6735310554504395, "uptime": 15025.79152400198, "examples_seen": 40755200.0, "progress": 0.3570243189178037, "epoch": 32.13232888268663, "img/sec/core": 189.52227584531317, "core_hours_Tesla V100-SXM2-32GB": 59.70969055851585, "core_hours": 59.70969055851585}
{"step": 39850, "global_schedule": 0.8012824058532715, "l2_grads": 1.1141263246536255, "l2_params": 328.9828186035156, "l2_updates": 0.8498576879501343, "training_loss": 4.797276020050049, "uptime": 15042.690917242959, "examples_seen": 40806400.0, "progress": 0.3574728419315195, "epoch": 32.17269613002669, "img/sec/core": 189.35591085248595, "core_hours_Tesla V100-SXM2-32GB": 59.7847989729202, "core_hours": 59.7847989729202}
{"step": 39900, "global_schedule": 0.8006644248962402, "l2_grads": 1.4658302068710327, "l2_params": 328.9419860839844, "l2_updates": 0.8487773537635803, "training_loss": 2.6411755084991455, "uptime": 15059.565280387993, "examples_seen": 40857600.0, "progress": 0.35792136494523535, "epoch": 32.213063377366744, "img/sec/core": 189.63678643728136, "core_hours_Tesla V100-SXM2-32GB": 59.85979614245369, "core_hours": 59.85979614245369}
{"step": 39950, "global_schedule": 0.8000456094741821, "l2_grads": 1.298884391784668, "l2_params": 328.8639831542969, "l2_updates": 0.8680323958396912, "training_loss": 2.6545777320861816, "uptime": 15076.45875975996, "examples_seen": 40908800.0, "progress": 0.3583698879589512, "epoch": 32.25343062470681, "img/sec/core": 189.42219832523213, "core_hours_Tesla V100-SXM2-32GB": 59.93487827299577, "core_hours": 59.93487827299577}
{"step": 40000, "global_schedule": 0.7994261980056763, "l2_grads": 1.060834288597107, "l2_params": 328.8114929199219, "l2_updates": 0.8466724157333374, "training_loss": 4.750245094299316, "uptime": 15093.338287421968, "examples_seen": 40960000.0, "progress": 0.35881841097266703, "epoch": 32.293797872046866, "img/sec/core": 189.57876452920846, "core_hours_Tesla V100-SXM2-32GB": 60.009898395938016, "core_hours": 60.009898395938016, "minival/prec@1": 0.6299562909772088, "minival/loss": 1.5329208302564856, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.867284303996712, "real/prec@1": 0.6786087921942054, "real/loss": 2.3736068602113445, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.19818096398376, "train/prec@1": 0.6568707801584514, "train/loss": 1.406287413600345, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.602164815005381, "v2/prec@1": 0.4866, "v2/loss": 2.3245375, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3633321399684064, "val/prec@1": 0.60592, "val/loss": 1.6661908764648437, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.23519962298451}
{"step": 40050, "global_schedule": 0.7988059520721436, "l2_grads": 1.5224249362945557, "l2_params": 328.74725341796875, "l2_updates": 0.8566158413887024, "training_loss": 2.775717258453369, "uptime": 15147.365996034001, "examples_seen": 41011200.0, "progress": 0.3592669339863828, "epoch": 32.334165119386924, "img/sec/core": 189.01137914294344, "core_hours_Tesla V100-SXM2-32GB": 60.08514371866257, "core_hours": 60.08514371866257}
{"step": 40100, "global_schedule": 0.7981850504875183, "l2_grads": 1.3130289316177368, "l2_params": 328.6980285644531, "l2_updates": 0.8670303821563721, "training_loss": 2.6318278312683105, "uptime": 15164.24385229696, "examples_seen": 41062400.0, "progress": 0.35971545700009866, "epoch": 32.37453236672698, "img/sec/core": 189.59753834512622, "core_hours_Tesla V100-SXM2-32GB": 60.16015641316461, "core_hours": 60.16015641316461}
{"step": 40150, "global_schedule": 0.7975634336471558, "l2_grads": 1.1613409519195557, "l2_params": 328.65594482421875, "l2_updates": 0.8488247394561768, "training_loss": 5.198250770568848, "uptime": 15181.12341410399, "examples_seen": 41113600.0, "progress": 0.3601639800138145, "epoch": 32.41489961406704, "img/sec/core": 189.57838103756126, "core_hours_Tesla V100-SXM2-32GB": 60.23517668786251, "core_hours": 60.23517668786251}
{"step": 40200, "global_schedule": 0.7969410419464111, "l2_grads": 1.118149757385254, "l2_params": 328.6043395996094, "l2_updates": 0.8363584876060486, "training_loss": 5.253875255584717, "uptime": 15198.001471714, "examples_seen": 41164800.0, "progress": 0.36061250302753034, "epoch": 32.4552668614071, "img/sec/core": 189.59527653833894, "core_hours_Tesla V100-SXM2-32GB": 60.310190277240345, "core_hours": 60.310190277240345}
{"step": 40250, "global_schedule": 0.7963180541992188, "l2_grads": 1.3935492038726807, "l2_params": 328.551025390625, "l2_updates": 0.8470930457115173, "training_loss": 2.795888662338257, "uptime": 15214.887792871974, "examples_seen": 41216000.0, "progress": 0.3610610260412462, "epoch": 32.495634108747154, "img/sec/core": 189.50249554438676, "core_hours_Tesla V100-SXM2-32GB": 60.385240593498004, "core_hours": 60.385240593498004}
{"step": 40300, "global_schedule": 0.7956942319869995, "l2_grads": 1.4462789297103882, "l2_params": 328.51849365234375, "l2_updates": 0.8390887379646301, "training_loss": 2.7259883880615234, "uptime": 15231.751261824975, "examples_seen": 41267200.0, "progress": 0.361509549054962, "epoch": 32.53600135608721, "img/sec/core": 189.7592961992889, "core_hours_Tesla V100-SXM2-32GB": 60.46018934440023, "core_hours": 60.46018934440023}
{"step": 40350, "global_schedule": 0.7950698137283325, "l2_grads": 1.2208479642868042, "l2_params": 328.466796875, "l2_updates": 0.8455644845962524, "training_loss": 3.7659244537353516, "uptime": 15248.633067542978, "examples_seen": 41318400.0, "progress": 0.36195807206867786, "epoch": 32.57636860342728, "img/sec/core": 189.55318248849505, "core_hours_Tesla V100-SXM2-32GB": 60.5352195920358, "core_hours": 60.5352195920358}
{"step": 40400, "global_schedule": 0.7944446206092834, "l2_grads": 1.2659727334976196, "l2_params": 328.4046630859375, "l2_updates": 0.8483127951622009, "training_loss": 2.958922863006592, "uptime": 15265.517097716976, "examples_seen": 41369600.0, "progress": 0.3624065950823937, "epoch": 32.616735850767334, "img/sec/core": 189.5282090248838, "core_hours_Tesla V100-SXM2-32GB": 60.61025972614246, "core_hours": 60.61025972614246}
{"step": 40450, "global_schedule": 0.7938187122344971, "l2_grads": 1.1191139221191406, "l2_params": 328.3584899902344, "l2_updates": 0.850752055644989, "training_loss": 5.048511028289795, "uptime": 15282.401990255981, "examples_seen": 41420800.0, "progress": 0.3628551180961095, "epoch": 32.65710309810739, "img/sec/core": 189.5185292182268, "core_hours_Tesla V100-SXM2-32GB": 60.68530369298249, "core_hours": 60.68530369298249}
{"step": 40500, "global_schedule": 0.7931921482086182, "l2_grads": 1.24576997756958, "l2_params": 328.28106689453125, "l2_updates": 0.8264846205711365, "training_loss": 4.500612735748291, "uptime": 15299.271072845964, "examples_seen": 41472000.0, "progress": 0.3633036411098253, "epoch": 32.69747034544745, "img/sec/core": 189.696148734264, "core_hours_Tesla V100-SXM2-32GB": 60.7602773933824, "core_hours": 60.7602773933824}
{"step": 40551, "global_schedule": 0.792564868927002, "l2_grads": 1.172286868095398, "l2_params": 328.2019958496094, "l2_updates": 0.8438649773597717, "training_loss": 3.8405025005340576, "uptime": 15316.160557178955, "examples_seen": 41523200.0, "progress": 0.36375216412354117, "epoch": 32.73783759278751, "img/sec/core": 189.46700425597516, "core_hours_Tesla V100-SXM2-32GB": 60.8353417681957, "core_hours": 60.8353417681957}
{"step": 40600, "global_schedule": 0.7919368743896484, "l2_grads": 1.3976612091064453, "l2_params": 328.15130615234375, "l2_updates": 0.8261566758155823, "training_loss": 2.749053716659546, "uptime": 15333.035600812, "examples_seen": 41574400.0, "progress": 0.364200687137257, "epoch": 32.778204840127565, "img/sec/core": 189.62913931278746, "core_hours_Tesla V100-SXM2-32GB": 60.91034196212034, "core_hours": 60.91034196212034}
{"step": 40650, "global_schedule": 0.7913081645965576, "l2_grads": 1.3937095403671265, "l2_params": 328.0789794921875, "l2_updates": 0.8403811454772949, "training_loss": 2.763517379760742, "uptime": 15349.895397805958, "examples_seen": 41625600.0, "progress": 0.36464921015097285, "epoch": 32.81857208746762, "img/sec/core": 189.80062459510745, "core_hours_Tesla V100-SXM2-32GB": 60.9852743932046, "core_hours": 60.9852743932046}
{"step": 40700, "global_schedule": 0.7906787395477295, "l2_grads": 1.147607445716858, "l2_params": 328.0483703613281, "l2_updates": 0.8601629137992859, "training_loss": 3.9857544898986816, "uptime": 15366.78592024796, "examples_seen": 41676800.0, "progress": 0.3650977331646887, "epoch": 32.85893933480769, "img/sec/core": 189.45535941757566, "core_hours_Tesla V100-SXM2-32GB": 61.06034338183572, "core_hours": 61.06034338183572}
{"step": 40750, "global_schedule": 0.7900487184524536, "l2_grads": 1.4698340892791748, "l2_params": 327.9992370605469, "l2_updates": 0.8531320691108704, "training_loss": 2.644408702850342, "uptime": 15383.661810754973, "examples_seen": 41728000.0, "progress": 0.3655462561784045, "epoch": 32.899306582147744, "img/sec/core": 189.61962325307192, "core_hours_Tesla V100-SXM2-32GB": 61.13534733964467, "core_hours": 61.13534733964467}
{"step": 40800, "global_schedule": 0.7894178628921509, "l2_grads": 1.0613564252853394, "l2_params": 327.96051025390625, "l2_updates": 0.8331623077392578, "training_loss": 4.8410139083862305, "uptime": 15400.537708154996, "examples_seen": 41779200.0, "progress": 0.36599477919212037, "epoch": 32.9396738294878, "img/sec/core": 189.6195458023849, "core_hours_Tesla V100-SXM2-32GB": 61.21035132808922, "core_hours": 61.21035132808922}
{"step": 40850, "global_schedule": 0.7887864112854004, "l2_grads": 1.0380685329437256, "l2_params": 327.88751220703125, "l2_updates": 0.8537434935569763, "training_loss": 5.1719255447387695, "uptime": 15417.394104584004, "examples_seen": 41830400.0, "progress": 0.3664433022058362, "epoch": 32.98004107682786, "img/sec/core": 189.83891447244187, "core_hours_Tesla V100-SXM2-32GB": 61.28526864555147, "core_hours": 61.28526864555147}
{"step": 40900, "global_schedule": 0.7881542444229126, "l2_grads": 1.2670247554779053, "l2_params": 327.833251953125, "l2_updates": 0.8643664717674255, "training_loss": 2.856473207473755, "uptime": 15434.252515046974, "examples_seen": 41881600.0, "progress": 0.366891825219552, "epoch": 33.02040832416792, "img/sec/core": 189.81623487154448, "core_hours_Tesla V100-SXM2-32GB": 61.36019491427578, "core_hours": 61.36019491427578}
{"step": 40950, "global_schedule": 0.7875214219093323, "l2_grads": 1.3428504467010498, "l2_params": 327.7931213378906, "l2_updates": 0.8442082405090332, "training_loss": 2.662379264831543, "uptime": 15451.106143291981, "examples_seen": 41932800.0, "progress": 0.36734034823326783, "epoch": 33.060775571507975, "img/sec/core": 189.87009523886266, "core_hours_Tesla V100-SXM2-32GB": 61.43509992869804, "core_hours": 61.43509992869804}
{"step": 41000, "global_schedule": 0.7868878841400146, "l2_grads": 1.49443781375885, "l2_params": 327.7444763183594, "l2_updates": 0.8152170181274414, "training_loss": 2.697700023651123, "uptime": 15467.976515467977, "examples_seen": 41984000.0, "progress": 0.3677888712469837, "epoch": 33.10114281884803, "img/sec/core": 189.68164819464803, "core_hours_Tesla V100-SXM2-32GB": 61.510079360591355, "core_hours": 61.510079360591355}
{"step": 41050, "global_schedule": 0.7862536311149597, "l2_grads": 1.148694396018982, "l2_params": 327.7008361816406, "l2_updates": 0.8242276310920715, "training_loss": 4.210963726043701, "uptime": 15485.360054788005, "examples_seen": 42035200.0, "progress": 0.3682373942606995, "epoch": 33.1415100661881, "img/sec/core": 189.68329119579374, "core_hours_Tesla V100-SXM2-32GB": 61.58505814302687, "core_hours": 61.58505814302687}
{"step": 41100, "global_schedule": 0.7856187224388123, "l2_grads": 1.162919282913208, "l2_params": 327.6360168457031, "l2_updates": 0.8316068649291992, "training_loss": 4.365910053253174, "uptime": 15502.221833463002, "examples_seen": 42086400.0, "progress": 0.36868591727441535, "epoch": 33.181877313528155, "img/sec/core": 189.77831827108074, "core_hours_Tesla V100-SXM2-32GB": 61.65999938158241, "core_hours": 61.65999938158241}
{"step": 41150, "global_schedule": 0.7849831581115723, "l2_grads": 1.1118197441101074, "l2_params": 327.550537109375, "l2_updates": 0.8381372094154358, "training_loss": 4.964593887329102, "uptime": 15519.101656064973, "examples_seen": 42137600.0, "progress": 0.3691344402881312, "epoch": 33.22224456086821, "img/sec/core": 189.57545203266636, "core_hours_Tesla V100-SXM2-32GB": 61.73502081536895, "core_hours": 61.73502081536895}
{"step": 41200, "global_schedule": 0.7843468189239502, "l2_grads": 1.4030176401138306, "l2_params": 327.4956970214844, "l2_updates": 0.8433143496513367, "training_loss": 2.706221580505371, "uptime": 15535.951350363961, "examples_seen": 42188800.0, "progress": 0.36958296330184703, "epoch": 33.26261180820827, "img/sec/core": 189.91442474966695, "core_hours_Tesla V100-SXM2-32GB": 61.80990834558667, "core_hours": 61.80990834558667}
{"step": 41250, "global_schedule": 0.7837098836898804, "l2_grads": 1.1750236749649048, "l2_params": 327.432373046875, "l2_updates": 0.8231465816497803, "training_loss": 4.104523658752441, "uptime": 15552.815854106972, "examples_seen": 42240000.0, "progress": 0.3700314863155629, "epoch": 33.30297905554833, "img/sec/core": 189.74765274823028, "core_hours_Tesla V100-SXM2-32GB": 61.88486169555561, "core_hours": 61.88486169555561}
{"step": 41300, "global_schedule": 0.7830722332000732, "l2_grads": 1.1944324970245361, "l2_params": 327.36419677734375, "l2_updates": 0.835207462310791, "training_loss": 3.6572072505950928, "uptime": 15569.674652321963, "examples_seen": 42291200.0, "progress": 0.37048000932927866, "epoch": 33.343346302888385, "img/sec/core": 189.81186910194518, "core_hours_Tesla V100-SXM2-32GB": 61.959789687622234, "core_hours": 61.959789687622234}
{"step": 41350, "global_schedule": 0.7824338674545288, "l2_grads": 1.3553531169891357, "l2_params": 327.2860412597656, "l2_updates": 0.838280975818634, "training_loss": 2.771395206451416, "uptime": 15586.507039256976, "examples_seen": 42342400.0, "progress": 0.3709285323429945, "epoch": 33.38371355022844, "img/sec/core": 190.10969818805813, "core_hours_Tesla V100-SXM2-32GB": 62.034600296222294, "core_hours": 62.034600296222294}
{"step": 41400, "global_schedule": 0.7817949056625366, "l2_grads": 1.4249508380889893, "l2_params": 327.2411193847656, "l2_updates": 0.851879358291626, "training_loss": 2.606590986251831, "uptime": 15603.369407235994, "examples_seen": 42393600.0, "progress": 0.37137705535671034, "epoch": 33.42408079756851, "img/sec/core": 189.77168592108688, "core_hours_Tesla V100-SXM2-32GB": 62.10954415390682, "core_hours": 62.10954415390682}
{"step": 41450, "global_schedule": 0.7811552286148071, "l2_grads": 1.4063103199005127, "l2_params": 327.151611328125, "l2_updates": 0.8438329696655273, "training_loss": 2.570441961288452, "uptime": 15620.245994986966, "examples_seen": 42444800.0, "progress": 0.3718255783704262, "epoch": 33.464448044908565, "img/sec/core": 189.61178925613385, "core_hours_Tesla V100-SXM2-32GB": 62.1845512105778, "core_hours": 62.1845512105778}
{"step": 41500, "global_schedule": 0.7805148363113403, "l2_grads": 1.3470251560211182, "l2_params": 327.1160583496094, "l2_updates": 0.849807620048523, "training_loss": 2.6624369621276855, "uptime": 15637.119319696969, "examples_seen": 42496000.0, "progress": 0.372274101384142, "epoch": 33.50481529224862, "img/sec/core": 189.6484572541306, "core_hours_Tesla V100-SXM2-32GB": 62.25954376484449, "core_hours": 62.25954376484449}
{"step": 41550, "global_schedule": 0.7798738479614258, "l2_grads": 1.4083582162857056, "l2_params": 327.0715637207031, "l2_updates": 0.8381420373916626, "training_loss": 2.7175683975219727, "uptime": 15653.990097922971, "examples_seen": 42547200.0, "progress": 0.37272262439785786, "epoch": 33.54518253958868, "img/sec/core": 189.67708289045643, "core_hours_Tesla V100-SXM2-32GB": 62.334525001404494, "core_hours": 62.334525001404494}
{"step": 41600, "global_schedule": 0.7792321443557739, "l2_grads": 1.265992522239685, "l2_params": 327.03369140625, "l2_updates": 0.8507488965988159, "training_loss": 2.545710563659668, "uptime": 15670.86446974799, "examples_seen": 42598400.0, "progress": 0.3731711474115737, "epoch": 33.58554978692874, "img/sec/core": 189.63668889027912, "core_hours_Tesla V100-SXM2-32GB": 62.40952220951569, "core_hours": 62.40952220951569}
{"step": 41650, "global_schedule": 0.7785897850990295, "l2_grads": 1.1379157304763794, "l2_params": 326.9972229003906, "l2_updates": 0.8331847190856934, "training_loss": 4.015689373016357, "uptime": 15687.734179469, "examples_seen": 42649600.0, "progress": 0.37361967042528954, "epoch": 33.625917034268795, "img/sec/core": 189.6890967847945, "core_hours_Tesla V100-SXM2-32GB": 62.484498697164625, "core_hours": 62.484498697164625}
{"step": 41700, "global_schedule": 0.7779467701911926, "l2_grads": 1.4127558469772339, "l2_params": 326.92279052734375, "l2_updates": 0.8344942927360535, "training_loss": 2.5863847732543945, "uptime": 15704.59327728796, "examples_seen": 42700800.0, "progress": 0.3740681934390054, "epoch": 33.66628428160885, "img/sec/core": 189.80849594461384, "core_hours_Tesla V100-SXM2-32GB": 62.559428020804454, "core_hours": 62.559428020804454}
{"step": 41750, "global_schedule": 0.7773030996322632, "l2_grads": 1.384856104850769, "l2_params": 326.8537292480469, "l2_updates": 0.8422781229019165, "training_loss": 2.6212399005889893, "uptime": 15721.488159917993, "examples_seen": 42752000.0, "progress": 0.37451671645272117, "epoch": 33.70665152894892, "img/sec/core": 189.4064652637222, "core_hours_Tesla V100-SXM2-32GB": 62.63451638804904, "core_hours": 62.63451638804904}
{"step": 41800, "global_schedule": 0.7766587138175964, "l2_grads": 1.283979058265686, "l2_params": 326.7701110839844, "l2_updates": 0.79930180311203, "training_loss": 3.4473390579223633, "uptime": 15738.373429687985, "examples_seen": 42803200.0, "progress": 0.374965239466437, "epoch": 33.747018776288975, "img/sec/core": 189.51429521647802, "core_hours_Tesla V100-SXM2-32GB": 62.70956203147122, "core_hours": 62.70956203147122}
{"step": 41850, "global_schedule": 0.7760137319564819, "l2_grads": 1.4634888172149658, "l2_params": 326.6923828125, "l2_updates": 0.8401535153388977, "training_loss": 2.7621383666992188, "uptime": 15755.259720387985, "examples_seen": 42854400.0, "progress": 0.37541376248015285, "epoch": 33.78738602362903, "img/sec/core": 189.50283735195637, "core_hours_Tesla V100-SXM2-32GB": 62.78461221236011, "core_hours": 62.78461221236011}
{"step": 41900, "global_schedule": 0.7753679752349854, "l2_grads": 1.4321668148040771, "l2_params": 326.6485290527344, "l2_updates": 0.8402551412582397, "training_loss": 2.552558660507202, "uptime": 15772.130019359, "examples_seen": 42905600.0, "progress": 0.3758622854938687, "epoch": 33.82775327096909, "img/sec/core": 189.68247127677046, "core_hours_Tesla V100-SXM2-32GB": 62.859591318897955, "core_hours": 62.859591318897955}
{"step": 41950, "global_schedule": 0.774721622467041, "l2_grads": 1.134684443473816, "l2_params": 326.59735107421875, "l2_updates": 0.8383840918540955, "training_loss": 3.709074020385742, "uptime": 15789.012314851978, "examples_seen": 42956800.0, "progress": 0.3763108085075845, "epoch": 33.86812051830915, "img/sec/core": 189.54768333079744, "core_hours_Tesla V100-SXM2-32GB": 62.934623743311185, "core_hours": 62.934623743311185}
{"step": 42000, "global_schedule": 0.7740746736526489, "l2_grads": 1.4588497877120972, "l2_params": 326.54559326171875, "l2_updates": 0.8251369595527649, "training_loss": 2.610030174255371, "uptime": 15805.900055393984, "examples_seen": 43008000.0, "progress": 0.37675933152130037, "epoch": 33.908487765649205, "img/sec/core": 189.48656820256014, "core_hours_Tesla V100-SXM2-32GB": 63.00968036794233, "core_hours": 63.00968036794233}
{"step": 42050, "global_schedule": 0.7734270095825195, "l2_grads": 1.1058313846588135, "l2_params": 326.446044921875, "l2_updates": 0.8272950649261475, "training_loss": 4.030776023864746, "uptime": 15823.314839524974, "examples_seen": 43059200.0, "progress": 0.3772078545350162, "epoch": 33.94885501298926, "img/sec/core": 189.52469690840795, "core_hours_Tesla V100-SXM2-32GB": 63.0847218926313, "core_hours": 63.0847218926313}
{"step": 42100, "global_schedule": 0.7727787494659424, "l2_grads": 1.1553595066070557, "l2_params": 326.37799072265625, "l2_updates": 0.8155818581581116, "training_loss": 4.769998550415039, "uptime": 15840.196542406979, "examples_seen": 43110400.0, "progress": 0.37765637754873205, "epoch": 33.98922226032933, "img/sec/core": 189.55433716411684, "core_hours_Tesla V100-SXM2-32GB": 63.15975168321799, "core_hours": 63.15975168321799}
{"step": 42150, "global_schedule": 0.7721297740936279, "l2_grads": 1.3814693689346313, "l2_params": 326.3231201171875, "l2_updates": 0.8280386924743652, "training_loss": 2.768328905105591, "uptime": 15857.073733910976, "examples_seen": 43161600.0, "progress": 0.37810490056244783, "epoch": 34.029589507669385, "img/sec/core": 189.6050062145695, "core_hours_Tesla V100-SXM2-32GB": 63.23476142323576, "core_hours": 63.23476142323576}
{"step": 42200, "global_schedule": 0.7714800834655762, "l2_grads": 1.4631657600402832, "l2_params": 326.2542724609375, "l2_updates": 0.8189647793769836, "training_loss": 2.543046474456787, "uptime": 15873.945035555982, "examples_seen": 43212800.0, "progress": 0.3785534235761637, "epoch": 34.06995675500944, "img/sec/core": 189.67119830658095, "core_hours_Tesla V100-SXM2-32GB": 63.30974498610245, "core_hours": 63.30974498610245}
{"step": 42250, "global_schedule": 0.7708298563957214, "l2_grads": 1.211120843887329, "l2_params": 326.21514892578125, "l2_updates": 0.8242202997207642, "training_loss": 4.210835933685303, "uptime": 15890.811698223988, "examples_seen": 43264000.0, "progress": 0.3790019465898795, "epoch": 34.1103240023495, "img/sec/core": 189.72336513672047, "core_hours_Tesla V100-SXM2-32GB": 63.38470793129359, "core_hours": 63.38470793129359}
{"step": 42300, "global_schedule": 0.7701789140701294, "l2_grads": 1.2359453439712524, "l2_params": 326.1717834472656, "l2_updates": 0.8201467990875244, "training_loss": 4.014667510986328, "uptime": 15907.69064026, "examples_seen": 43315200.0, "progress": 0.37945046960359535, "epoch": 34.15069124968956, "img/sec/core": 189.58534208913719, "core_hours_Tesla V100-SXM2-32GB": 63.45972545145364, "core_hours": 63.45972545145364}
{"step": 42350, "global_schedule": 0.7695273756980896, "l2_grads": 1.3977084159851074, "l2_params": 326.11114501953125, "l2_updates": 0.8237285017967224, "training_loss": 2.4569156169891357, "uptime": 15924.570357210992, "examples_seen": 43366400.0, "progress": 0.3798989926173112, "epoch": 34.191058497029616, "img/sec/core": 189.57663859475016, "core_hours_Tesla V100-SXM2-32GB": 63.534746415680274, "core_hours": 63.534746415680274}
{"step": 42400, "global_schedule": 0.7688751220703125, "l2_grads": 1.3427574634552002, "l2_params": 326.0171813964844, "l2_updates": 0.8277764320373535, "training_loss": 2.6072521209716797, "uptime": 15941.431695768959, "examples_seen": 43417600.0, "progress": 0.38034751563102703, "epoch": 34.23142574436967, "img/sec/core": 189.78327189142928, "core_hours_Tesla V100-SXM2-32GB": 63.60968569816012, "core_hours": 63.60968569816012}
{"step": 42450, "global_schedule": 0.7682223320007324, "l2_grads": 1.3472893238067627, "l2_params": 325.9749450683594, "l2_updates": 0.8309975266456604, "training_loss": 2.5639095306396484, "uptime": 15958.339416237955, "examples_seen": 43468800.0, "progress": 0.3807960386447429, "epoch": 34.27179299170973, "img/sec/core": 189.2626510988157, "core_hours_Tesla V100-SXM2-32GB": 63.684831122466775, "core_hours": 63.684831122466775}
{"step": 42500, "global_schedule": 0.767568826675415, "l2_grads": 1.4597653150558472, "l2_params": 325.9373779296875, "l2_updates": 0.8133125305175781, "training_loss": 2.7522501945495605, "uptime": 15975.204515611986, "examples_seen": 43520000.0, "progress": 0.3812445616584587, "epoch": 34.312160239049796, "img/sec/core": 189.74095135944026, "core_hours_Tesla V100-SXM2-32GB": 63.75978711968469, "core_hours": 63.75978711968469, "minival/prec@1": 0.6344832969091476, "minival/loss": 1.5615427408447646, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.9091544590191916, "real/prec@1": 0.6806371031449495, "real/loss": 2.3990574713401, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.15506349899806, "train/prec@1": 0.6562073137415603, "train/loss": 1.4459656630272153, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.560613266017754, "v2/prec@1": 0.4841, "v2/loss": 2.3561531494140624, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3773748939856887, "val/prec@1": 0.60552, "val/loss": 1.6982396435546876, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.339952014037408}
{"step": 42550, "global_schedule": 0.7669146656990051, "l2_grads": 1.2745271921157837, "l2_params": 325.88763427734375, "l2_updates": 0.8163522481918335, "training_loss": 4.2928643226623535, "uptime": 16028.447870365984, "examples_seen": 43571200.0, "progress": 0.38169308467217455, "epoch": 34.35252748638985, "img/sec/core": 189.3585459657209, "core_hours_Tesla V100-SXM2-32GB": 63.83489448888046, "core_hours": 63.83489448888046}
{"step": 42600, "global_schedule": 0.7662599086761475, "l2_grads": 1.1776567697525024, "l2_params": 325.81402587890625, "l2_updates": 0.8337008357048035, "training_loss": 3.170628309249878, "uptime": 16045.357448268973, "examples_seen": 43622400.0, "progress": 0.38214160768589034, "epoch": 34.39289473372991, "img/sec/core": 189.24186152715527, "core_hours_Tesla V100-SXM2-32GB": 63.9100481684493, "core_hours": 63.9100481684493}
{"step": 42650, "global_schedule": 0.7656044960021973, "l2_grads": 1.2317824363708496, "l2_params": 325.7460021972656, "l2_updates": 0.8169872164726257, "training_loss": 5.073559761047363, "uptime": 16062.238135423977, "examples_seen": 43673600.0, "progress": 0.3825901306996062, "epoch": 34.43326198106997, "img/sec/core": 189.56574282886282, "core_hours_Tesla V100-SXM2-32GB": 63.98507344469376, "core_hours": 63.98507344469376}
{"step": 42700, "global_schedule": 0.7649484276771545, "l2_grads": 1.4144214391708374, "l2_params": 325.70556640625, "l2_updates": 0.8375765085220337, "training_loss": 2.594707727432251, "uptime": 16079.111009583983, "examples_seen": 43724800.0, "progress": 0.383038653713322, "epoch": 34.473629228410026, "img/sec/core": 189.6535213653741, "core_hours_Tesla V100-SXM2-32GB": 64.060063996516, "core_hours": 64.060063996516}
{"step": 42750, "global_schedule": 0.7642917633056641, "l2_grads": 1.340929627418518, "l2_params": 325.6552429199219, "l2_updates": 0.8430636525154114, "training_loss": 2.67425537109375, "uptime": 16095.955832549953, "examples_seen": 43776000.0, "progress": 0.38348717672703786, "epoch": 34.51399647575008, "img/sec/core": 189.9693458616155, "core_hours_Tesla V100-SXM2-32GB": 64.13492987636477, "core_hours": 64.13492987636477}
{"step": 42800, "global_schedule": 0.763634443283081, "l2_grads": 1.2283743619918823, "l2_params": 325.6019287109375, "l2_updates": 0.8081749081611633, "training_loss": 3.4276089668273926, "uptime": 16112.81629561499, "examples_seen": 43827200.0, "progress": 0.3839356997407537, "epoch": 34.55436372309014, "img/sec/core": 189.7931265384834, "core_hours_Tesla V100-SXM2-32GB": 64.20986526776493, "core_hours": 64.20986526776493}
{"step": 42850, "global_schedule": 0.7629764080047607, "l2_grads": 1.451317548751831, "l2_params": 325.55718994140625, "l2_updates": 0.8181440830230713, "training_loss": 2.6212217807769775, "uptime": 16129.685122273979, "examples_seen": 43878400.0, "progress": 0.38438422275446954, "epoch": 34.594730970430206, "img/sec/core": 189.6990267722519, "core_hours_Tesla V100-SXM2-32GB": 64.28483783069377, "core_hours": 64.28483783069377}
{"step": 42900, "global_schedule": 0.7623177766799927, "l2_grads": 1.296331524848938, "l2_params": 325.4786682128906, "l2_updates": 0.8379234075546265, "training_loss": 3.1675987243652344, "uptime": 16146.548980402993, "examples_seen": 43929600.0, "progress": 0.3848327457681854, "epoch": 34.63509821777026, "img/sec/core": 189.75491702544636, "core_hours_Tesla V100-SXM2-32GB": 64.35978831126717, "core_hours": 64.35978831126717}
{"step": 42950, "global_schedule": 0.7616586089134216, "l2_grads": 1.332586407661438, "l2_params": 325.4179992675781, "l2_updates": 0.8074324131011963, "training_loss": 2.4872193336486816, "uptime": 16163.402767218999, "examples_seen": 43980800.0, "progress": 0.3852812687819012, "epoch": 34.67546546511032, "img/sec/core": 189.86830882191086, "core_hours_Tesla V100-SXM2-32GB": 64.43469403044942, "core_hours": 64.43469403044942}
{"step": 43000, "global_schedule": 0.7609987258911133, "l2_grads": 1.1925013065338135, "l2_params": 325.341064453125, "l2_updates": 0.8053909540176392, "training_loss": 4.592409133911133, "uptime": 16180.277824225952, "examples_seen": 44032000.0, "progress": 0.38572979179561706, "epoch": 34.71583271245038, "img/sec/core": 189.62898902690853, "core_hours_Tesla V100-SXM2-32GB": 64.50969428381366, "core_hours": 64.50969428381366}
{"step": 43050, "global_schedule": 0.760338306427002, "l2_grads": 1.4058406352996826, "l2_params": 325.2716369628906, "l2_updates": 0.8201970458030701, "training_loss": 2.526404619216919, "uptime": 16197.655381363002, "examples_seen": 44083200.0, "progress": 0.38617831480933285, "epoch": 34.756199959790436, "img/sec/core": 189.5887187090242, "core_hours_Tesla V100-SXM2-32GB": 64.58471046789394, "core_hours": 64.58471046789394}
{"step": 43100, "global_schedule": 0.7596771717071533, "l2_grads": 1.3944683074951172, "l2_params": 325.22869873046875, "l2_updates": 0.8250896334648132, "training_loss": 2.7457432746887207, "uptime": 16214.502282061963, "examples_seen": 44134400.0, "progress": 0.3866268378230487, "epoch": 34.796567207130494, "img/sec/core": 189.94591688886862, "core_hours_Tesla V100-SXM2-32GB": 64.65958558211155, "core_hours": 64.65958558211155}
{"step": 43150, "global_schedule": 0.7590155005455017, "l2_grads": 1.3355493545532227, "l2_params": 325.1903381347656, "l2_updates": 0.8538992404937744, "training_loss": 2.6073837280273438, "uptime": 16231.364437914977, "examples_seen": 44185600.0, "progress": 0.3870753608367645, "epoch": 34.83693445447055, "img/sec/core": 189.77407324983454, "core_hours_Tesla V100-SXM2-32GB": 64.73452849701384, "core_hours": 64.73452849701384}
{"step": 43200, "global_schedule": 0.7583531737327576, "l2_grads": 1.1662242412567139, "l2_params": 325.1512145996094, "l2_updates": 0.8013563752174377, "training_loss": 4.975242614746094, "uptime": 16248.218096305965, "examples_seen": 44236800.0, "progress": 0.38752388385048037, "epoch": 34.877301701810616, "img/sec/core": 189.8697556200072, "core_hours_Tesla V100-SXM2-32GB": 64.80943364541822, "core_hours": 64.80943364541822}
{"step": 43250, "global_schedule": 0.7576901912689209, "l2_grads": 1.3410015106201172, "l2_params": 325.07354736328125, "l2_updates": 0.8266047835350037, "training_loss": 2.6507441997528076, "uptime": 16265.054297000985, "examples_seen": 44288000.0, "progress": 0.3879724068641962, "epoch": 34.91766894915067, "img/sec/core": 190.0666342702057, "core_hours_Tesla V100-SXM2-32GB": 64.88426120406275, "core_hours": 64.88426120406275}
{"step": 43300, "global_schedule": 0.7570266723632812, "l2_grads": 1.2504369020462036, "l2_params": 325.0249938964844, "l2_updates": 0.7966893911361694, "training_loss": 5.148123264312744, "uptime": 16281.920969967963, "examples_seen": 44339200.0, "progress": 0.38842092987791205, "epoch": 34.95803619649073, "img/sec/core": 189.72324928958685, "core_hours_Tesla V100-SXM2-32GB": 64.9592241950271, "core_hours": 64.9592241950271}
{"step": 43350, "global_schedule": 0.7563624382019043, "l2_grads": 1.3749384880065918, "l2_params": 324.9272766113281, "l2_updates": 0.8127208948135376, "training_loss": 2.705711603164673, "uptime": 16298.778650077991, "examples_seen": 44390400.0, "progress": 0.3888694528916279, "epoch": 34.99840344383079, "img/sec/core": 189.8244585918105, "core_hours_Tesla V100-SXM2-32GB": 65.03414721773834, "core_hours": 65.03414721773834}
{"step": 43400, "global_schedule": 0.7556976675987244, "l2_grads": 1.3926239013671875, "l2_params": 324.8626403808594, "l2_updates": 0.8077175617218018, "training_loss": 2.9764516353607178, "uptime": 16315.653926070954, "examples_seen": 44441600.0, "progress": 0.3893179759053437, "epoch": 35.038770691170846, "img/sec/core": 189.62652826148755, "core_hours_Tesla V100-SXM2-32GB": 65.10914844437373, "core_hours": 65.10914844437373}
{"step": 43450, "global_schedule": 0.7550323009490967, "l2_grads": 1.270323395729065, "l2_params": 324.7950439453125, "l2_updates": 0.815670907497406, "training_loss": 3.7261099815368652, "uptime": 16332.530596625991, "examples_seen": 44492800.0, "progress": 0.3897664989190595, "epoch": 35.079137938510904, "img/sec/core": 189.61085894071292, "core_hours_Tesla V100-SXM2-32GB": 65.18415586906278, "core_hours": 65.18415586906278}
{"step": 43500, "global_schedule": 0.7543662786483765, "l2_grads": 1.3940041065216064, "l2_params": 324.7241516113281, "l2_updates": 0.8181300163269043, "training_loss": 2.5445480346679688, "uptime": 16349.386364025006, "examples_seen": 44544000.0, "progress": 0.39021502193277535, "epoch": 35.11950518585096, "img/sec/core": 189.8459989538717, "core_hours_Tesla V100-SXM2-32GB": 65.25907039083617, "core_hours": 65.25907039083617}
{"step": 43550, "global_schedule": 0.7536996006965637, "l2_grads": 1.2062389850616455, "l2_params": 324.6780090332031, "l2_updates": 0.8026764392852783, "training_loss": 4.293872833251953, "uptime": 16366.247435769998, "examples_seen": 44595200.0, "progress": 0.3906635449464912, "epoch": 35.159872433191026, "img/sec/core": 189.786275059915, "core_hours_Tesla V100-SXM2-32GB": 65.33400848748059, "core_hours": 65.33400848748059}
{"step": 43600, "global_schedule": 0.7530323266983032, "l2_grads": 1.4169679880142212, "l2_params": 324.62786865234375, "l2_updates": 0.8202430605888367, "training_loss": 2.668609857559204, "uptime": 16383.118849893974, "examples_seen": 44646400.0, "progress": 0.39111206796020703, "epoch": 35.200239680531084, "img/sec/core": 189.6699337995887, "core_hours_Tesla V100-SXM2-32GB": 65.40899255025381, "core_hours": 65.40899255025381}
{"step": 43650, "global_schedule": 0.7523645162582397, "l2_grads": 1.5594381093978882, "l2_params": 324.5781555175781, "l2_updates": 0.8011098504066467, "training_loss": 2.6671509742736816, "uptime": 16399.974698542967, "examples_seen": 44697600.0, "progress": 0.3915605909739229, "epoch": 35.24060692787114, "img/sec/core": 189.84508384223096, "core_hours_Tesla V100-SXM2-32GB": 65.48390743313823, "core_hours": 65.48390743313823}
{"step": 43700, "global_schedule": 0.7516961097717285, "l2_grads": 1.4875575304031372, "l2_params": 324.50982666015625, "l2_updates": 0.7979517579078674, "training_loss": 2.5720138549804688, "uptime": 16416.857827847998, "examples_seen": 44748800.0, "progress": 0.3920091139876387, "epoch": 35.2809741752112, "img/sec/core": 189.53832208382815, "core_hours_Tesla V100-SXM2-32GB": 65.55894356338281, "core_hours": 65.55894356338281}
{"step": 43750, "global_schedule": 0.75102698802948, "l2_grads": 1.405452013015747, "l2_params": 324.45391845703125, "l2_updates": 0.8031305074691772, "training_loss": 2.5775527954101562, "uptime": 16433.703546773002, "examples_seen": 44800000.0, "progress": 0.39245763700135455, "epoch": 35.32134142255126, "img/sec/core": 189.95924212235784, "core_hours_Tesla V100-SXM2-32GB": 65.63381342527173, "core_hours": 65.63381342527173}
{"step": 43800, "global_schedule": 0.7503573894500732, "l2_grads": 1.414662480354309, "l2_params": 324.412353515625, "l2_updates": 0.8240439295768738, "training_loss": 2.6463351249694824, "uptime": 16450.572851901, "examples_seen": 44851200.0, "progress": 0.3929061600150704, "epoch": 35.361708669891314, "img/sec/core": 189.69364628355692, "core_hours_Tesla V100-SXM2-32GB": 65.7087881147295, "core_hours": 65.7087881147295}
{"step": 43850, "global_schedule": 0.7496870756149292, "l2_grads": 1.4255002737045288, "l2_params": 324.3345947265625, "l2_updates": 0.8114727139472961, "training_loss": 2.978127956390381, "uptime": 16467.431657917972, "examples_seen": 44902400.0, "progress": 0.39335468302878623, "epoch": 35.40207591723137, "img/sec/core": 189.8117812601104, "core_hours_Tesla V100-SXM2-32GB": 65.78371614147159, "core_hours": 65.78371614147159}
{"step": 43900, "global_schedule": 0.749016284942627, "l2_grads": 1.2239962816238403, "l2_params": 324.2774658203125, "l2_updates": 0.7850528359413147, "training_loss": 4.09414005279541, "uptime": 16484.299034365977, "examples_seen": 44953600.0, "progress": 0.393803206042502, "epoch": 35.442443164571436, "img/sec/core": 189.71533657675468, "core_hours_Tesla V100-SXM2-32GB": 65.85868225901828, "core_hours": 65.85868225901828}
{"step": 43950, "global_schedule": 0.7483447790145874, "l2_grads": 1.2836079597473145, "l2_params": 324.1970520019531, "l2_updates": 0.7981158494949341, "training_loss": 3.258880615234375, "uptime": 16501.160635583976, "examples_seen": 45004800.0, "progress": 0.39425172905621786, "epoch": 35.482810411911494, "img/sec/core": 189.7803155600739, "core_hours_Tesla V100-SXM2-32GB": 65.93362270887604, "core_hours": 65.93362270887604}
{"step": 44000, "global_schedule": 0.7476727962493896, "l2_grads": 1.428711175918579, "l2_params": 324.1455078125, "l2_updates": 0.803805947303772, "training_loss": 2.649197578430176, "uptime": 16518.03187558998, "examples_seen": 45056000.0, "progress": 0.3947002520699337, "epoch": 35.52317765925155, "img/sec/core": 189.6718912694851, "core_hours_Tesla V100-SXM2-32GB": 66.00860599779162, "core_hours": 66.00860599779162}
{"step": 44050, "global_schedule": 0.7470000982284546, "l2_grads": 1.4828379154205322, "l2_params": 324.0847473144531, "l2_updates": 0.8104601502418518, "training_loss": 2.4842493534088135, "uptime": 16535.664233624004, "examples_seen": 45107200.0, "progress": 0.39514877508364954, "epoch": 35.56354490659161, "img/sec/core": 189.6748925440939, "core_hours_Tesla V100-SXM2-32GB": 66.08358810022732, "core_hours": 66.08358810022732}
{"step": 44100, "global_schedule": 0.7463269233703613, "l2_grads": 1.127529263496399, "l2_params": 324.0472412109375, "l2_updates": 0.7953965663909912, "training_loss": 4.318727493286133, "uptime": 16552.543273216987, "examples_seen": 45158400.0, "progress": 0.3955972980973654, "epoch": 35.60391215393167, "img/sec/core": 189.58424632941572, "core_hours_Tesla V100-SXM2-32GB": 66.15860605397391, "core_hours": 66.15860605397391}
{"step": 44150, "global_schedule": 0.7456530928611755, "l2_grads": 1.4886834621429443, "l2_params": 323.9823303222656, "l2_updates": 0.7998412251472473, "training_loss": 2.4934654235839844, "uptime": 16569.424056269985, "examples_seen": 45209600.0, "progress": 0.3960458211110812, "epoch": 35.644279401271724, "img/sec/core": 189.56466592535068, "core_hours_Tesla V100-SXM2-32GB": 66.23363175643168, "core_hours": 66.23363175643168}
{"step": 44200, "global_schedule": 0.744978666305542, "l2_grads": 1.322198510169983, "l2_params": 323.9187927246094, "l2_updates": 0.7968240976333618, "training_loss": 2.912996292114258, "uptime": 16586.29600606399, "examples_seen": 45260800.0, "progress": 0.39649434412479706, "epoch": 35.68464664861178, "img/sec/core": 189.6639119408282, "core_hours_Tesla V100-SXM2-32GB": 66.30861819996059, "core_hours": 66.30861819996059}
{"step": 44250, "global_schedule": 0.7443037033081055, "l2_grads": 1.4348866939544678, "l2_params": 323.8128967285156, "l2_updates": 0.7959592938423157, "training_loss": 2.526740074157715, "uptime": 16603.155911622976, "examples_seen": 45312000.0, "progress": 0.3969428671385129, "epoch": 35.72501389595185, "img/sec/core": 189.79940242275995, "core_hours_Tesla V100-SXM2-32GB": 66.38355111355608, "core_hours": 66.38355111355608}
{"step": 44300, "global_schedule": 0.7436280846595764, "l2_grads": 1.4459688663482666, "l2_params": 323.7455749511719, "l2_updates": 0.8029535412788391, "training_loss": 2.6923882961273193, "uptime": 16620.019589190953, "examples_seen": 45363200.0, "progress": 0.3973913901522287, "epoch": 35.765381143291904, "img/sec/core": 189.75694874981411, "core_hours_Tesla V100-SXM2-32GB": 66.45850079163598, "core_hours": 66.45850079163598}
{"step": 44350, "global_schedule": 0.7429519891738892, "l2_grads": 1.5491234064102173, "l2_params": 323.6861572265625, "l2_updates": 0.7790606021881104, "training_loss": 2.5366945266723633, "uptime": 16636.91829625197, "examples_seen": 45414400.0, "progress": 0.3978399131659445, "epoch": 35.80574839063196, "img/sec/core": 189.36359973847124, "core_hours_Tesla V100-SXM2-32GB": 66.53360615635161, "core_hours": 66.53360615635161}
{"step": 44400, "global_schedule": 0.7422752380371094, "l2_grads": 1.2916228771209717, "l2_params": 323.6498718261719, "l2_updates": 0.801938533782959, "training_loss": 4.973604679107666, "uptime": 16653.795741020003, "examples_seen": 45465600.0, "progress": 0.39828843617966037, "epoch": 35.84611563797202, "img/sec/core": 189.60216098949562, "core_hours_Tesla V100-SXM2-32GB": 66.60861702198731, "core_hours": 66.60861702198731}
{"step": 44450, "global_schedule": 0.7415978908538818, "l2_grads": 1.163710117340088, "l2_params": 323.5701904296875, "l2_updates": 0.7770938277244568, "training_loss": 4.92521858215332, "uptime": 16670.67178812099, "examples_seen": 45516800.0, "progress": 0.3987369591933762, "epoch": 35.88648288531208, "img/sec/core": 189.61786375985028, "core_hours_Tesla V100-SXM2-32GB": 66.68362167576949, "core_hours": 66.68362167576949}
{"step": 44500, "global_schedule": 0.7409200072288513, "l2_grads": 1.323878288269043, "l2_params": 323.51617431640625, "l2_updates": 0.8107686042785645, "training_loss": 2.6535749435424805, "uptime": 16687.54955989198, "examples_seen": 45568000.0, "progress": 0.39918548220709205, "epoch": 35.926850132652135, "img/sec/core": 189.59848749112908, "core_hours_Tesla V100-SXM2-32GB": 66.75863399475166, "core_hours": 66.75863399475166}
{"step": 44550, "global_schedule": 0.740241527557373, "l2_grads": 1.4180271625518799, "l2_params": 323.4524841308594, "l2_updates": 0.8078978061676025, "training_loss": 2.682225227355957, "uptime": 16704.419864956988, "examples_seen": 45619200.0, "progress": 0.3996340052208079, "epoch": 35.96721737999219, "img/sec/core": 189.6824027585297, "core_hours_Tesla V100-SXM2-32GB": 66.83361312837391, "core_hours": 66.83361312837391}
{"step": 44600, "global_schedule": 0.739562451839447, "l2_grads": 1.2615501880645752, "l2_params": 323.3857421875, "l2_updates": 0.7929955720901489, "training_loss": 4.360337257385254, "uptime": 16721.266323001997, "examples_seen": 45670400.0, "progress": 0.4000825282345237, "epoch": 36.00758462733225, "img/sec/core": 189.9509078674276, "core_hours_Tesla V100-SXM2-32GB": 66.90848627524062, "core_hours": 66.90848627524062}
{"step": 44650, "global_schedule": 0.738882839679718, "l2_grads": 1.304904580116272, "l2_params": 323.3095397949219, "l2_updates": 0.7999608516693115, "training_loss": 2.660675048828125, "uptime": 16738.167396834004, "examples_seen": 45721600.0, "progress": 0.40053105124823957, "epoch": 36.047951874672314, "img/sec/core": 189.33708188055795, "core_hours_Tesla V100-SXM2-32GB": 66.98360215893844, "core_hours": 66.98360215893844}
{"step": 44700, "global_schedule": 0.7382026314735413, "l2_grads": 1.265237808227539, "l2_params": 323.22894287109375, "l2_updates": 0.7903068661689758, "training_loss": 3.277709484100342, "uptime": 16755.015854575962, "examples_seen": 45772800.0, "progress": 0.4009795742619554, "epoch": 36.08831912201237, "img/sec/core": 189.92836311841648, "core_hours_Tesla V100-SXM2-32GB": 67.05848419334714, "core_hours": 67.05848419334714}
{"step": 44750, "global_schedule": 0.7375218272209167, "l2_grads": 1.25773024559021, "l2_params": 323.15533447265625, "l2_updates": 0.7784228324890137, "training_loss": 5.003547191619873, "uptime": 16771.893401601003, "examples_seen": 45824000.0, "progress": 0.4014280972756712, "epoch": 36.12868636935243, "img/sec/core": 189.60101223550683, "core_hours_Tesla V100-SXM2-32GB": 67.13349551345843, "core_hours": 67.13349551345843}
{"step": 44800, "global_schedule": 0.7368404865264893, "l2_grads": 1.3192908763885498, "l2_params": 323.0783386230469, "l2_updates": 0.7804217338562012, "training_loss": 3.097315549850464, "uptime": 16788.780254512967, "examples_seen": 45875200.0, "progress": 0.40187662028938703, "epoch": 36.16905361669249, "img/sec/core": 189.49652825676975, "core_hours_Tesla V100-SXM2-32GB": 67.20854819306716, "core_hours": 67.20854819306716}
{"step": 44850, "global_schedule": 0.7361586093902588, "l2_grads": 1.4525681734085083, "l2_params": 323.01373291015625, "l2_updates": 0.7827596664428711, "training_loss": 2.4932711124420166, "uptime": 16805.65293757897, "examples_seen": 45926400.0, "progress": 0.4023251433031029, "epoch": 36.209420864032545, "img/sec/core": 189.65566931367212, "core_hours_Tesla V100-SXM2-32GB": 67.28353789558273, "core_hours": 67.28353789558273}
{"step": 44900, "global_schedule": 0.7354761362075806, "l2_grads": 1.3842477798461914, "l2_params": 322.94598388671875, "l2_updates": 0.7737692594528198, "training_loss": 2.58518648147583, "uptime": 16822.526549225964, "examples_seen": 45977600.0, "progress": 0.4027736663168187, "epoch": 36.2497881113726, "img/sec/core": 189.64523226832742, "core_hours_Tesla V100-SXM2-32GB": 67.35853172512492, "core_hours": 67.35853172512492}
{"step": 44950, "global_schedule": 0.7347930669784546, "l2_grads": 1.4229464530944824, "l2_params": 322.87298583984375, "l2_updates": 0.77631014585495, "training_loss": 2.6402745246887207, "uptime": 16839.38177321898, "examples_seen": 46028800.0, "progress": 0.40322218933053455, "epoch": 36.29015535871266, "img/sec/core": 189.85211951655415, "core_hours_Tesla V100-SXM2-32GB": 67.43344383176054, "core_hours": 67.43344383176054}
{"step": 45000, "global_schedule": 0.7341094613075256, "l2_grads": 1.3391164541244507, "l2_params": 322.7866516113281, "l2_updates": 0.80159991979599, "training_loss": 2.73770809173584, "uptime": 16856.246673530957, "examples_seen": 46080000.0, "progress": 0.4036707123442504, "epoch": 36.330522606052725, "img/sec/core": 189.74319093526253, "core_hours_Tesla V100-SXM2-32GB": 67.50839894425822, "core_hours": 67.50839894425822, "minival/prec@1": 0.6554011863877615, "minival/loss": 1.4198544276270537, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.8874605930177495, "real/prec@1": 0.6985716420778444, "real/loss": 2.2555616153870406, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.201766757993028, "train/prec@1": 0.6760722788120048, "train/loss": 1.309935221054029, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.5227554139564745, "v2/prec@1": 0.5029, "v2/loss": 2.226587829589844, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3630735620390624, "val/prec@1": 0.62264, "val/loss": 1.5644752978515626, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.37879992701346}
{"step": 45050, "global_schedule": 0.7334252595901489, "l2_grads": 1.3378232717514038, "l2_params": 322.73333740234375, "l2_updates": 0.7877411842346191, "training_loss": 3.2811009883880615, "uptime": 16910.078507495986, "examples_seen": 46131200.0, "progress": 0.40411923535796623, "epoch": 36.37088985339278, "img/sec/core": 189.0719580966164, "core_hours_Tesla V100-SXM2-32GB": 67.58362015826266, "core_hours": 67.58362015826266}
{"step": 45100, "global_schedule": 0.7327405214309692, "l2_grads": 1.4156036376953125, "l2_params": 322.6701965332031, "l2_updates": 0.792249321937561, "training_loss": 2.712813138961792, "uptime": 16926.947432035988, "examples_seen": 46182400.0, "progress": 0.4045677583716821, "epoch": 36.41125710073284, "img/sec/core": 189.69792605401267, "core_hours_Tesla V100-SXM2-32GB": 67.65859315621822, "core_hours": 67.65859315621822}
{"step": 45150, "global_schedule": 0.7320552468299866, "l2_grads": 1.415884017944336, "l2_params": 322.6090087890625, "l2_updates": 0.7909666895866394, "training_loss": 2.694878339767456, "uptime": 16943.831812232966, "examples_seen": 46233600.0, "progress": 0.40501628138539786, "epoch": 36.4516243480729, "img/sec/core": 189.52427999535135, "core_hours_Tesla V100-SXM2-32GB": 67.73363484598256, "core_hours": 67.73363484598256}
{"step": 45200, "global_schedule": 0.7313693761825562, "l2_grads": 1.3041185140609741, "l2_params": 322.53997802734375, "l2_updates": 0.7888206839561462, "training_loss": 2.4068894386291504, "uptime": 16960.700522253, "examples_seen": 46284800.0, "progress": 0.4054648043991137, "epoch": 36.491991595412955, "img/sec/core": 189.70033844909892, "core_hours_Tesla V100-SXM2-32GB": 67.80860689051605, "core_hours": 67.80860689051605}
{"step": 45250, "global_schedule": 0.7306829690933228, "l2_grads": 1.4598685503005981, "l2_params": 322.4724426269531, "l2_updates": 0.7603955268859863, "training_loss": 2.570876121520996, "uptime": 16977.582904735988, "examples_seen": 46336000.0, "progress": 0.40591332741282954, "epoch": 36.53235884275301, "img/sec/core": 189.54670664667293, "core_hours_Tesla V100-SXM2-32GB": 67.88363970155154, "core_hours": 67.88363970155154}
{"step": 45300, "global_schedule": 0.7299960255622864, "l2_grads": 1.2363561391830444, "l2_params": 322.4049377441406, "l2_updates": 0.7926284074783325, "training_loss": 4.681086540222168, "uptime": 16994.472795488953, "examples_seen": 46387200.0, "progress": 0.4063618504265454, "epoch": 36.57272609009307, "img/sec/core": 189.4624451279019, "core_hours_Tesla V100-SXM2-32GB": 67.95870588267584, "core_hours": 67.95870588267584}
{"step": 45350, "global_schedule": 0.729308545589447, "l2_grads": 1.4354701042175293, "l2_params": 322.3515625, "l2_updates": 0.7967221736907959, "training_loss": 2.7377607822418213, "uptime": 17011.344355679, "examples_seen": 46438400.0, "progress": 0.4068103734402612, "epoch": 36.613093337433135, "img/sec/core": 189.66829172607606, "core_hours_Tesla V100-SXM2-32GB": 68.03369059463161, "core_hours": 68.03369059463161}
{"step": 45400, "global_schedule": 0.7286205291748047, "l2_grads": 1.4653406143188477, "l2_params": 322.2652282714844, "l2_updates": 0.793682873249054, "training_loss": 2.667757749557495, "uptime": 17028.22907190997, "examples_seen": 46489600.0, "progress": 0.40725889645397706, "epoch": 36.65346058477319, "img/sec/core": 189.52050814634586, "core_hours_Tesla V100-SXM2-32GB": 68.10873377788036, "core_hours": 68.10873377788036}
{"step": 45450, "global_schedule": 0.7279319167137146, "l2_grads": 1.1017589569091797, "l2_params": 322.1870422363281, "l2_updates": 0.7631024718284607, "training_loss": 4.567234516143799, "uptime": 17045.11243248696, "examples_seen": 46540800.0, "progress": 0.4077074194676929, "epoch": 36.69382783211325, "img/sec/core": 189.53572574651503, "core_hours_Tesla V100-SXM2-32GB": 68.18377093600031, "core_hours": 68.18377093600031}
{"step": 45500, "global_schedule": 0.7272427678108215, "l2_grads": 1.59461510181427, "l2_params": 322.1127014160156, "l2_updates": 0.7724963426589966, "training_loss": 2.5477137565612793, "uptime": 17062.00602360099, "examples_seen": 46592000.0, "progress": 0.40815594248140874, "epoch": 36.73419507945331, "img/sec/core": 189.4209453987937, "core_hours_Tesla V100-SXM2-32GB": 68.25885356317377, "core_hours": 68.25885356317377}
{"step": 45550, "global_schedule": 0.7265530824661255, "l2_grads": 1.4676690101623535, "l2_params": 322.052490234375, "l2_updates": 0.7801100611686707, "training_loss": 2.4469730854034424, "uptime": 17078.873661828984, "examples_seen": 46643200.0, "progress": 0.4086044654951246, "epoch": 36.774562326793365, "img/sec/core": 189.71239225945158, "core_hours_Tesla V100-SXM2-32GB": 68.33382084418709, "core_hours": 68.33382084418709}
{"step": 45600, "global_schedule": 0.7258628606796265, "l2_grads": 1.249758005142212, "l2_params": 321.99383544921875, "l2_updates": 0.7675273418426514, "training_loss": 5.090100288391113, "uptime": 17095.756448031985, "examples_seen": 46694400.0, "progress": 0.40905298850884036, "epoch": 36.81492957413342, "img/sec/core": 189.54217399442953, "core_hours_Tesla V100-SXM2-32GB": 68.40885544953376, "core_hours": 68.40885544953376}
{"step": 45650, "global_schedule": 0.7251721024513245, "l2_grads": 1.4234323501586914, "l2_params": 321.9258728027344, "l2_updates": 0.7898192405700684, "training_loss": 2.6170358657836914, "uptime": 17112.624339114, "examples_seen": 46745600.0, "progress": 0.4095015115225562, "epoch": 36.85529682147348, "img/sec/core": 189.70954842195314, "core_hours_Tesla V100-SXM2-32GB": 68.48382385434273, "core_hours": 68.48382385434273}
{"step": 45700, "global_schedule": 0.7244807481765747, "l2_grads": 1.4763753414154053, "l2_params": 321.88690185546875, "l2_updates": 0.7751296162605286, "training_loss": 2.5561506748199463, "uptime": 17129.505295662966, "examples_seen": 46796800.0, "progress": 0.40995003453627205, "epoch": 36.895664068813545, "img/sec/core": 189.56271765276668, "core_hours_Tesla V100-SXM2-32GB": 68.55885032789368, "core_hours": 68.55885032789368}
{"step": 45750, "global_schedule": 0.7237889170646667, "l2_grads": 1.3957334756851196, "l2_params": 321.8247985839844, "l2_updates": 0.7745004296302795, "training_loss": 2.4562861919403076, "uptime": 17146.383874058956, "examples_seen": 46848000.0, "progress": 0.4103985575499879, "epoch": 36.9360313161536, "img/sec/core": 189.58942660480326, "core_hours_Tesla V100-SXM2-32GB": 68.63386623187586, "core_hours": 68.63386623187586}
{"step": 45800, "global_schedule": 0.7230965495109558, "l2_grads": 1.4460067749023438, "l2_params": 321.7500915527344, "l2_updates": 0.7741921544075012, "training_loss": 2.6296210289001465, "uptime": 17163.255330509972, "examples_seen": 46899200.0, "progress": 0.4108470805637037, "epoch": 36.97639856349366, "img/sec/core": 189.66945795645177, "core_hours_Tesla V100-SXM2-32GB": 68.70885048276926, "core_hours": 68.70885048276926}
{"step": 45850, "global_schedule": 0.7224036455154419, "l2_grads": 1.4718424081802368, "l2_params": 321.7050476074219, "l2_updates": 0.7705040574073792, "training_loss": 2.5506157875061035, "uptime": 17180.12252947595, "examples_seen": 46950400.0, "progress": 0.41129560357741957, "epoch": 37.01676581083372, "img/sec/core": 189.7173328218032, "core_hours_Tesla V100-SXM2-32GB": 68.78381581150694, "core_hours": 68.78381581150694}
{"step": 45900, "global_schedule": 0.721710205078125, "l2_grads": 1.4229286909103394, "l2_params": 321.6416015625, "l2_updates": 0.7574708461761475, "training_loss": 2.534909963607788, "uptime": 17196.996711580956, "examples_seen": 47001600.0, "progress": 0.4117441265911354, "epoch": 37.057133058173775, "img/sec/core": 189.6388210158425, "core_hours_Tesla V100-SXM2-32GB": 68.85881217641807, "core_hours": 68.85881217641807}
{"step": 45950, "global_schedule": 0.7210161685943604, "l2_grads": 1.1953610181808472, "l2_params": 321.57061767578125, "l2_updates": 0.7839407920837402, "training_loss": 4.9922075271606445, "uptime": 17213.897736490006, "examples_seen": 47052800.0, "progress": 0.41219264960485125, "epoch": 37.09750030551383, "img/sec/core": 189.33762994968097, "core_hours_Tesla V100-SXM2-32GB": 68.93392784268052, "core_hours": 68.93392784268052}
{"step": 46000, "global_schedule": 0.7203216552734375, "l2_grads": 1.3531622886657715, "l2_params": 321.5274658203125, "l2_updates": 0.7949368953704834, "training_loss": 2.473228931427002, "uptime": 17230.761285997985, "examples_seen": 47104000.0, "progress": 0.41264117261856703, "epoch": 37.13786755285389, "img/sec/core": 189.75838974385385, "core_hours_Tesla V100-SXM2-32GB": 69.00887695160488, "core_hours": 69.00887695160488}
{"step": 46050, "global_schedule": 0.7196266651153564, "l2_grads": 1.5015934705734253, "l2_params": 321.4689025878906, "l2_updates": 0.7550429105758667, "training_loss": 2.457886219024658, "uptime": 17248.164604505, "examples_seen": 47155200.0, "progress": 0.41308969563228287, "epoch": 37.178234800193955, "img/sec/core": 189.40395465464889, "core_hours_Tesla V100-SXM2-32GB": 69.08396631416942, "core_hours": 69.08396631416942}
{"step": 46100, "global_schedule": 0.7189310789108276, "l2_grads": 1.2854208946228027, "l2_params": 321.4065856933594, "l2_updates": 0.7643957734107971, "training_loss": 3.5053365230560303, "uptime": 17265.056939475995, "examples_seen": 47206400.0, "progress": 0.4135382186459987, "epoch": 37.21860204753401, "img/sec/core": 189.43503106554488, "core_hours_Tesla V100-SXM2-32GB": 69.15904335848495, "core_hours": 69.15904335848495}
{"step": 46150, "global_schedule": 0.7182350158691406, "l2_grads": 1.4067305326461792, "l2_params": 321.338623046875, "l2_updates": 0.7634235620498657, "training_loss": 2.590942144393921, "uptime": 17281.954539839993, "examples_seen": 47257600.0, "progress": 0.41398674165971455, "epoch": 37.25896929487407, "img/sec/core": 189.37600198060522, "core_hours_Tesla V100-SXM2-32GB": 69.23414380454716, "core_hours": 69.23414380454716}
{"step": 46200, "global_schedule": 0.7175383567810059, "l2_grads": 1.4390451908111572, "l2_params": 321.2410583496094, "l2_updates": 0.7888691425323486, "training_loss": 2.6288890838623047, "uptime": 17298.842632734973, "examples_seen": 47308800.0, "progress": 0.4144352646734304, "epoch": 37.29933654221413, "img/sec/core": 189.48261475700204, "core_hours_Tesla V100-SXM2-32GB": 69.30920199519151, "core_hours": 69.30920199519151}
{"step": 46250, "global_schedule": 0.7168412208557129, "l2_grads": 1.3865987062454224, "l2_params": 321.1922302246094, "l2_updates": 0.7876888513565063, "training_loss": 2.519134521484375, "uptime": 17315.72610729799, "examples_seen": 47360000.0, "progress": 0.41488378768714623, "epoch": 37.339703789554186, "img/sec/core": 189.53444612697277, "core_hours_Tesla V100-SXM2-32GB": 69.38423965991605, "core_hours": 69.38423965991605}
{"step": 46300, "global_schedule": 0.7161436080932617, "l2_grads": 1.221444010734558, "l2_params": 321.14300537109375, "l2_updates": 0.7670636177062988, "training_loss": 3.7423861026763916, "uptime": 17332.587977143005, "examples_seen": 47411200.0, "progress": 0.4153323107008621, "epoch": 37.38007103689424, "img/sec/core": 189.7772921634757, "core_hours_Tesla V100-SXM2-32GB": 69.45918130367166, "core_hours": 69.45918130367166}
{"step": 46350, "global_schedule": 0.7154453992843628, "l2_grads": 1.5362974405288696, "l2_params": 321.0589599609375, "l2_updates": 0.7700109481811523, "training_loss": 2.621626377105713, "uptime": 17349.466023241985, "examples_seen": 47462400.0, "progress": 0.4157808337145779, "epoch": 37.4204382842343, "img/sec/core": 189.59540584459978, "core_hours_Tesla V100-SXM2-32GB": 69.53419484188935, "core_hours": 69.53419484188935}
{"step": 46400, "global_schedule": 0.7147467136383057, "l2_grads": 1.503401279449463, "l2_params": 320.99951171875, "l2_updates": 0.7688885927200317, "training_loss": 2.493473768234253, "uptime": 17366.34186686395, "examples_seen": 47513600.0, "progress": 0.41622935672829375, "epoch": 37.460805531574366, "img/sec/core": 189.62015006082348, "core_hours_Tesla V100-SXM2-32GB": 69.60919859132031, "core_hours": 69.60919859132031}
{"step": 46450, "global_schedule": 0.7140475511550903, "l2_grads": 1.3891340494155884, "l2_params": 320.909912109375, "l2_updates": 0.7790477871894836, "training_loss": 2.4658398628234863, "uptime": 17383.211188088986, "examples_seen": 47564800.0, "progress": 0.41667787974200954, "epoch": 37.50117277891442, "img/sec/core": 189.6934652741545, "core_hours_Tesla V100-SXM2-32GB": 69.68417335232047, "core_hours": 69.68417335232047}
{"step": 46500, "global_schedule": 0.7133477926254272, "l2_grads": 1.3528238534927368, "l2_params": 320.8541564941406, "l2_updates": 0.7638377547264099, "training_loss": 2.8017520904541016, "uptime": 17400.102725704957, "examples_seen": 47616000.0, "progress": 0.4171264027557254, "epoch": 37.54154002625448, "img/sec/core": 189.44397323393207, "core_hours_Tesla V100-SXM2-32GB": 69.7592468528359, "core_hours": 69.7592468528359}
{"step": 46550, "global_schedule": 0.712647557258606, "l2_grads": 1.4424508810043335, "l2_params": 320.7784118652344, "l2_updates": 0.7617167234420776, "training_loss": 2.582874298095703, "uptime": 17416.96806159598, "examples_seen": 47667200.0, "progress": 0.4175749257694412, "epoch": 37.58190727359454, "img/sec/core": 189.73829046021123, "core_hours_Tesla V100-SXM2-32GB": 69.83420390124044, "core_hours": 69.83420390124044}
{"step": 46600, "global_schedule": 0.7119468450546265, "l2_grads": 1.4505609273910522, "l2_params": 320.7070007324219, "l2_updates": 0.7721511125564575, "training_loss": 2.6940977573394775, "uptime": 17433.834683461, "examples_seen": 47718400.0, "progress": 0.41802344878315706, "epoch": 37.622274520934596, "img/sec/core": 189.72382410712342, "core_hours_Tesla V100-SXM2-32GB": 69.90916666508497, "core_hours": 69.90916666508497}
{"step": 46650, "global_schedule": 0.711245596408844, "l2_grads": 1.5044969320297241, "l2_params": 320.6263122558594, "l2_updates": 0.7495518922805786, "training_loss": 2.5475516319274902, "uptime": 17450.691180580005, "examples_seen": 47769600.0, "progress": 0.4184719717968729, "epoch": 37.66264176827465, "img/sec/core": 189.8377804954446, "core_hours_Tesla V100-SXM2-32GB": 69.98408443005833, "core_hours": 69.98408443005833}
{"step": 46700, "global_schedule": 0.7105438709259033, "l2_grads": 1.3568778038024902, "l2_params": 320.55322265625, "l2_updates": 0.7737728357315063, "training_loss": 2.769301652908325, "uptime": 17467.564365861996, "examples_seen": 47820800.0, "progress": 0.41892049481058874, "epoch": 37.70300901561471, "img/sec/core": 189.65002437420054, "core_hours_Tesla V100-SXM2-32GB": 70.05907636464495, "core_hours": 70.05907636464495}
{"step": 46750, "global_schedule": 0.7098416090011597, "l2_grads": 1.3662304878234863, "l2_params": 320.4874267578125, "l2_updates": 0.7731575965881348, "training_loss": 2.568695068359375, "uptime": 17484.43421136297, "examples_seen": 47872000.0, "progress": 0.4193690178243046, "epoch": 37.74337626295477, "img/sec/core": 189.68757003823848, "core_hours_Tesla V100-SXM2-32GB": 70.13405345576038, "core_hours": 70.13405345576038}
{"step": 46800, "global_schedule": 0.709138810634613, "l2_grads": 1.4824012517929077, "l2_params": 320.4166259765625, "l2_updates": 0.7677547931671143, "training_loss": 2.631391763687134, "uptime": 17501.304519246973, "examples_seen": 47923200.0, "progress": 0.4198175408380204, "epoch": 37.78374351029483, "img/sec/core": 189.68237106295356, "core_hours_Tesla V100-SXM2-32GB": 70.20903260191152, "core_hours": 70.20903260191152}
{"step": 46850, "global_schedule": 0.708435595035553, "l2_grads": 1.4179054498672485, "l2_params": 320.3368225097656, "l2_updates": 0.755925178527832, "training_loss": 2.581422805786133, "uptime": 17518.181821862992, "examples_seen": 47974400.0, "progress": 0.42026606385173626, "epoch": 37.82411075763489, "img/sec/core": 189.60375794664003, "core_hours_Tesla V100-SXM2-32GB": 70.2840428357605, "core_hours": 70.2840428357605}
{"step": 46900, "global_schedule": 0.7077318429946899, "l2_grads": 1.4689810276031494, "l2_params": 320.23876953125, "l2_updates": 0.7551925182342529, "training_loss": 2.591853618621826, "uptime": 17535.032604517997, "examples_seen": 48025600.0, "progress": 0.42071458686545204, "epoch": 37.86447800497495, "img/sec/core": 189.90215858309483, "core_hours_Tesla V100-SXM2-32GB": 70.35893520311608, "core_hours": 70.35893520311608}
{"step": 46950, "global_schedule": 0.7070275545120239, "l2_grads": 1.4181767702102661, "l2_params": 320.150634765625, "l2_updates": 0.7709230780601501, "training_loss": 2.8297853469848633, "uptime": 17551.898324629, "examples_seen": 48076800.0, "progress": 0.4211631098791679, "epoch": 37.904845252315006, "img/sec/core": 189.7339680095984, "core_hours_Tesla V100-SXM2-32GB": 70.43389395916499, "core_hours": 70.43389395916499}
{"step": 47000, "global_schedule": 0.7063227891921997, "l2_grads": 1.4313353300094604, "l2_params": 320.08502197265625, "l2_updates": 0.7455776333808899, "training_loss": 2.58750581741333, "uptime": 17568.778616949974, "examples_seen": 48128000.0, "progress": 0.4216116328928837, "epoch": 37.945212499655064, "img/sec/core": 189.57017681643458, "core_hours_Tesla V100-SXM2-32GB": 70.50891748059152, "core_hours": 70.50891748059152}
{"step": 47050, "global_schedule": 0.7056175470352173, "l2_grads": 1.4175198078155518, "l2_params": 320.0176696777344, "l2_updates": 0.775524914264679, "training_loss": 2.587520122528076, "uptime": 17586.433923235978, "examples_seen": 48179200.0, "progress": 0.42206015590659957, "epoch": 37.98557974699512, "img/sec/core": 190.00925406708237, "core_hours_Tesla V100-SXM2-32GB": 70.58376763613818, "core_hours": 70.58376763613818}
{"step": 47100, "global_schedule": 0.7049118280410767, "l2_grads": 1.4519788026809692, "l2_params": 319.9799499511719, "l2_updates": 0.7664903998374939, "training_loss": 2.725520133972168, "uptime": 17603.320336222998, "examples_seen": 48230400.0, "progress": 0.4225086789203154, "epoch": 38.02594699433518, "img/sec/core": 189.5014650215978, "core_hours_Tesla V100-SXM2-32GB": 70.65881836052493, "core_hours": 70.65881836052493}
{"step": 47150, "global_schedule": 0.7042055726051331, "l2_grads": 1.3564165830612183, "l2_params": 319.8872985839844, "l2_updates": 0.757279634475708, "training_loss": 2.5915637016296387, "uptime": 17620.191596473975, "examples_seen": 48281600.0, "progress": 0.42295720193403125, "epoch": 38.066314241675244, "img/sec/core": 189.67166366927054, "core_hours_Tesla V100-SXM2-32GB": 70.73380173941815, "core_hours": 70.73380173941815}
{"step": 47200, "global_schedule": 0.7034988403320312, "l2_grads": 1.1857781410217285, "l2_params": 319.8534240722656, "l2_updates": 0.7621721625328064, "training_loss": 4.930863380432129, "uptime": 17637.044551105995, "examples_seen": 48332800.0, "progress": 0.4234057249477471, "epoch": 38.1066814890153, "img/sec/core": 189.877684350969, "core_hours_Tesla V100-SXM2-32GB": 70.8087037600049, "core_hours": 70.8087037600049}
{"step": 47250, "global_schedule": 0.702791690826416, "l2_grads": 1.270399570465088, "l2_params": 319.7825927734375, "l2_updates": 0.7606745362281799, "training_loss": 2.8615922927856445, "uptime": 17653.918523381988, "examples_seen": 48384000.0, "progress": 0.4238542479614629, "epoch": 38.14704873635536, "img/sec/core": 189.6411791877093, "core_hours_Tesla V100-SXM2-32GB": 70.88369919234266, "core_hours": 70.88369919234266}
{"step": 47300, "global_schedule": 0.702083945274353, "l2_grads": 1.4934026002883911, "l2_params": 319.7244567871094, "l2_updates": 0.7505802512168884, "training_loss": 2.7723937034606934, "uptime": 17670.79942108097, "examples_seen": 48435200.0, "progress": 0.4243027709751787, "epoch": 38.187415983695416, "img/sec/core": 189.5633785040322, "core_hours_Tesla V100-SXM2-32GB": 70.95872540433814, "core_hours": 70.95872540433814}
{"step": 47350, "global_schedule": 0.7013757824897766, "l2_grads": 1.438652753829956, "l2_params": 319.622314453125, "l2_updates": 0.7673612833023071, "training_loss": 2.6392533779144287, "uptime": 17687.66137820098, "examples_seen": 48486400.0, "progress": 0.42475129398889455, "epoch": 38.227783231035474, "img/sec/core": 189.7763099042908, "core_hours_Tesla V100-SXM2-32GB": 71.03366743598262, "core_hours": 71.03366743598262}
{"step": 47400, "global_schedule": 0.700667142868042, "l2_grads": 1.5435630083084106, "l2_params": 319.5403747558594, "l2_updates": 0.747704803943634, "training_loss": 2.6883749961853027, "uptime": 17704.526294020994, "examples_seen": 48537600.0, "progress": 0.4251998170026104, "epoch": 38.26815047837553, "img/sec/core": 189.74301645802598, "core_hours_Tesla V100-SXM2-32GB": 71.10862261740492, "core_hours": 71.10862261740492}
{"step": 47450, "global_schedule": 0.6999579668045044, "l2_grads": 1.4516282081604004, "l2_params": 319.49371337890625, "l2_updates": 0.7544882297515869, "training_loss": 2.556163787841797, "uptime": 17721.390116330003, "examples_seen": 48588800.0, "progress": 0.42564834001632623, "epoch": 38.30851772571559, "img/sec/core": 189.75532007891496, "core_hours_Tesla V100-SXM2-32GB": 71.18357293877828, "core_hours": 71.18357293877828}
{"step": 47501, "global_schedule": 0.6992483735084534, "l2_grads": 1.2137998342514038, "l2_params": 319.4100646972656, "l2_updates": 0.7423328161239624, "training_loss": 4.096095085144043, "uptime": 17738.254918983963, "examples_seen": 48640000.0, "progress": 0.4260968630300421, "epoch": 38.348884973055654, "img/sec/core": 189.74428966998377, "core_hours_Tesla V100-SXM2-32GB": 71.25852761724033, "core_hours": 71.25852761724033, "minival/prec@1": 0.6524352169840775, "minival/loss": 1.4674449948046753, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.888236225990113, "real/prec@1": 0.6963298247112326, "real/loss": 2.3105835401398735, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.150904733978678, "train/prec@1": 0.6754478398314014, "train/loss": 1.3586795954869353, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.5958707260433584, "v2/prec@1": 0.4968, "v2/loss": 2.287214794921875, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.405589335015975, "val/prec@1": 0.62098, "val/loss": 1.6152903857421874, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.2894827509881}
{"step": 47550, "global_schedule": 0.6985383033752441, "l2_grads": 1.4651432037353516, "l2_params": 319.3548583984375, "l2_updates": 0.7481120824813843, "training_loss": 2.4905362129211426, "uptime": 17791.495810428984, "examples_seen": 48691200.0, "progress": 0.4265453860437579, "epoch": 38.38925222039571, "img/sec/core": 189.25026721256063, "core_hours_Tesla V100-SXM2-32GB": 71.33367795880496, "core_hours": 71.33367795880496}
{"step": 47600, "global_schedule": 0.6978276968002319, "l2_grads": 1.2751216888427734, "l2_params": 319.2693786621094, "l2_updates": 0.7309743165969849, "training_loss": 4.836641311645508, "uptime": 17808.352810007986, "examples_seen": 48742400.0, "progress": 0.42699390905747375, "epoch": 38.42961946773577, "img/sec/core": 189.83212196232517, "core_hours_Tesla V100-SXM2-32GB": 71.40859795693386, "core_hours": 71.40859795693386}
{"step": 47650, "global_schedule": 0.6971166729927063, "l2_grads": 1.291064739227295, "l2_params": 319.1983642578125, "l2_updates": 0.7395052313804626, "training_loss": 4.886907577514648, "uptime": 17825.19642567495, "examples_seen": 48793600.0, "progress": 0.4274424320711896, "epoch": 38.46998671507583, "img/sec/core": 189.98296228501798, "core_hours_Tesla V100-SXM2-32GB": 71.48345847100926, "core_hours": 71.48345847100926}
{"step": 47700, "global_schedule": 0.6964051723480225, "l2_grads": 1.591639518737793, "l2_params": 319.1264343261719, "l2_updates": 0.7478221654891968, "training_loss": 2.7137131690979004, "uptime": 17842.068518846005, "examples_seen": 48844800.0, "progress": 0.42789095508490543, "epoch": 38.510353962415884, "img/sec/core": 189.66230019933778, "core_hours_Tesla V100-SXM2-32GB": 71.5584455517695, "core_hours": 71.5584455517695}
{"step": 47750, "global_schedule": 0.6956931352615356, "l2_grads": 1.2017829418182373, "l2_params": 319.04827880859375, "l2_updates": 0.7399882674217224, "training_loss": 3.863844394683838, "uptime": 17858.91415749595, "examples_seen": 48896000.0, "progress": 0.4283394780986212, "epoch": 38.55072120975594, "img/sec/core": 189.96014734118324, "core_hours_Tesla V100-SXM2-32GB": 71.63331505688036, "core_hours": 71.63331505688036}
{"step": 47800, "global_schedule": 0.6949806809425354, "l2_grads": 1.4103529453277588, "l2_params": 318.9739990234375, "l2_updates": 0.7669817209243774, "training_loss": 2.405177116394043, "uptime": 17875.77892247797, "examples_seen": 48947200.0, "progress": 0.42878800111233706, "epoch": 38.591088457096, "img/sec/core": 189.74471351434158, "core_hours_Tesla V100-SXM2-32GB": 71.70826956791157, "core_hours": 71.70826956791157}
{"step": 47850, "global_schedule": 0.694267749786377, "l2_grads": 1.3918981552124023, "l2_params": 318.9102783203125, "l2_updates": 0.7424278855323792, "training_loss": 2.690722703933716, "uptime": 17892.649369425955, "examples_seen": 48998400.0, "progress": 0.4292365241260529, "epoch": 38.631455704436064, "img/sec/core": 189.68080750119927, "core_hours_Tesla V100-SXM2-32GB": 71.78324933212483, "core_hours": 71.78324933212483}
{"step": 47900, "global_schedule": 0.6935544013977051, "l2_grads": 1.4961169958114624, "l2_params": 318.8366394042969, "l2_updates": 0.7408331632614136, "training_loss": 2.8198485374450684, "uptime": 17909.492783035967, "examples_seen": 49049600.0, "progress": 0.42968504713976874, "epoch": 38.67182295177612, "img/sec/core": 189.98524135855652, "core_hours_Tesla V100-SXM2-32GB": 71.85810894816933, "core_hours": 71.85810894816933}
{"step": 47950, "global_schedule": 0.6928405165672302, "l2_grads": 1.1855450868606567, "l2_params": 318.752197265625, "l2_updates": 0.7463549375534058, "training_loss": 3.897939682006836, "uptime": 17926.358726407983, "examples_seen": 49100800.0, "progress": 0.4301335701534846, "epoch": 38.71219019911618, "img/sec/core": 189.73145642770854, "core_hours_Tesla V100-SXM2-32GB": 71.93306869648941, "core_hours": 71.93306869648941}
{"step": 48000, "global_schedule": 0.6921262145042419, "l2_grads": 1.3167548179626465, "l2_params": 318.673828125, "l2_updates": 0.7239431142807007, "training_loss": 4.322939872741699, "uptime": 17943.213614306005, "examples_seen": 49152000.0, "progress": 0.4305820931672004, "epoch": 38.75255744645624, "img/sec/core": 189.85590526387094, "core_hours_Tesla V100-SXM2-32GB": 72.0079793093695, "core_hours": 72.0079793093695}
{"step": 48050, "global_schedule": 0.6914114356040955, "l2_grads": 1.2868801355361938, "l2_params": 318.59857177734375, "l2_updates": 0.7483699321746826, "training_loss": 3.1901156902313232, "uptime": 17960.855038923968, "examples_seen": 49203200.0, "progress": 0.43103061618091626, "epoch": 38.792924693796294, "img/sec/core": 189.80119409546114, "core_hours_Tesla V100-SXM2-32GB": 72.08291151561826, "core_hours": 72.08291151561826}
{"step": 48100, "global_schedule": 0.6906961798667908, "l2_grads": 1.467477560043335, "l2_params": 318.51458740234375, "l2_updates": 0.7469164729118347, "training_loss": 2.5708789825439453, "uptime": 17977.727915383002, "examples_seen": 49254400.0, "progress": 0.4314791391946321, "epoch": 38.83329194113635, "img/sec/core": 189.65349552397393, "core_hours_Tesla V100-SXM2-32GB": 72.15790207765842, "core_hours": 72.15790207765842}
{"step": 48150, "global_schedule": 0.6899805068969727, "l2_grads": 1.4614500999450684, "l2_params": 318.4360046386719, "l2_updates": 0.7471464276313782, "training_loss": 2.5738348960876465, "uptime": 17994.59507303196, "examples_seen": 49305600.0, "progress": 0.4319276622083479, "epoch": 38.87365918847641, "img/sec/core": 189.71779754472882, "core_hours_Tesla V100-SXM2-32GB": 72.2328672227649, "core_hours": 72.2328672227649}
{"step": 48200, "global_schedule": 0.6892643570899963, "l2_grads": 1.428399920463562, "l2_params": 318.3735656738281, "l2_updates": 0.730169951915741, "training_loss": 2.998258590698242, "uptime": 18011.43309682596, "examples_seen": 49356800.0, "progress": 0.4323761852220637, "epoch": 38.914026435816474, "img/sec/core": 190.04605523483517, "core_hours_Tesla V100-SXM2-32GB": 72.30770288407156, "core_hours": 72.30770288407156}
{"step": 48250, "global_schedule": 0.6885477304458618, "l2_grads": 1.314210295677185, "l2_params": 318.3238830566406, "l2_updates": 0.7434439063072205, "training_loss": 4.903190612792969, "uptime": 18028.29959935695, "examples_seen": 49408000.0, "progress": 0.43282470823577956, "epoch": 38.95439368315653, "img/sec/core": 189.72516644280947, "core_hours_Tesla V100-SXM2-32GB": 72.38266511754263, "core_hours": 72.38266511754263}
{"step": 48300, "global_schedule": 0.6878306865692139, "l2_grads": 1.4713315963745117, "l2_params": 318.2491149902344, "l2_updates": 0.7344555258750916, "training_loss": 2.7482383251190186, "uptime": 18045.169371921977, "examples_seen": 49459200.0, "progress": 0.4332732312494954, "epoch": 38.99476093049659, "img/sec/core": 189.6883901466418, "core_hours_Tesla V100-SXM2-32GB": 72.4576418844983, "core_hours": 72.4576418844983}
{"step": 48350, "global_schedule": 0.6871131658554077, "l2_grads": 1.497407078742981, "l2_params": 318.1737060546875, "l2_updates": 0.741878092288971, "training_loss": 2.4128341674804688, "uptime": 18062.05239380995, "examples_seen": 49510400.0, "progress": 0.43372175426321125, "epoch": 39.03512817783665, "img/sec/core": 189.53952800827824, "core_hours_Tesla V100-SXM2-32GB": 72.53267753733374, "core_hours": 72.53267753733374}
{"step": 48401, "global_schedule": 0.6863952279090881, "l2_grads": 1.5161497592926025, "l2_params": 318.1100769042969, "l2_updates": 0.7500162124633789, "training_loss": 2.6983957290649414, "uptime": 18078.924765906995, "examples_seen": 49561600.0, "progress": 0.4341702772769271, "epoch": 39.075495425176705, "img/sec/core": 189.65916479286847, "core_hours_Tesla V100-SXM2-32GB": 72.60766585776506, "core_hours": 72.60766585776506}
{"step": 48450, "global_schedule": 0.6856768131256104, "l2_grads": 1.5788882970809937, "l2_params": 318.0579833984375, "l2_updates": 0.732105016708374, "training_loss": 2.6219711303710938, "uptime": 18095.775565421965, "examples_seen": 49612800.0, "progress": 0.4346188002906429, "epoch": 39.11586267251676, "img/sec/core": 189.9019685776402, "core_hours_Tesla V100-SXM2-32GB": 72.68255830005381, "core_hours": 72.68255830005381}
{"step": 48500, "global_schedule": 0.6849579811096191, "l2_grads": 1.4819191694259644, "l2_params": 317.99188232421875, "l2_updates": 0.7472209930419922, "training_loss": 2.4676671028137207, "uptime": 18112.661810179998, "examples_seen": 49664000.0, "progress": 0.43506732330435877, "epoch": 39.15622991985682, "img/sec/core": 189.5033529274091, "core_hours_Tesla V100-SXM2-32GB": 72.75760827675617, "core_hours": 72.75760827675617}
{"step": 48550, "global_schedule": 0.6842387318611145, "l2_grads": 1.5165759325027466, "l2_params": 317.931640625, "l2_updates": 0.7420027852058411, "training_loss": 2.4898505210876465, "uptime": 18129.51169520797, "examples_seen": 49715200.0, "progress": 0.4355158463180746, "epoch": 39.196597167196884, "img/sec/core": 189.91227505040922, "core_hours_Tesla V100-SXM2-32GB": 72.83249665465827, "core_hours": 72.83249665465827}
{"step": 48600, "global_schedule": 0.6835190057754517, "l2_grads": 1.3296780586242676, "l2_params": 317.8706359863281, "l2_updates": 0.7347358465194702, "training_loss": 4.381101608276367, "uptime": 18146.390152845997, "examples_seen": 49766400.0, "progress": 0.4359643693317904, "epoch": 39.23696441453694, "img/sec/core": 189.5907830340087, "core_hours_Tesla V100-SXM2-32GB": 72.90751202193839, "core_hours": 72.90751202193839}
{"step": 48650, "global_schedule": 0.6827988028526306, "l2_grads": 1.405454158782959, "l2_params": 317.80120849609375, "l2_updates": 0.7519550323486328, "training_loss": 2.397580623626709, "uptime": 18163.253719747998, "examples_seen": 49817600.0, "progress": 0.43641289234550623, "epoch": 39.277331661877, "img/sec/core": 189.75819401649818, "core_hours_Tesla V100-SXM2-32GB": 72.98246120816951, "core_hours": 72.98246120816951}
{"step": 48700, "global_schedule": 0.6820782423019409, "l2_grads": 1.4779306650161743, "l2_params": 317.75079345703125, "l2_updates": 0.7404502630233765, "training_loss": 2.4234020709991455, "uptime": 18180.105187435984, "examples_seen": 49868800.0, "progress": 0.43686141535922207, "epoch": 39.31769890921706, "img/sec/core": 189.8944388257302, "core_hours_Tesla V100-SXM2-32GB": 73.0573566201161, "core_hours": 73.0573566201161}
{"step": 48750, "global_schedule": 0.6813571453094482, "l2_grads": 1.3970396518707275, "l2_params": 317.68780517578125, "l2_updates": 0.7469448447227478, "training_loss": 2.5847342014312744, "uptime": 18196.98275044799, "examples_seen": 49920000.0, "progress": 0.4373099383729379, "epoch": 39.358066156557115, "img/sec/core": 189.60083263937057, "core_hours_Tesla V100-SXM2-32GB": 73.13236801128058, "core_hours": 73.13236801128058}
{"step": 48800, "global_schedule": 0.6806356906890869, "l2_grads": 1.3617891073226929, "l2_params": 317.5859680175781, "l2_updates": 0.7430339455604553, "training_loss": 3.016777753829956, "uptime": 18213.850961611955, "examples_seen": 49971200.0, "progress": 0.43775846138665375, "epoch": 39.39843340389717, "img/sec/core": 189.70594859733154, "core_hours_Tesla V100-SXM2-32GB": 73.20733783867598, "core_hours": 73.20733783867598}
{"step": 48850, "global_schedule": 0.6799137592315674, "l2_grads": 1.4620898962020874, "l2_params": 317.5242614746094, "l2_updates": 0.7266066074371338, "training_loss": 2.339390277862549, "uptime": 18230.71109571698, "examples_seen": 50022400.0, "progress": 0.4382069844003696, "epoch": 39.43880065123723, "img/sec/core": 189.79682961398052, "core_hours_Tesla V100-SXM2-32GB": 73.28227176803165, "core_hours": 73.28227176803165}
{"step": 48900, "global_schedule": 0.6791914701461792, "l2_grads": 1.2814266681671143, "l2_params": 317.4551696777344, "l2_updates": 0.736190140247345, "training_loss": 3.668757438659668, "uptime": 18247.566718415997, "examples_seen": 50073600.0, "progress": 0.43865550741408543, "epoch": 39.47916789857729, "img/sec/core": 189.84762871954428, "core_hours_Tesla V100-SXM2-32GB": 73.35718564669395, "core_hours": 73.35718564669395}
{"step": 48950, "global_schedule": 0.6784687042236328, "l2_grads": 1.4492619037628174, "l2_params": 317.38818359375, "l2_updates": 0.7353284358978271, "training_loss": 2.59751033782959, "uptime": 18264.42302596796, "examples_seen": 50124800.0, "progress": 0.4391040304278013, "epoch": 39.51953514591735, "img/sec/core": 189.8399154224791, "core_hours_Tesla V100-SXM2-32GB": 73.43210256914712, "core_hours": 73.43210256914712}
{"step": 49000, "global_schedule": 0.6777454614639282, "l2_grads": 1.3468042612075806, "l2_params": 317.30474853515625, "l2_updates": 0.7285012602806091, "training_loss": 4.894118309020996, "uptime": 18281.295568678004, "examples_seen": 50176000.0, "progress": 0.43955255344151706, "epoch": 39.55990239325741, "img/sec/core": 189.65724698359656, "core_hours_Tesla V100-SXM2-32GB": 73.50709164785843, "core_hours": 73.50709164785843}
{"step": 49050, "global_schedule": 0.677021861076355, "l2_grads": 1.200028657913208, "l2_params": 317.2196960449219, "l2_updates": 0.7256616353988647, "training_loss": 4.542937278747559, "uptime": 18298.671247257967, "examples_seen": 50227200.0, "progress": 0.4400010764552329, "epoch": 39.60026964059747, "img/sec/core": 189.63197688599757, "core_hours_Tesla V100-SXM2-32GB": 73.58209071951167, "core_hours": 73.58209071951167}
{"step": 49100, "global_schedule": 0.6762977838516235, "l2_grads": 1.4914640188217163, "l2_params": 317.1587829589844, "l2_updates": 0.7240580320358276, "training_loss": 2.439075469970703, "uptime": 18315.525981137005, "examples_seen": 50278400.0, "progress": 0.44044959946894874, "epoch": 39.640636887937525, "img/sec/core": 189.8576401719317, "core_hours_Tesla V100-SXM2-32GB": 73.65700064786296, "core_hours": 73.65700064786296}
{"step": 49150, "global_schedule": 0.6755733489990234, "l2_grads": 1.2302201986312866, "l2_params": 317.0644836425781, "l2_updates": 0.7342239022254944, "training_loss": 4.252891540527344, "uptime": 18332.429607121972, "examples_seen": 50329600.0, "progress": 0.4408981224826646, "epoch": 39.68100413527758, "img/sec/core": 189.3084952805885, "core_hours_Tesla V100-SXM2-32GB": 73.7321278744628, "core_hours": 73.7321278744628}
{"step": 49200, "global_schedule": 0.6748484373092651, "l2_grads": 1.3712462186813354, "l2_params": 316.973876953125, "l2_updates": 0.7300205826759338, "training_loss": 2.698582410812378, "uptime": 18349.29011541599, "examples_seen": 50380800.0, "progress": 0.4413466454963804, "epoch": 39.72137138261764, "img/sec/core": 189.79261741089246, "core_hours_Tesla V100-SXM2-32GB": 73.80706346688068, "core_hours": 73.80706346688068}
{"step": 49250, "global_schedule": 0.6741231679916382, "l2_grads": 1.448704481124878, "l2_params": 316.9052734375, "l2_updates": 0.7345553636550903, "training_loss": 2.3925070762634277, "uptime": 18366.152787761996, "examples_seen": 50432000.0, "progress": 0.44179516851009626, "epoch": 39.7617386299577, "img/sec/core": 189.7682605899858, "core_hours_Tesla V100-SXM2-32GB": 73.88200867730735, "core_hours": 73.88200867730735}
{"step": 49300, "global_schedule": 0.673397421836853, "l2_grads": 1.4865920543670654, "l2_params": 316.8345947265625, "l2_updates": 0.7360889315605164, "training_loss": 2.777615547180176, "uptime": 18383.01953115099, "examples_seen": 50483200.0, "progress": 0.4422436915238121, "epoch": 39.80210587729776, "img/sec/core": 189.7224571572149, "core_hours_Tesla V100-SXM2-32GB": 73.95697198125845, "core_hours": 73.95697198125845}
{"step": 49350, "global_schedule": 0.6726712584495544, "l2_grads": 1.434940218925476, "l2_params": 316.7589416503906, "l2_updates": 0.7307811379432678, "training_loss": 2.4421920776367188, "uptime": 18399.877520254, "examples_seen": 50534400.0, "progress": 0.44269221453752794, "epoch": 39.84247312463782, "img/sec/core": 189.82097926666364, "core_hours_Tesla V100-SXM2-32GB": 74.03189637727182, "core_hours": 74.03189637727182}
{"step": 49400, "global_schedule": 0.6719446182250977, "l2_grads": 1.6855167150497437, "l2_params": 316.6821594238281, "l2_updates": 0.707010805606842, "training_loss": 2.5959367752075195, "uptime": 18416.72432155098, "examples_seen": 50585600.0, "progress": 0.4431407375512438, "epoch": 39.88284037197788, "img/sec/core": 189.94703763575433, "core_hours_Tesla V100-SXM2-32GB": 74.10677104970286, "core_hours": 74.10677104970286}
{"step": 49450, "global_schedule": 0.671217679977417, "l2_grads": 1.4057955741882324, "l2_params": 316.58837890625, "l2_updates": 0.727927565574646, "training_loss": 2.6969642639160156, "uptime": 18433.606622149993, "examples_seen": 50636800.0, "progress": 0.44358926056495956, "epoch": 39.923207619317935, "img/sec/core": 189.54762600229816, "core_hours_Tesla V100-SXM2-32GB": 74.18180349680958, "core_hours": 74.18180349680958}
{"step": 49500, "global_schedule": 0.6704903244972229, "l2_grads": 1.4511280059814453, "l2_params": 316.5111083984375, "l2_updates": 0.7294332385063171, "training_loss": 2.632689952850342, "uptime": 18450.46839252999, "examples_seen": 50688000.0, "progress": 0.4440377835786754, "epoch": 39.96357486665799, "img/sec/core": 189.77841163084963, "core_hours_Tesla V100-SXM2-32GB": 74.25674469849845, "core_hours": 74.25674469849845}
{"step": 49550, "global_schedule": 0.6697624921798706, "l2_grads": 1.5353641510009766, "l2_params": 316.44232177734375, "l2_updates": 0.7170699834823608, "training_loss": 2.4940152168273926, "uptime": 18467.334992774006, "examples_seen": 50739200.0, "progress": 0.44448630659239124, "epoch": 40.00394211399805, "img/sec/core": 189.72406731080855, "core_hours_Tesla V100-SXM2-32GB": 74.33170736624963, "core_hours": 74.33170736624963}
{"step": 49600, "global_schedule": 0.6690343618392944, "l2_grads": 1.5170214176177979, "l2_params": 316.3614807128906, "l2_updates": 0.7220397591590881, "training_loss": 2.4774112701416016, "uptime": 18484.207433110976, "examples_seen": 50790400.0, "progress": 0.4449348296061071, "epoch": 40.04430936133811, "img/sec/core": 189.65839772378467, "core_hours_Tesla V100-SXM2-32GB": 74.40669598996949, "core_hours": 74.40669598996949}
{"step": 49650, "global_schedule": 0.6683057546615601, "l2_grads": 1.362342119216919, "l2_params": 316.3042907714844, "l2_updates": 0.724612832069397, "training_loss": 2.3619844913482666, "uptime": 18501.076057041006, "examples_seen": 50841600.0, "progress": 0.4453833526198229, "epoch": 40.08467660867817, "img/sec/core": 189.70130659581255, "core_hours_Tesla V100-SXM2-32GB": 74.48166765188074, "core_hours": 74.48166765188074}
{"step": 49700, "global_schedule": 0.6675767302513123, "l2_grads": 1.3188859224319458, "l2_params": 316.2341003417969, "l2_updates": 0.7410019636154175, "training_loss": 4.464755535125732, "uptime": 18517.93145723798, "examples_seen": 50892800.0, "progress": 0.44583187563353877, "epoch": 40.12504385601823, "img/sec/core": 189.85013482944643, "core_hours_Tesla V100-SXM2-32GB": 74.55658054164506, "core_hours": 74.55658054164506}
{"step": 49750, "global_schedule": 0.6668473482131958, "l2_grads": 1.539685845375061, "l2_params": 316.1745300292969, "l2_updates": 0.7088398337364197, "training_loss": 2.5147347450256348, "uptime": 18534.795654214977, "examples_seen": 50944000.0, "progress": 0.4462803986472546, "epoch": 40.16541110335829, "img/sec/core": 189.751104328598, "core_hours_Tesla V100-SXM2-32GB": 74.63153252820949, "core_hours": 74.63153252820949}
{"step": 49800, "global_schedule": 0.6661175489425659, "l2_grads": 1.2835910320281982, "l2_params": 316.0917663574219, "l2_updates": 0.7350713610649109, "training_loss": 3.1171302795410156, "uptime": 18551.641597267997, "examples_seen": 50995200.0, "progress": 0.44672892166097045, "epoch": 40.205778350698345, "img/sec/core": 189.9567147964625, "core_hours_Tesla V100-SXM2-32GB": 74.70640338622293, "core_hours": 74.70640338622293}
{"step": 49850, "global_schedule": 0.6653873324394226, "l2_grads": 1.2619506120681763, "l2_params": 316.0464172363281, "l2_updates": 0.7199922800064087, "training_loss": 3.2857632637023926, "uptime": 18568.501906785998, "examples_seen": 51046400.0, "progress": 0.44717744467468623, "epoch": 40.2461455980384, "img/sec/core": 189.79485498671204, "core_hours_Tesla V100-SXM2-32GB": 74.78133809519181, "core_hours": 74.78133809519181}
{"step": 49900, "global_schedule": 0.6646567583084106, "l2_grads": 1.3990637063980103, "l2_params": 315.9806823730469, "l2_updates": 0.7243215441703796, "training_loss": 2.8233160972595215, "uptime": 18585.361985951953, "examples_seen": 51097600.0, "progress": 0.44762596768840207, "epoch": 40.28651284537846, "img/sec/core": 189.79744807257796, "core_hours_Tesla V100-SXM2-32GB": 74.85627178037385, "core_hours": 74.85627178037385}
{"step": 49950, "global_schedule": 0.6639257669448853, "l2_grads": 1.4401808977127075, "l2_params": 315.9087829589844, "l2_updates": 0.731356143951416, "training_loss": 2.5408220291137695, "uptime": 18602.21653550997, "examples_seen": 51148800.0, "progress": 0.4480744907021179, "epoch": 40.32688009271852, "img/sec/core": 189.85971645131514, "core_hours_Tesla V100-SXM2-32GB": 74.93118088952059, "core_hours": 74.93118088952059}
{"step": 50000, "global_schedule": 0.6631943583488464, "l2_grads": 1.3930983543395996, "l2_params": 315.8398742675781, "l2_updates": 0.7149034142494202, "training_loss": 3.0754554271698, "uptime": 18619.082522971963, "examples_seen": 51200000.0, "progress": 0.44852301371583375, "epoch": 40.36724734005858, "img/sec/core": 189.7309604439923, "core_hours_Tesla V100-SXM2-32GB": 75.0061408337961, "core_hours": 75.0061408337961, "minival/prec@1": 0.6611770215423041, "minival/loss": 1.4021833874157283, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.8928237100481056, "real/prec@1": 0.704912782629118, "real/loss": 2.2292630538323066, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.077853019000031, "train/prec@1": 0.6825508332357647, "train/loss": 1.3033645320067997, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.581718856992666, "v2/prec@1": 0.5055, "v2/loss": 2.211890246582031, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.38368490699213, "val/prec@1": 0.62928, "val/loss": 1.5590307763671876, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.321498280973174}
{"step": 50050, "global_schedule": 0.662462592124939, "l2_grads": 1.3555755615234375, "l2_params": 315.762939453125, "l2_updates": 0.7117067575454712, "training_loss": 2.762335777282715, "uptime": 18672.739681451, "examples_seen": 51251200.0, "progress": 0.4489715367295496, "epoch": 40.40761458739864, "img/sec/core": 189.4449012171809, "core_hours_Tesla V100-SXM2-32GB": 75.081213966569, "core_hours": 75.081213966569}
{"step": 50100, "global_schedule": 0.6617304682731628, "l2_grads": 1.4132858514785767, "l2_params": 315.6827392578125, "l2_updates": 0.7192888259887695, "training_loss": 2.5327868461608887, "uptime": 18689.578229546954, "examples_seen": 51302400.0, "progress": 0.44942005974326543, "epoch": 40.4479818347387, "img/sec/core": 190.04013776987716, "core_hours_Tesla V100-SXM2-32GB": 75.15605195810657, "core_hours": 75.15605195810657}
{"step": 50150, "global_schedule": 0.6609979271888733, "l2_grads": 1.4777053594589233, "l2_params": 315.63397216796875, "l2_updates": 0.7185825109481812, "training_loss": 2.611356735229492, "uptime": 18706.440582698968, "examples_seen": 51353600.0, "progress": 0.4498685827569813, "epoch": 40.488349082078756, "img/sec/core": 189.77185278662702, "core_hours_Tesla V100-SXM2-32GB": 75.23099574989328, "core_hours": 75.23099574989328}
{"step": 50200, "global_schedule": 0.6602649688720703, "l2_grads": 1.2308562994003296, "l2_params": 315.5444641113281, "l2_updates": 0.6936029195785522, "training_loss": 4.780708312988281, "uptime": 18723.295555261953, "examples_seen": 51404800.0, "progress": 0.4503171057706971, "epoch": 40.52871632941881, "img/sec/core": 189.85495159021423, "core_hours_Tesla V100-SXM2-32GB": 75.30590673906211, "core_hours": 75.30590673906211}
{"step": 50250, "global_schedule": 0.6595316529273987, "l2_grads": 1.490227222442627, "l2_params": 315.4606628417969, "l2_updates": 0.7058221101760864, "training_loss": 2.5764338970184326, "uptime": 18740.153451169957, "examples_seen": 51456000.0, "progress": 0.45076562878441295, "epoch": 40.56908357675887, "img/sec/core": 189.82202864834622, "core_hours_Tesla V100-SXM2-32GB": 75.38083072087547, "core_hours": 75.38083072087547}
{"step": 50300, "global_schedule": 0.6587979793548584, "l2_grads": 1.4421025514602661, "l2_params": 315.412109375, "l2_updates": 0.7193979620933533, "training_loss": 2.3964853286743164, "uptime": 18757.01695247297, "examples_seen": 51507200.0, "progress": 0.45121415179812874, "epoch": 40.60945082409893, "img/sec/core": 189.7589321754908, "core_hours_Tesla V100-SXM2-32GB": 75.45577961555553, "core_hours": 75.45577961555553}
{"step": 50350, "global_schedule": 0.6580638885498047, "l2_grads": 1.328879475593567, "l2_params": 315.3423767089844, "l2_updates": 0.6888872981071472, "training_loss": 4.0702619552612305, "uptime": 18773.882855428965, "examples_seen": 51558400.0, "progress": 0.4516626748118446, "epoch": 40.64981807143899, "img/sec/core": 189.73191108412738, "core_hours_Tesla V100-SXM2-32GB": 75.53073918424883, "core_hours": 75.53073918424883}
{"step": 50400, "global_schedule": 0.6573293805122375, "l2_grads": 1.7742632627487183, "l2_params": 315.25067138671875, "l2_updates": 0.7006886005401611, "training_loss": 2.5375163555145264, "uptime": 18790.74248734, "examples_seen": 51609600.0, "progress": 0.4521111978255604, "epoch": 40.69018531877905, "img/sec/core": 189.80248304859097, "core_hours_Tesla V100-SXM2-32GB": 75.60567088163121, "core_hours": 75.60567088163121}
{"step": 50450, "global_schedule": 0.6565945744514465, "l2_grads": 1.3668450117111206, "l2_params": 315.16650390625, "l2_updates": 0.6894773244857788, "training_loss": 3.8367550373077393, "uptime": 18807.59694810596, "examples_seen": 51660800.0, "progress": 0.45255972083927626, "epoch": 40.73055256611911, "img/sec/core": 189.86071666341573, "core_hours_Tesla V100-SXM2-32GB": 75.68057959614657, "core_hours": 75.68057959614657}
{"step": 50500, "global_schedule": 0.6558593511581421, "l2_grads": 1.5297811031341553, "l2_params": 315.0876770019531, "l2_updates": 0.6883320808410645, "training_loss": 2.425006628036499, "uptime": 18824.48387612996, "examples_seen": 51712000.0, "progress": 0.4530082438529921, "epoch": 40.770919813459166, "img/sec/core": 189.49568538762537, "core_hours_Tesla V100-SXM2-32GB": 75.7556326095866, "core_hours": 75.7556326095866}
{"step": 50550, "global_schedule": 0.655123770236969, "l2_grads": 1.2918421030044556, "l2_params": 315.0011291503906, "l2_updates": 0.6991780400276184, "training_loss": 3.7344350814819336, "uptime": 18841.319245636987, "examples_seen": 51763200.0, "progress": 0.45345676686670794, "epoch": 40.81128706079922, "img/sec/core": 190.07601815122788, "core_hours_Tesla V100-SXM2-32GB": 75.83045647406226, "core_hours": 75.83045647406226}
{"step": 50600, "global_schedule": 0.6543877720832825, "l2_grads": 1.4905377626419067, "l2_params": 314.9200134277344, "l2_updates": 0.7135938405990601, "training_loss": 2.476370334625244, "uptime": 18858.19594598899, "examples_seen": 51814400.0, "progress": 0.4539052898804238, "epoch": 40.85165430813928, "img/sec/core": 189.61052416978953, "core_hours_Tesla V100-SXM2-32GB": 75.90546403118228, "core_hours": 75.90546403118228}
{"step": 50650, "global_schedule": 0.6536514759063721, "l2_grads": 1.4321949481964111, "l2_params": 314.84063720703125, "l2_updates": 0.7069688439369202, "training_loss": 4.370255947113037, "uptime": 18875.06506146898, "examples_seen": 51865600.0, "progress": 0.4543538128941396, "epoch": 40.89202155547934, "img/sec/core": 189.69577888040465, "core_hours_Tesla V100-SXM2-32GB": 75.98043787776001, "core_hours": 75.98043787776001}
{"step": 50700, "global_schedule": 0.6529147624969482, "l2_grads": 1.2174707651138306, "l2_params": 314.74945068359375, "l2_updates": 0.710701048374176, "training_loss": 4.280279636383057, "uptime": 18891.897084267985, "examples_seen": 51916800.0, "progress": 0.45480233590785546, "epoch": 40.9323888028194, "img/sec/core": 190.11381093122625, "core_hours_Tesla V100-SXM2-32GB": 76.0552468679778, "core_hours": 76.0552468679778}
{"step": 50750, "global_schedule": 0.6521776914596558, "l2_grads": 1.4391024112701416, "l2_params": 314.66754150390625, "l2_updates": 0.7102967500686646, "training_loss": 2.977572441101074, "uptime": 18908.760661561973, "examples_seen": 51968000.0, "progress": 0.45525085892157124, "epoch": 40.97275605015946, "img/sec/core": 189.7580770801624, "core_hours_Tesla V100-SXM2-32GB": 76.13019610039554, "core_hours": 76.13019610039554}
{"step": 50800, "global_schedule": 0.6514402627944946, "l2_grads": 1.3805330991744995, "l2_params": 314.60107421875, "l2_updates": 0.6987720727920532, "training_loss": 4.543438911437988, "uptime": 18925.61477717897, "examples_seen": 52019200.0, "progress": 0.4556993819352871, "epoch": 41.01312329749952, "img/sec/core": 189.8646047481181, "core_hours_Tesla V100-SXM2-32GB": 76.20510328091551, "core_hours": 76.20510328091551}
{"step": 50851, "global_schedule": 0.6507024765014648, "l2_grads": 1.503636121749878, "l2_params": 314.5164489746094, "l2_updates": 0.6904080510139465, "training_loss": 4.9568257331848145, "uptime": 18942.474579898, "examples_seen": 52070400.0, "progress": 0.4561479049490029, "epoch": 41.053490544839576, "img/sec/core": 189.8005601446277, "core_hours_Tesla V100-SXM2-32GB": 76.28003573744454, "core_hours": 76.28003573744454}
{"step": 50900, "global_schedule": 0.6499643325805664, "l2_grads": 1.3260197639465332, "l2_params": 314.4452819824219, "l2_updates": 0.7098727822303772, "training_loss": 3.504533290863037, "uptime": 18959.345486378996, "examples_seen": 52121600.0, "progress": 0.45659642796271876, "epoch": 41.093857792179634, "img/sec/core": 189.67564093871874, "core_hours_Tesla V100-SXM2-32GB": 76.35501754402675, "core_hours": 76.35501754402675}
{"step": 50950, "global_schedule": 0.6492258310317993, "l2_grads": 1.4422672986984253, "l2_params": 314.3760986328125, "l2_updates": 0.6941400170326233, "training_loss": 4.974437236785889, "uptime": 18976.193838820967, "examples_seen": 52172800.0, "progress": 0.4570449509764346, "epoch": 41.13422503951969, "img/sec/core": 189.92955014570697, "core_hours_Tesla V100-SXM2-32GB": 76.42989911043551, "core_hours": 76.42989911043551}
{"step": 51000, "global_schedule": 0.6484869122505188, "l2_grads": 1.456584095954895, "l2_params": 314.2917175292969, "l2_updates": 0.6732382774353027, "training_loss": 4.760926246643066, "uptime": 18993.067722406005, "examples_seen": 52224000.0, "progress": 0.45749347399015045, "epoch": 41.17459228685975, "img/sec/core": 189.64217596223088, "core_hours_Tesla V100-SXM2-32GB": 76.50489414859122, "core_hours": 76.50489414859122}
{"step": 51050, "global_schedule": 0.6477476954460144, "l2_grads": 1.2975205183029175, "l2_params": 314.2178039550781, "l2_updates": 0.6947107315063477, "training_loss": 4.742712020874023, "uptime": 19010.83544924599, "examples_seen": 52275200.0, "progress": 0.4579419970038663, "epoch": 41.21495953419981, "img/sec/core": 189.46765948197557, "core_hours_Tesla V100-SXM2-32GB": 76.57995826381335, "core_hours": 76.57995826381335}
{"step": 51100, "global_schedule": 0.6470081210136414, "l2_grads": 1.5110236406326294, "l2_params": 314.1314697265625, "l2_updates": 0.7027860283851624, "training_loss": 2.336216926574707, "uptime": 19027.73247743596, "examples_seen": 52326400.0, "progress": 0.4583905200175821, "epoch": 41.25532678153987, "img/sec/core": 189.382414707694, "core_hours_Tesla V100-SXM2-32GB": 76.65505616687989, "core_hours": 76.65505616687989}
{"step": 51150, "global_schedule": 0.6462681889533997, "l2_grads": 1.3175820112228394, "l2_params": 314.0466003417969, "l2_updates": 0.6918759346008301, "training_loss": 4.6879425048828125, "uptime": 19044.602801704954, "examples_seen": 52377600.0, "progress": 0.4588390430312979, "epoch": 41.29569402887993, "img/sec/core": 189.68218683745374, "core_hours_Tesla V100-SXM2-32GB": 76.7300353858532, "core_hours": 76.7300353858532}
{"step": 51200, "global_schedule": 0.6455278992652893, "l2_grads": 1.614544153213501, "l2_params": 313.966796875, "l2_updates": 0.6901606321334839, "training_loss": 2.434709072113037, "uptime": 19061.483210904, "examples_seen": 52428800.0, "progress": 0.45928756604501375, "epoch": 41.336061276219986, "img/sec/core": 189.5688642536494, "core_hours_Tesla V100-SXM2-32GB": 76.80505942673786, "core_hours": 76.80505942673786}
{"step": 51250, "global_schedule": 0.6447872519493103, "l2_grads": 1.538686990737915, "l2_params": 313.8843078613281, "l2_updates": 0.6927749514579773, "training_loss": 2.4031238555908203, "uptime": 19078.363402852963, "examples_seen": 52480000.0, "progress": 0.4597360890587296, "epoch": 41.376428523560044, "img/sec/core": 189.57130402753052, "core_hours_Tesla V100-SXM2-32GB": 76.88008250206657, "core_hours": 76.88008250206657}
{"step": 51300, "global_schedule": 0.6440463066101074, "l2_grads": 1.4658608436584473, "l2_params": 313.8067321777344, "l2_updates": 0.7089676856994629, "training_loss": 2.4029431343078613, "uptime": 19095.23048227298, "examples_seen": 52531200.0, "progress": 0.46018461207244543, "epoch": 41.4167957709001, "img/sec/core": 189.7186774494427, "core_hours_Tesla V100-SXM2-32GB": 76.95504729948885, "core_hours": 76.95504729948885}
{"step": 51350, "global_schedule": 0.6433049440383911, "l2_grads": 1.4766223430633545, "l2_params": 313.71636962890625, "l2_updates": 0.7047121524810791, "training_loss": 2.453007221221924, "uptime": 19112.097435413976, "examples_seen": 52582400.0, "progress": 0.46063313508616127, "epoch": 41.45716301824016, "img/sec/core": 189.7200978297553, "core_hours_Tesla V100-SXM2-32GB": 77.03001153567108, "core_hours": 77.03001153567108}
{"step": 51400, "global_schedule": 0.6425632834434509, "l2_grads": 1.3183881044387817, "l2_params": 313.6396789550781, "l2_updates": 0.6879961490631104, "training_loss": 2.9127919673919678, "uptime": 19128.981336183962, "examples_seen": 52633600.0, "progress": 0.4610816580998771, "epoch": 41.49753026558022, "img/sec/core": 189.52966163414695, "core_hours_Tesla V100-SXM2-32GB": 77.1050510946488, "core_hours": 77.1050510946488}
{"step": 51450, "global_schedule": 0.6418212652206421, "l2_grads": 1.5436384677886963, "l2_params": 313.55108642578125, "l2_updates": 0.7017918825149536, "training_loss": 2.427093505859375, "uptime": 19145.831746054988, "examples_seen": 52684800.0, "progress": 0.46153018111359295, "epoch": 41.53789751292028, "img/sec/core": 189.90635981516664, "core_hours_Tesla V100-SXM2-32GB": 77.17994180518669, "core_hours": 77.17994180518669}
{"step": 51500, "global_schedule": 0.6410789489746094, "l2_grads": 1.4670969247817993, "l2_params": 313.4839172363281, "l2_updates": 0.6914559602737427, "training_loss": 2.4957637786865234, "uptime": 19162.716157863964, "examples_seen": 52736000.0, "progress": 0.4619787041273088, "epoch": 41.57826476026034, "img/sec/core": 189.5239251567384, "core_hours_Tesla V100-SXM2-32GB": 77.2549836354488, "core_hours": 77.2549836354488}
{"step": 51550, "global_schedule": 0.6403362154960632, "l2_grads": 1.2654650211334229, "l2_params": 313.4215087890625, "l2_updates": 0.6876266002655029, "training_loss": 3.5760459899902344, "uptime": 19179.587460676965, "examples_seen": 52787200.0, "progress": 0.46242722714102463, "epoch": 41.6186320076004, "img/sec/core": 189.67118517570424, "core_hours_Tesla V100-SXM2-32GB": 77.32996720350658, "core_hours": 77.32996720350658}
{"step": 51600, "global_schedule": 0.6395931839942932, "l2_grads": 1.6417073011398315, "l2_params": 313.34124755859375, "l2_updates": 0.6779351234436035, "training_loss": 2.5238888263702393, "uptime": 19196.457757311, "examples_seen": 52838400.0, "progress": 0.4628757501547404, "epoch": 41.658999254940454, "img/sec/core": 189.68249755277694, "core_hours_Tesla V100-SXM2-32GB": 77.40494629965785, "core_hours": 77.40494629965785}
{"step": 51650, "global_schedule": 0.6388497948646545, "l2_grads": 1.3407665491104126, "l2_params": 313.2707214355469, "l2_updates": 0.6847367286682129, "training_loss": 3.7948355674743652, "uptime": 19213.31869929796, "examples_seen": 52889600.0, "progress": 0.46332427316845626, "epoch": 41.69936650228051, "img/sec/core": 189.78773561255804, "core_hours_Tesla V100-SXM2-32GB": 77.4798838195999, "core_hours": 77.4798838195999}
{"step": 51700, "global_schedule": 0.638106107711792, "l2_grads": 1.244766116142273, "l2_params": 313.2045593261719, "l2_updates": 0.6918233036994934, "training_loss": 3.8736367225646973, "uptime": 19230.191246578994, "examples_seen": 52940800.0, "progress": 0.4637727961821721, "epoch": 41.73973374962057, "img/sec/core": 189.6571956030165, "core_hours_Tesla V100-SXM2-32GB": 77.5548729186267, "core_hours": 77.5548729186267}
{"step": 51750, "global_schedule": 0.6373621225357056, "l2_grads": 1.3394407033920288, "l2_params": 313.1331481933594, "l2_updates": 0.6776254177093506, "training_loss": 3.579895257949829, "uptime": 19247.061363327957, "examples_seen": 52992000.0, "progress": 0.46422131919588794, "epoch": 41.78010099696063, "img/sec/core": 189.68452012619363, "core_hours_Tesla V100-SXM2-32GB": 77.62985121528877, "core_hours": 77.62985121528877}
{"step": 51800, "global_schedule": 0.6366177797317505, "l2_grads": 1.3388910293579102, "l2_params": 313.0439758300781, "l2_updates": 0.6683074831962585, "training_loss": 4.528901100158691, "uptime": 19263.949824299954, "examples_seen": 53043200.0, "progress": 0.4646698422096038, "epoch": 41.82046824430069, "img/sec/core": 189.47848506183857, "core_hours_Tesla V100-SXM2-32GB": 77.70491104183097, "core_hours": 77.70491104183097}
{"step": 51850, "global_schedule": 0.6358730792999268, "l2_grads": 1.4194883108139038, "l2_params": 312.9863586425781, "l2_updates": 0.6769528388977051, "training_loss": 3.9800567626953125, "uptime": 19280.82427375397, "examples_seen": 53094400.0, "progress": 0.4651183652233196, "epoch": 41.86083549164075, "img/sec/core": 189.63581648813965, "core_hours_Tesla V100-SXM2-32GB": 77.77990859495993, "core_hours": 77.77990859495993}
{"step": 51901, "global_schedule": 0.6351280808448792, "l2_grads": 1.6416805982589722, "l2_params": 312.8963928222656, "l2_updates": 0.6694393754005432, "training_loss": 2.5502986907958984, "uptime": 19297.704050565953, "examples_seen": 53145600.0, "progress": 0.46556688823703546, "epoch": 41.90120273898081, "img/sec/core": 189.5759662964347, "core_hours_Tesla V100-SXM2-32GB": 77.85492982523542, "core_hours": 77.85492982523542}
{"step": 51950, "global_schedule": 0.6343827247619629, "l2_grads": 1.2854186296463013, "l2_params": 312.8361511230469, "l2_updates": 0.6765980124473572, "training_loss": 4.272420883178711, "uptime": 19314.584643510985, "examples_seen": 53196800.0, "progress": 0.4660154112507513, "epoch": 41.941569986320864, "img/sec/core": 189.56680078834563, "core_hours_Tesla V100-SXM2-32GB": 77.9299546827689, "core_hours": 77.9299546827689}
{"step": 52000, "global_schedule": 0.6336370706558228, "l2_grads": 1.512825608253479, "l2_params": 312.7268981933594, "l2_updates": 0.6916075944900513, "training_loss": 2.458712577819824, "uptime": 19331.457076683, "examples_seen": 53248000.0, "progress": 0.4664639342644671, "epoch": 41.98193723366092, "img/sec/core": 189.6584782630872, "core_hours_Tesla V100-SXM2-32GB": 78.00494327464452, "core_hours": 78.00494327464452}
{"step": 52050, "global_schedule": 0.6328911185264587, "l2_grads": 1.476454257965088, "l2_params": 312.66949462890625, "l2_updates": 0.692787230014801, "training_loss": 2.457324743270874, "uptime": 19348.867464168987, "examples_seen": 53299200.0, "progress": 0.4669124572781829, "epoch": 42.02230448100098, "img/sec/core": 189.39635332294026, "core_hours_Tesla V100-SXM2-32GB": 78.08003565088458, "core_hours": 78.08003565088458}
{"step": 52100, "global_schedule": 0.6321448087692261, "l2_grads": 1.2134299278259277, "l2_params": 312.5750427246094, "l2_updates": 0.6652112603187561, "training_loss": 4.521340847015381, "uptime": 19365.761729424004, "examples_seen": 53350400.0, "progress": 0.46736098029189876, "epoch": 42.06267172834104, "img/sec/core": 189.41338683252803, "core_hours_Tesla V100-SXM2-32GB": 78.15512127424022, "core_hours": 78.15512127424022}
{"step": 52150, "global_schedule": 0.6313982009887695, "l2_grads": 1.557914137840271, "l2_params": 312.5069274902344, "l2_updates": 0.6843934059143066, "training_loss": 2.4557838439941406, "uptime": 19382.64497377997, "examples_seen": 53401600.0, "progress": 0.4678095033056146, "epoch": 42.1030389756811, "img/sec/core": 189.53703047419594, "core_hours_Tesla V100-SXM2-32GB": 78.23015791582228, "core_hours": 78.23015791582228}
{"step": 52200, "global_schedule": 0.6306512951850891, "l2_grads": 1.5616906881332397, "l2_params": 312.43072509765625, "l2_updates": 0.6820982694625854, "training_loss": 2.5539839267730713, "uptime": 19399.558649907995, "examples_seen": 53452800.0, "progress": 0.46825802631933044, "epoch": 42.14340622302116, "img/sec/core": 189.1960077619038, "core_hours_Tesla V100-SXM2-32GB": 78.30532980972461, "core_hours": 78.30532980972461}
{"step": 52250, "global_schedule": 0.6299040913581848, "l2_grads": 1.4907721281051636, "l2_params": 312.328369140625, "l2_updates": 0.6789114475250244, "training_loss": 2.5701866149902344, "uptime": 19416.47651864396, "examples_seen": 53504000.0, "progress": 0.4687065493330463, "epoch": 42.18377347036122, "img/sec/core": 189.1491209644413, "core_hours_Tesla V100-SXM2-32GB": 78.38052033744002, "core_hours": 78.38052033744002}
{"step": 52300, "global_schedule": 0.6291565299034119, "l2_grads": 1.4373258352279663, "l2_params": 312.27008056640625, "l2_updates": 0.6847111582756042, "training_loss": 2.810183048248291, "uptime": 19433.389705385955, "examples_seen": 53555200.0, "progress": 0.4691550723467621, "epoch": 42.224140717701275, "img/sec/core": 189.20148218164553, "core_hours_Tesla V100-SXM2-32GB": 78.45569005629334, "core_hours": 78.45569005629334}
{"step": 52350, "global_schedule": 0.628408670425415, "l2_grads": 1.436937689781189, "l2_params": 312.1759338378906, "l2_updates": 0.6913280487060547, "training_loss": 2.3848979473114014, "uptime": 19450.281850634958, "examples_seen": 53606400.0, "progress": 0.46960359536047797, "epoch": 42.26450796504133, "img/sec/core": 189.43715868112452, "core_hours_Tesla V100-SXM2-32GB": 78.5307662574, "core_hours": 78.5307662574}
{"step": 52400, "global_schedule": 0.6276605129241943, "l2_grads": 1.518441081047058, "l2_params": 312.1088562011719, "l2_updates": 0.6788763999938965, "training_loss": 2.4463753700256348, "uptime": 19467.179087422963, "examples_seen": 53657600.0, "progress": 0.4700521183741938, "epoch": 42.30487521238139, "img/sec/core": 189.38007676329627, "core_hours_Tesla V100-SXM2-32GB": 78.60586508756892, "core_hours": 78.60586508756892}
{"step": 52450, "global_schedule": 0.6269120573997498, "l2_grads": 1.5472899675369263, "l2_params": 312.0340270996094, "l2_updates": 0.6667422652244568, "training_loss": 4.950223922729492, "uptime": 19484.059656379977, "examples_seen": 53708800.0, "progress": 0.4705006413879096, "epoch": 42.34524245972145, "img/sec/core": 189.56707017095454, "core_hours_Tesla V100-SXM2-32GB": 78.68088983848898, "core_hours": 78.68088983848898}
{"step": 52500, "global_schedule": 0.6261633038520813, "l2_grads": 1.5607563257217407, "l2_params": 311.94952392578125, "l2_updates": 0.6781601905822754, "training_loss": 2.514782667160034, "uptime": 19500.960273836972, "examples_seen": 53760000.0, "progress": 0.47094916440162543, "epoch": 42.38560970706151, "img/sec/core": 189.34219463535402, "core_hours_Tesla V100-SXM2-32GB": 78.7560036938534, "core_hours": 78.7560036938534, "minival/prec@1": 0.6747580393381205, "minival/loss": 1.366498763137708, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.9113781269988976, "real/prec@1": 0.7162713239532847, "real/loss": 2.1846252685093384, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.127187062986195, "train/prec@1": 0.6972251492799438, "train/loss": 1.2426045562234382, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.576671896036714, "v2/prec@1": 0.5151, "v2/loss": 2.1687700927734377, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.391013180022128, "val/prec@1": 0.63998, "val/loss": 1.5091917260742187, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.323688552016392}
{"step": 52550, "global_schedule": 0.6254141926765442, "l2_grads": 1.3810808658599854, "l2_params": 311.8827819824219, "l2_updates": 0.6698980927467346, "training_loss": 3.1239218711853027, "uptime": 19554.224003584997, "examples_seen": 53811200.0, "progress": 0.47139768741534127, "epoch": 42.42597695440157, "img/sec/core": 188.99380273356053, "core_hours_Tesla V100-SXM2-32GB": 78.83125601438728, "core_hours": 78.83125601438728}
{"step": 52601, "global_schedule": 0.624664843082428, "l2_grads": 1.3821265697479248, "l2_params": 311.8002624511719, "l2_updates": 0.6754590272903442, "training_loss": 3.1415507793426514, "uptime": 19571.09599966096, "examples_seen": 53862400.0, "progress": 0.4718462104290571, "epoch": 42.46634420174163, "img/sec/core": 189.66339166940665, "core_hours_Tesla V100-SXM2-32GB": 78.90624266361378, "core_hours": 78.90624266361378}
{"step": 52650, "global_schedule": 0.6239151954650879, "l2_grads": 1.5378817319869995, "l2_params": 311.73138427734375, "l2_updates": 0.6959551572799683, "training_loss": 2.4513816833496094, "uptime": 19587.958073837974, "examples_seen": 53913600.0, "progress": 0.47229473344277295, "epoch": 42.506711449081685, "img/sec/core": 189.7749924716986, "core_hours_Tesla V100-SXM2-32GB": 78.98118521551162, "core_hours": 78.98118521551162}
{"step": 52700, "global_schedule": 0.6231651902198792, "l2_grads": 1.4869846105575562, "l2_params": 311.68365478515625, "l2_updates": 0.6846522092819214, "training_loss": 2.744997501373291, "uptime": 19604.811444727995, "examples_seen": 53964800.0, "progress": 0.4727432564564888, "epoch": 42.54707869642174, "img/sec/core": 189.87299460042627, "core_hours_Tesla V100-SXM2-32GB": 79.05608908613392, "core_hours": 79.05608908613392}
{"step": 52750, "global_schedule": 0.6224149465560913, "l2_grads": 1.5351264476776123, "l2_params": 311.59619140625, "l2_updates": 0.6606695652008057, "training_loss": 2.504053831100464, "uptime": 19621.670514119964, "examples_seen": 54016000.0, "progress": 0.47319177947020463, "epoch": 42.5874459437618, "img/sec/core": 189.808815991019, "core_hours_Tesla V100-SXM2-32GB": 79.13101828343157, "core_hours": 79.13101828343157}
{"step": 52800, "global_schedule": 0.6216644048690796, "l2_grads": 1.661789894104004, "l2_params": 311.4913330078125, "l2_updates": 0.6662428379058838, "training_loss": 2.6499791145324707, "uptime": 19638.541627145954, "examples_seen": 54067200.0, "progress": 0.4736403024839205, "epoch": 42.62781319110186, "img/sec/core": 189.67331883025398, "core_hours_Tesla V100-SXM2-32GB": 79.20600100799153, "core_hours": 79.20600100799153}
{"step": 52850, "global_schedule": 0.6209135055541992, "l2_grads": 1.5234113931655884, "l2_params": 311.3988342285156, "l2_updates": 0.6799126863479614, "training_loss": 2.5678513050079346, "uptime": 19655.426473981992, "examples_seen": 54118400.0, "progress": 0.47408882549763626, "epoch": 42.66818043844192, "img/sec/core": 189.51904219647486, "core_hours_Tesla V100-SXM2-32GB": 79.28104477170726, "core_hours": 79.28104477170726}
{"step": 52900, "global_schedule": 0.6201623678207397, "l2_grads": 1.3612463474273682, "l2_params": 311.3089599609375, "l2_updates": 0.6741781830787659, "training_loss": 2.7208919525146484, "uptime": 19672.28954761097, "examples_seen": 54169600.0, "progress": 0.4745373485113521, "epoch": 42.70854768578198, "img/sec/core": 189.76374476009227, "core_hours_Tesla V100-SXM2-32GB": 79.35599176561382, "core_hours": 79.35599176561382}
{"step": 52950, "global_schedule": 0.6194109916687012, "l2_grads": 1.458008050918579, "l2_params": 311.25225830078125, "l2_updates": 0.6820357441902161, "training_loss": 2.4378256797790527, "uptime": 19689.17992198898, "examples_seen": 54220800.0, "progress": 0.47498587152506794, "epoch": 42.74891493312204, "img/sec/core": 189.45702021656362, "core_hours_Tesla V100-SXM2-32GB": 79.43106009618276, "core_hours": 79.43106009618276}
{"step": 53000, "global_schedule": 0.618659257888794, "l2_grads": 1.3077118396759033, "l2_params": 311.16796875, "l2_updates": 0.6657298803329468, "training_loss": 4.502776145935059, "uptime": 19706.06006124895, "examples_seen": 54272000.0, "progress": 0.4754343945387838, "epoch": 42.789282180462095, "img/sec/core": 189.57189574782842, "core_hours_Tesla V100-SXM2-32GB": 79.50608293733818, "core_hours": 79.50608293733818}
{"step": 53050, "global_schedule": 0.6179072260856628, "l2_grads": 1.6856194734573364, "l2_params": 311.1050720214844, "l2_updates": 0.6536126136779785, "training_loss": 2.450812578201294, "uptime": 19723.456168504956, "examples_seen": 54323200.0, "progress": 0.4758829175524996, "epoch": 42.82964942780215, "img/sec/core": 189.65818393670475, "core_hours_Tesla V100-SXM2-32GB": 79.58107164558696, "core_hours": 79.58107164558696}
{"step": 53100, "global_schedule": 0.6171549558639526, "l2_grads": 1.2737164497375488, "l2_params": 311.0331726074219, "l2_updates": 0.6676105260848999, "training_loss": 4.320574760437012, "uptime": 19740.35326949798, "examples_seen": 54374400.0, "progress": 0.47633144056621546, "epoch": 42.87001667514221, "img/sec/core": 189.38159873229156, "core_hours_Tesla V100-SXM2-32GB": 79.65616987222262, "core_hours": 79.65616987222262}
{"step": 53150, "global_schedule": 0.6164023876190186, "l2_grads": 1.4280650615692139, "l2_params": 310.93310546875, "l2_updates": 0.6610454320907593, "training_loss": 3.0725555419921875, "uptime": 19757.223131879, "examples_seen": 54425600.0, "progress": 0.4767799635799313, "epoch": 42.91038392248227, "img/sec/core": 189.6873802361504, "core_hours_Tesla V100-SXM2-32GB": 79.73114703836049, "core_hours": 79.73114703836049}
{"step": 53200, "global_schedule": 0.6156495809555054, "l2_grads": 1.4783438444137573, "l2_params": 310.8399963378906, "l2_updates": 0.6790086627006531, "training_loss": 2.531996965408325, "uptime": 19774.078301602975, "examples_seen": 54476800.0, "progress": 0.47722848659364714, "epoch": 42.950751169822325, "img/sec/core": 189.8527307884873, "core_hours_Tesla V100-SXM2-32GB": 79.80605890380038, "core_hours": 79.80605890380038}
{"step": 53250, "global_schedule": 0.6148964762687683, "l2_grads": 1.5812355279922485, "l2_params": 310.77349853515625, "l2_updates": 0.6543920636177063, "training_loss": 2.4241089820861816, "uptime": 19790.94558895199, "examples_seen": 54528000.0, "progress": 0.477677009607363, "epoch": 42.99111841716239, "img/sec/core": 189.71633872040755, "core_hours_Tesla V100-SXM2-32GB": 79.88102462535154, "core_hours": 79.88102462535154}
{"step": 53300, "global_schedule": 0.6141430735588074, "l2_grads": 1.5865548849105835, "l2_params": 310.6736145019531, "l2_updates": 0.6539778113365173, "training_loss": 2.4471535682678223, "uptime": 19807.81736907299, "examples_seen": 54579200.0, "progress": 0.47812553262107876, "epoch": 43.03148566450245, "img/sec/core": 189.66581931783986, "core_hours_Tesla V100-SXM2-32GB": 79.95601031477823, "core_hours": 79.95601031477823}
{"step": 53350, "global_schedule": 0.6133893728256226, "l2_grads": 1.4123667478561401, "l2_params": 310.58575439453125, "l2_updates": 0.6522428393363953, "training_loss": 4.81170654296875, "uptime": 19824.699453737005, "examples_seen": 54630400.0, "progress": 0.4785740556347946, "epoch": 43.071852911842505, "img/sec/core": 189.55005046390102, "core_hours_Tesla V100-SXM2-32GB": 80.03104180217385, "core_hours": 80.03104180217385}
{"step": 53400, "global_schedule": 0.6126354932785034, "l2_grads": 1.3293744325637817, "l2_params": 310.503173828125, "l2_updates": 0.6627855896949768, "training_loss": 4.699680805206299, "uptime": 19841.548452257004, "examples_seen": 54681600.0, "progress": 0.47902257864851044, "epoch": 43.11222015918256, "img/sec/core": 189.92226726126546, "core_hours_Tesla V100-SXM2-32GB": 80.10592624004052, "core_hours": 80.10592624004052}
{"step": 53450, "global_schedule": 0.6118813157081604, "l2_grads": 1.4883450269699097, "l2_params": 310.41058349609375, "l2_updates": 0.6421567797660828, "training_loss": 2.9619431495666504, "uptime": 19858.42017161299, "examples_seen": 54732800.0, "progress": 0.4794711016622263, "epoch": 43.15258740652262, "img/sec/core": 189.66650241634434, "core_hours_Tesla V100-SXM2-32GB": 80.18091165940044, "core_hours": 80.18091165940044}
{"step": 53500, "global_schedule": 0.6111268401145935, "l2_grads": 1.3589868545532227, "l2_params": 310.3400573730469, "l2_updates": 0.6578052043914795, "training_loss": 4.823017120361328, "uptime": 19875.286972075002, "examples_seen": 54784000.0, "progress": 0.4799196246759421, "epoch": 43.19295465386268, "img/sec/core": 189.72181518404267, "core_hours_Tesla V100-SXM2-32GB": 80.25587521700939, "core_hours": 80.25587521700939}
{"step": 53550, "global_schedule": 0.6103720664978027, "l2_grads": 1.607551097869873, "l2_params": 310.2621765136719, "l2_updates": 0.6393547058105469, "training_loss": 2.4893996715545654, "uptime": 19892.15944595798, "examples_seen": 54835200.0, "progress": 0.48036814768965796, "epoch": 43.233321901202736, "img/sec/core": 189.65802064323026, "core_hours_Tesla V100-SXM2-32GB": 80.33086398982262, "core_hours": 80.33086398982262}
{"step": 53600, "global_schedule": 0.6096171140670776, "l2_grads": 1.5522626638412476, "l2_params": 310.1694030761719, "l2_updates": 0.6518250703811646, "training_loss": 2.3967809677124023, "uptime": 19909.038273607963, "examples_seen": 54886400.0, "progress": 0.4808166707033738, "epoch": 43.2736891485428, "img/sec/core": 189.58662688893048, "core_hours_Tesla V100-SXM2-32GB": 80.40588100160032, "core_hours": 80.40588100160032}
{"step": 53650, "global_schedule": 0.6088618040084839, "l2_grads": 1.394926905632019, "l2_params": 310.0893859863281, "l2_updates": 0.6558807492256165, "training_loss": 4.005866050720215, "uptime": 19925.89434726996, "examples_seen": 54937600.0, "progress": 0.48126519371708965, "epoch": 43.31405639588286, "img/sec/core": 189.8425495858104, "core_hours_Tesla V100-SXM2-32GB": 80.48079688454254, "core_hours": 80.48079688454254}
{"step": 53700, "global_schedule": 0.608106255531311, "l2_grads": 1.4596134424209595, "l2_params": 310.0195617675781, "l2_updates": 0.6514392495155334, "training_loss": 3.0710980892181396, "uptime": 19942.770788327965, "examples_seen": 54988800.0, "progress": 0.48171371673080543, "epoch": 43.354423643222916, "img/sec/core": 189.61343739486364, "core_hours_Tesla V100-SXM2-32GB": 80.55580328924478, "core_hours": 80.55580328924478}
{"step": 53750, "global_schedule": 0.6073504686355591, "l2_grads": 1.289174199104309, "l2_params": 309.93402099609375, "l2_updates": 0.6654032468795776, "training_loss": 3.2204463481903076, "uptime": 19959.633284713957, "examples_seen": 55040000.0, "progress": 0.48216223974452127, "epoch": 43.39479089056297, "img/sec/core": 189.77024082024244, "core_hours_Tesla V100-SXM2-32GB": 80.63074771762696, "core_hours": 80.63074771762696}
{"step": 53800, "global_schedule": 0.6065943837165833, "l2_grads": 1.5528203248977661, "l2_params": 309.86077880859375, "l2_updates": 0.6480799913406372, "training_loss": 2.6830694675445557, "uptime": 19976.49299998395, "examples_seen": 55091200.0, "progress": 0.4826107627582371, "epoch": 43.43515813790303, "img/sec/core": 189.80154461416143, "core_hours_Tesla V100-SXM2-32GB": 80.70567978549361, "core_hours": 80.70567978549361}
{"step": 53850, "global_schedule": 0.6058381199836731, "l2_grads": 1.533321738243103, "l2_params": 309.7729797363281, "l2_updates": 0.6560184955596924, "training_loss": 2.460861921310425, "uptime": 19993.372530010995, "examples_seen": 55142400.0, "progress": 0.48305928577195295, "epoch": 43.47552538524309, "img/sec/core": 189.57873796682776, "core_hours_Tesla V100-SXM2-32GB": 80.78069991894714, "core_hours": 80.78069991894714}
{"step": 53900, "global_schedule": 0.6050815582275391, "l2_grads": 1.5405992269515991, "l2_params": 309.6857604980469, "l2_updates": 0.6430902481079102, "training_loss": 2.705739974975586, "uptime": 20010.23736068199, "examples_seen": 55193600.0, "progress": 0.4835078087856688, "epoch": 43.515892632583146, "img/sec/core": 189.7439744535105, "core_hours_Tesla V100-SXM2-32GB": 80.85565472192933, "core_hours": 80.85565472192933}
{"step": 53950, "global_schedule": 0.6043247580528259, "l2_grads": 1.4918553829193115, "l2_params": 309.6253662109375, "l2_updates": 0.6584542393684387, "training_loss": 2.65910267829895, "uptime": 20027.107374262996, "examples_seen": 55244800.0, "progress": 0.48395633179938463, "epoch": 43.55625987992321, "img/sec/core": 189.6856801350024, "core_hours_Tesla V100-SXM2-32GB": 80.93063256006714, "core_hours": 80.93063256006714}
{"step": 54000, "global_schedule": 0.6035676598548889, "l2_grads": 1.5207903385162354, "l2_params": 309.5335693359375, "l2_updates": 0.642169713973999, "training_loss": 4.847518444061279, "uptime": 20043.99774212297, "examples_seen": 55296000.0, "progress": 0.48440485481310047, "epoch": 43.59662712726327, "img/sec/core": 189.45709332850672, "core_hours_Tesla V100-SXM2-32GB": 81.00570086166702, "core_hours": 81.00570086166702}
{"step": 54050, "global_schedule": 0.6028103828430176, "l2_grads": 1.599642276763916, "l2_params": 309.4435729980469, "l2_updates": 0.6541128754615784, "training_loss": 2.4914207458496094, "uptime": 20061.343367097958, "examples_seen": 55347200.0, "progress": 0.4848533778268163, "epoch": 43.636994374603326, "img/sec/core": 189.62398891457258, "core_hours_Tesla V100-SXM2-32GB": 81.08070309268027, "core_hours": 81.08070309268027}
{"step": 54100, "global_schedule": 0.6020528078079224, "l2_grads": 1.402303695678711, "l2_params": 309.3826904296875, "l2_updates": 0.6594641208648682, "training_loss": 3.0264999866485596, "uptime": 20078.197024184978, "examples_seen": 55398400.0, "progress": 0.48530190084053215, "epoch": 43.67736162194338, "img/sec/core": 189.86977031023662, "core_hours_Tesla V100-SXM2-32GB": 81.15560823528924, "core_hours": 81.15560823528924}
{"step": 54150, "global_schedule": 0.601294994354248, "l2_grads": 1.440669059753418, "l2_params": 309.2911071777344, "l2_updates": 0.6427627801895142, "training_loss": 4.784171104431152, "uptime": 20095.086249082, "examples_seen": 55449600.0, "progress": 0.48575042385424794, "epoch": 43.71772886928344, "img/sec/core": 189.4699146651883, "core_hours_Tesla V100-SXM2-32GB": 81.23067145705379, "core_hours": 81.23067145705379}
{"step": 54200, "global_schedule": 0.6005370020866394, "l2_grads": 1.2737641334533691, "l2_params": 309.2235412597656, "l2_updates": 0.6453017592430115, "training_loss": 4.7125091552734375, "uptime": 20111.942451487004, "examples_seen": 55500800.0, "progress": 0.4861989468679638, "epoch": 43.7580961166235, "img/sec/core": 189.8410996209905, "core_hours_Tesla V100-SXM2-32GB": 81.30558791218714, "core_hours": 81.30558791218714}
{"step": 54250, "global_schedule": 0.5997787117958069, "l2_grads": 1.5331742763519287, "l2_params": 309.1170654296875, "l2_updates": 0.6442047953605652, "training_loss": 2.4448325634002686, "uptime": 20128.793831901974, "examples_seen": 55552000.0, "progress": 0.4866474698816796, "epoch": 43.798463363963556, "img/sec/core": 189.89542228583912, "core_hours_Tesla V100-SXM2-32GB": 81.38048293625367, "core_hours": 81.38048293625367}
{"step": 54300, "global_schedule": 0.5990201830863953, "l2_grads": 1.3107088804244995, "l2_params": 309.04217529296875, "l2_updates": 0.6481375694274902, "training_loss": 4.831414222717285, "uptime": 20145.681543854997, "examples_seen": 55603200.0, "progress": 0.48709599289539546, "epoch": 43.83883061130362, "img/sec/core": 189.48688898185952, "core_hours_Tesla V100-SXM2-32GB": 81.45553943382265, "core_hours": 81.45553943382265}
{"step": 54350, "global_schedule": 0.5982614159584045, "l2_grads": 1.6136491298675537, "l2_params": 308.95166015625, "l2_updates": 0.6505311131477356, "training_loss": 2.348860263824463, "uptime": 20162.543505058973, "examples_seen": 55654400.0, "progress": 0.4875445159091113, "epoch": 43.87919785864368, "img/sec/core": 189.7762639404809, "core_hours_Tesla V100-SXM2-32GB": 81.5304814836181, "core_hours": 81.5304814836181}
{"step": 54400, "global_schedule": 0.5975024700164795, "l2_grads": 1.5173313617706299, "l2_params": 308.88189697265625, "l2_updates": 0.6448913812637329, "training_loss": 2.4832491874694824, "uptime": 20179.41482854, "examples_seen": 55705600.0, "progress": 0.48799303892282714, "epoch": 43.919565105983736, "img/sec/core": 189.67095282113058, "core_hours_Tesla V100-SXM2-32GB": 81.60546514353379, "core_hours": 81.60546514353379}
{"step": 54450, "global_schedule": 0.5967432260513306, "l2_grads": 1.5347998142242432, "l2_params": 308.7816467285156, "l2_updates": 0.6388142704963684, "training_loss": 2.6195578575134277, "uptime": 20196.271736531984, "examples_seen": 55756800.0, "progress": 0.488441561936543, "epoch": 43.959932353323794, "img/sec/core": 189.83315335895554, "core_hours_Tesla V100-SXM2-32GB": 81.68038473460928, "core_hours": 81.68038473460928}
{"step": 54500, "global_schedule": 0.5959837436676025, "l2_grads": 1.485779881477356, "l2_params": 308.70050048828125, "l2_updates": 0.6380477547645569, "training_loss": 3.015674591064453, "uptime": 20213.126354714972, "examples_seen": 55808000.0, "progress": 0.4888900849502588, "epoch": 44.00029960066385, "img/sec/core": 189.85894342180342, "core_hours_Tesla V100-SXM2-32GB": 81.75529414875588, "core_hours": 81.75529414875588}
{"step": 54550, "global_schedule": 0.5952240824699402, "l2_grads": 1.335871934890747, "l2_params": 308.6226806640625, "l2_updates": 0.6445227861404419, "training_loss": 3.4887843132019043, "uptime": 20230.009194979968, "examples_seen": 55859200.0, "progress": 0.48933860796397466, "epoch": 44.04066684800391, "img/sec/core": 189.54156704513184, "core_hours_Tesla V100-SXM2-32GB": 81.83032899437808, "core_hours": 81.83032899437808}
{"step": 54600, "global_schedule": 0.5944641828536987, "l2_grads": 1.5402790307998657, "l2_params": 308.5417785644531, "l2_updates": 0.6465950608253479, "training_loss": 2.4354238510131836, "uptime": 20246.867947591003, "examples_seen": 55910400.0, "progress": 0.48978713097769044, "epoch": 44.081034095343966, "img/sec/core": 189.812382554651, "core_hours_Tesla V100-SXM2-32GB": 81.90525678376046, "core_hours": 81.90525678376046}
{"step": 54650, "global_schedule": 0.5937040448188782, "l2_grads": 1.48183012008667, "l2_params": 308.4607238769531, "l2_updates": 0.6365882754325867, "training_loss": 3.4760608673095703, "uptime": 20263.747428942996, "examples_seen": 55961600.0, "progress": 0.4902356539914063, "epoch": 44.12140134268403, "img/sec/core": 189.57928465155405, "core_hours_Tesla V100-SXM2-32GB": 81.98027670088044, "core_hours": 81.98027670088044}
{"step": 54700, "global_schedule": 0.5929436683654785, "l2_grads": 1.4096263647079468, "l2_params": 308.38458251953125, "l2_updates": 0.6381645202636719, "training_loss": 4.0685811042785645, "uptime": 20280.622067350952, "examples_seen": 56012800.0, "progress": 0.4906841770051221, "epoch": 44.16176859002409, "img/sec/core": 189.63369303908289, "core_hours_Tesla V100-SXM2-32GB": 82.05527509380468, "core_hours": 82.05527509380468}
{"step": 54750, "global_schedule": 0.5921830534934998, "l2_grads": 1.387670636177063, "l2_params": 308.3145446777344, "l2_updates": 0.6179599165916443, "training_loss": 4.231362819671631, "uptime": 20297.481108184962, "examples_seen": 56064000.0, "progress": 0.49113270001883796, "epoch": 44.202135837364146, "img/sec/core": 189.8091375130107, "core_hours_Tesla V100-SXM2-32GB": 82.13020416417807, "core_hours": 82.13020416417807}
{"step": 54800, "global_schedule": 0.5914222598075867, "l2_grads": 1.519303560256958, "l2_params": 308.23736572265625, "l2_updates": 0.6406162977218628, "training_loss": 2.411902904510498, "uptime": 20314.343556235952, "examples_seen": 56115200.0, "progress": 0.4915812230325538, "epoch": 44.242503084704204, "img/sec/core": 189.77078478306538, "core_hours_Tesla V100-SXM2-32GB": 82.20514837773801, "core_hours": 82.20514837773801}
{"step": 54850, "global_schedule": 0.5906612277030945, "l2_grads": 1.4872325658798218, "l2_params": 308.1541748046875, "l2_updates": 0.6513491272926331, "training_loss": 2.2680983543395996, "uptime": 20331.20084698999, "examples_seen": 56166400.0, "progress": 0.49202974604626964, "epoch": 44.28287033204426, "img/sec/core": 189.82884300276743, "core_hours_Tesla V100-SXM2-32GB": 82.28006966997818, "core_hours": 82.28006966997818}
{"step": 54900, "global_schedule": 0.589900016784668, "l2_grads": 1.4312396049499512, "l2_params": 308.0896301269531, "l2_updates": 0.630346953868866, "training_loss": 4.78377628326416, "uptime": 20348.067745499953, "examples_seen": 56217600.0, "progress": 0.4924782690599855, "epoch": 44.32323757938432, "img/sec/core": 189.72071232357678, "core_hours_Tesla V100-SXM2-32GB": 82.3550336633558, "core_hours": 82.3550336633558}
{"step": 54950, "global_schedule": 0.5891385078430176, "l2_grads": 1.4667531251907349, "l2_params": 308.0141906738281, "l2_updates": 0.6464322805404663, "training_loss": 2.714416265487671, "uptime": 20364.930091733986, "examples_seen": 56268800.0, "progress": 0.4929267920737013, "epoch": 44.36360482672438, "img/sec/core": 189.77193064281374, "core_hours_Tesla V100-SXM2-32GB": 82.42997742439594, "core_hours": 82.42997742439594}
{"step": 55000, "global_schedule": 0.5883768796920776, "l2_grads": 1.464097499847412, "l2_params": 307.9350891113281, "l2_updates": 0.625579833984375, "training_loss": 2.923308849334717, "uptime": 20381.79441174597, "examples_seen": 56320000.0, "progress": 0.4933753150874171, "epoch": 44.40397207406444, "img/sec/core": 189.74971998432324, "core_hours_Tesla V100-SXM2-32GB": 82.50492995778254, "core_hours": 82.50492995778254, "minival/prec@1": 0.6807680299719013, "minival/loss": 1.2976707818170954, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.8843445950187743, "real/prec@1": 0.7265623331981126, "real/loss": 2.115689830159816, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.083077831019182, "train/prec@1": 0.7047184170471842, "train/loss": 1.1845835092563388, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.609667882032227, "v2/prec@1": 0.5183, "v2/loss": 2.129552978515625, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.399155157036148, "val/prec@1": 0.64874, "val/loss": 1.450047119140625, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.242235490994062}
{"step": 55050, "global_schedule": 0.5876149535179138, "l2_grads": 1.5075219869613647, "l2_params": 307.8639831542969, "l2_updates": 0.6261905431747437, "training_loss": 2.7695581912994385, "uptime": 20435.710605259985, "examples_seen": 56371200.0, "progress": 0.49382383810113295, "epoch": 44.4443393214045, "img/sec/core": 189.20221429216716, "core_hours_Tesla V100-SXM2-32GB": 82.58009938576957, "core_hours": 82.58009938576957}
{"step": 55100, "global_schedule": 0.5868528485298157, "l2_grads": 1.5125443935394287, "l2_params": 307.7633361816406, "l2_updates": 0.6306156516075134, "training_loss": 2.747760057449341, "uptime": 20452.582608082972, "examples_seen": 56422400.0, "progress": 0.4942723611148488, "epoch": 44.484706568744556, "img/sec/core": 189.66331582402051, "core_hours_Tesla V100-SXM2-32GB": 82.65508606498285, "core_hours": 82.65508606498285}
{"step": 55150, "global_schedule": 0.5860905647277832, "l2_grads": 1.5057753324508667, "l2_params": 307.6730041503906, "l2_updates": 0.6327486038208008, "training_loss": 4.803770065307617, "uptime": 20469.447612507967, "examples_seen": 56473600.0, "progress": 0.49472088412856463, "epoch": 44.525073816084614, "img/sec/core": 189.74201959042156, "core_hours_Tesla V100-SXM2-32GB": 82.73004164020504, "core_hours": 82.73004164020504}
{"step": 55200, "global_schedule": 0.5853280425071716, "l2_grads": 1.4973716735839844, "l2_params": 307.59271240234375, "l2_updates": 0.6394392251968384, "training_loss": 2.3881306648254395, "uptime": 20486.297140411974, "examples_seen": 56524800.0, "progress": 0.49516940714228047, "epoch": 44.56544106342467, "img/sec/core": 189.91630022102774, "core_hours_Tesla V100-SXM2-32GB": 82.80492843088952, "core_hours": 82.80492843088952}
{"step": 55250, "global_schedule": 0.5845653414726257, "l2_grads": 1.5089737176895142, "l2_params": 307.5203552246094, "l2_updates": 0.6279762983322144, "training_loss": 2.4552063941955566, "uptime": 20503.142334026983, "examples_seen": 56576000.0, "progress": 0.4956179301559963, "epoch": 44.60580831076473, "img/sec/core": 189.96516591824073, "core_hours_Tesla V100-SXM2-32GB": 82.87979595806733, "core_hours": 82.87979595806733}
{"step": 55300, "global_schedule": 0.5838024020195007, "l2_grads": 1.5323634147644043, "l2_params": 307.4302673339844, "l2_updates": 0.6269571185112, "training_loss": 2.698688268661499, "uptime": 20520.029121164, "examples_seen": 56627200.0, "progress": 0.49606645316971215, "epoch": 44.64617555810479, "img/sec/core": 189.49726635598108, "core_hours_Tesla V100-SXM2-32GB": 82.95484834534297, "core_hours": 82.95484834534297}
{"step": 55350, "global_schedule": 0.5830392837524414, "l2_grads": 1.5889183282852173, "l2_params": 307.3468933105469, "l2_updates": 0.6318322420120239, "training_loss": 2.377342700958252, "uptime": 20536.86663590197, "examples_seen": 56678400.0, "progress": 0.496514976183428, "epoch": 44.686542805444844, "img/sec/core": 190.05180098127522, "core_hours_Tesla V100-SXM2-32GB": 83.02968174417839, "core_hours": 83.02968174417839}
{"step": 55400, "global_schedule": 0.5822759866714478, "l2_grads": 1.5277647972106934, "l2_params": 307.2463684082031, "l2_updates": 0.632142186164856, "training_loss": 2.2962512969970703, "uptime": 20553.72842256399, "examples_seen": 56729600.0, "progress": 0.49696349919714383, "epoch": 44.72691005278491, "img/sec/core": 189.77822837766024, "core_hours_Tesla V100-SXM2-32GB": 83.10462301823182, "core_hours": 83.10462301823182}
{"step": 55450, "global_schedule": 0.581512451171875, "l2_grads": 1.5580803155899048, "l2_params": 307.1726989746094, "l2_updates": 0.6343878507614136, "training_loss": 2.4089014530181885, "uptime": 20570.609810698952, "examples_seen": 56780800.0, "progress": 0.4974120222108596, "epoch": 44.76727730012497, "img/sec/core": 189.5578713324186, "core_hours_Tesla V100-SXM2-32GB": 83.17965140994276, "core_hours": 83.17965140994276}
{"step": 55500, "global_schedule": 0.5807487964630127, "l2_grads": 1.4370468854904175, "l2_params": 307.080810546875, "l2_updates": 0.6308496594429016, "training_loss": 4.227753162384033, "uptime": 20587.507276458957, "examples_seen": 56832000.0, "progress": 0.49786054522457546, "epoch": 44.807644547465024, "img/sec/core": 189.3775105361781, "core_hours_Tesla V100-SXM2-32GB": 83.25475125776501, "core_hours": 83.25475125776501}
{"step": 55550, "global_schedule": 0.5799848437309265, "l2_grads": 1.6027625799179077, "l2_params": 306.99945068359375, "l2_updates": 0.6417596936225891, "training_loss": 2.2856717109680176, "uptime": 20604.350213733967, "examples_seen": 56883200.0, "progress": 0.4983090682382913, "epoch": 44.84801179480508, "img/sec/core": 189.99061432994506, "core_hours_Tesla V100-SXM2-32GB": 83.32960875676505, "core_hours": 83.32960875676505}
{"step": 55600, "global_schedule": 0.5792207717895508, "l2_grads": 1.4640874862670898, "l2_params": 306.9261169433594, "l2_updates": 0.622154951095581, "training_loss": 3.3064827919006348, "uptime": 20621.22161340696, "examples_seen": 56934400.0, "progress": 0.49875759125200714, "epoch": 44.88837904214514, "img/sec/core": 189.67009625896193, "core_hours_Tesla V100-SXM2-32GB": 83.4045927553117, "core_hours": 83.4045927553117}
{"step": 55650, "global_schedule": 0.578456461429596, "l2_grads": 1.492611050605774, "l2_params": 306.83746337890625, "l2_updates": 0.627271294593811, "training_loss": 2.4954099655151367, "uptime": 20638.097249885963, "examples_seen": 56985600.0, "progress": 0.499206114265723, "epoch": 44.9287462894852, "img/sec/core": 189.62247758664466, "core_hours_Tesla V100-SXM2-32GB": 83.47959558410726, "core_hours": 83.47959558410726}
{"step": 55700, "global_schedule": 0.5776920318603516, "l2_grads": 1.3493924140930176, "l2_params": 306.7303161621094, "l2_updates": 0.6020630598068237, "training_loss": 4.684353351593018, "uptime": 20654.93614705099, "examples_seen": 57036800.0, "progress": 0.4996546372794388, "epoch": 44.969113536825255, "img/sec/core": 190.03619825210708, "core_hours_Tesla V100-SXM2-32GB": 83.55443512706293, "core_hours": 83.55443512706293}
{"step": 55750, "global_schedule": 0.5769273638725281, "l2_grads": 1.4265562295913696, "l2_params": 306.6421813964844, "l2_updates": 0.6056723594665527, "training_loss": 4.1305928230285645, "uptime": 20671.821863435965, "examples_seen": 57088000.0, "progress": 0.5001031602931546, "epoch": 45.00948078416532, "img/sec/core": 189.5092827004563, "core_hours_Tesla V100-SXM2-32GB": 83.6294827554406, "core_hours": 83.6294827554406}
{"step": 55800, "global_schedule": 0.5761625170707703, "l2_grads": 1.487794280052185, "l2_params": 306.56024169921875, "l2_updates": 0.6190031170845032, "training_loss": 2.915473461151123, "uptime": 20688.662668376986, "examples_seen": 57139200.0, "progress": 0.5005516833068705, "epoch": 45.04984803150538, "img/sec/core": 190.01467039175938, "core_hours_Tesla V100-SXM2-32GB": 83.70433077740068, "core_hours": 83.70433077740068}
{"step": 55850, "global_schedule": 0.5753974914550781, "l2_grads": 1.5957461595535278, "l2_params": 306.47650146484375, "l2_updates": 0.6355955004692078, "training_loss": 2.6539883613586426, "uptime": 20705.53485292598, "examples_seen": 57190400.0, "progress": 0.5010002063205863, "epoch": 45.090215278845434, "img/sec/core": 189.66127300871972, "core_hours_Tesla V100-SXM2-32GB": 83.77931826428511, "core_hours": 83.77931826428511}
{"step": 55900, "global_schedule": 0.5746322870254517, "l2_grads": 1.4378883838653564, "l2_params": 306.39398193359375, "l2_updates": 0.623197615146637, "training_loss": 2.763282537460327, "uptime": 20722.39794289699, "examples_seen": 57241600.0, "progress": 0.5014487293343022, "epoch": 45.13058252618549, "img/sec/core": 189.76356085989934, "core_hours_Tesla V100-SXM2-32GB": 83.85426533082293, "core_hours": 83.85426533082293}
{"step": 55950, "global_schedule": 0.5738669037818909, "l2_grads": 1.4643199443817139, "l2_params": 306.32525634765625, "l2_updates": 0.6228829622268677, "training_loss": 2.7380449771881104, "uptime": 20739.271456582996, "examples_seen": 57292800.0, "progress": 0.501897252348018, "epoch": 45.17094977352555, "img/sec/core": 189.64633327402908, "core_hours_Tesla V100-SXM2-32GB": 83.92925872498294, "core_hours": 83.92925872498294}
{"step": 56000, "global_schedule": 0.5731013417243958, "l2_grads": 1.4853788614273071, "l2_params": 306.24102783203125, "l2_updates": 0.6222028732299805, "training_loss": 3.60536527633667, "uptime": 20756.13248852297, "examples_seen": 57344000.0, "progress": 0.5023457753617339, "epoch": 45.21131702086561, "img/sec/core": 189.78672310165402, "core_hours_Tesla V100-SXM2-32GB": 84.00419664471617, "core_hours": 84.00419664471617}
{"step": 56050, "global_schedule": 0.5723356008529663, "l2_grads": 1.4889158010482788, "l2_params": 306.158203125, "l2_updates": 0.6114161014556885, "training_loss": 2.8340201377868652, "uptime": 20773.497743619955, "examples_seen": 57395200.0, "progress": 0.5027942983754496, "epoch": 45.251684268205665, "img/sec/core": 189.56530977754713, "core_hours_Tesla V100-SXM2-32GB": 84.07922209235167, "core_hours": 84.07922209235167}
{"step": 56100, "global_schedule": 0.5715696811676025, "l2_grads": 1.6062098741531372, "l2_params": 306.06390380859375, "l2_updates": 0.6006911396980286, "training_loss": 2.1875014305114746, "uptime": 20790.38121614995, "examples_seen": 57446400.0, "progress": 0.5032428213891654, "epoch": 45.29205151554573, "img/sec/core": 189.534468949714, "core_hours_Tesla V100-SXM2-32GB": 84.15425974804053, "core_hours": 84.15425974804053}
{"step": 56150, "global_schedule": 0.5708035826683044, "l2_grads": 1.5853612422943115, "l2_params": 305.9612731933594, "l2_updates": 0.623948335647583, "training_loss": 2.6907691955566406, "uptime": 20807.236997446977, "examples_seen": 57497600.0, "progress": 0.5036913444028813, "epoch": 45.33241876288579, "img/sec/core": 189.84584242112993, "core_hours_Tesla V100-SXM2-32GB": 84.22917433158288, "core_hours": 84.22917433158288}
{"step": 56200, "global_schedule": 0.5700373649597168, "l2_grads": 1.4290294647216797, "l2_params": 305.87103271484375, "l2_updates": 0.6082112789154053, "training_loss": 2.681256055831909, "uptime": 20824.121731388965, "examples_seen": 57548800.0, "progress": 0.5041398674165971, "epoch": 45.372786010225845, "img/sec/core": 189.52030935130134, "core_hours_Tesla V100-SXM2-32GB": 84.30421759354726, "core_hours": 84.30421759354726}
{"step": 56250, "global_schedule": 0.56927090883255, "l2_grads": 1.5947185754776, "l2_params": 305.7940673828125, "l2_updates": 0.6129107475280762, "training_loss": 2.3383357524871826, "uptime": 20840.987286749005, "examples_seen": 57600000.0, "progress": 0.504588390430313, "epoch": 45.4131532575659, "img/sec/core": 189.7358214234565, "core_hours_Tesla V100-SXM2-32GB": 84.37917561736967, "core_hours": 84.37917561736967}
{"step": 56300, "global_schedule": 0.5685043334960938, "l2_grads": 1.6514314413070679, "l2_params": 305.70220947265625, "l2_updates": 0.6111034154891968, "training_loss": 2.4410080909729004, "uptime": 20857.832906054973, "examples_seen": 57651200.0, "progress": 0.5050369134440288, "epoch": 45.45352050490596, "img/sec/core": 189.96036547414215, "core_hours_Tesla V100-SXM2-32GB": 84.45404503650731, "core_hours": 84.45404503650731}
{"step": 56350, "global_schedule": 0.5677375793457031, "l2_grads": 1.5639913082122803, "l2_params": 305.61297607421875, "l2_updates": 0.6114895939826965, "training_loss": 2.313746690750122, "uptime": 20874.70915068395, "examples_seen": 57702400.0, "progress": 0.5054854364577447, "epoch": 45.49388775224602, "img/sec/core": 189.6156443777539, "core_hours_Tesla V100-SXM2-32GB": 84.52905056819165, "core_hours": 84.52905056819165}
{"step": 56400, "global_schedule": 0.566970705986023, "l2_grads": 1.5958847999572754, "l2_params": 305.5223388671875, "l2_updates": 0.612392008304596, "training_loss": 2.3502509593963623, "uptime": 20891.55762466695, "examples_seen": 57753600.0, "progress": 0.5059339594714605, "epoch": 45.534254999586075, "img/sec/core": 189.92818003745734, "core_hours_Tesla V100-SXM2-32GB": 84.60393267478277, "core_hours": 84.60393267478277}
{"step": 56450, "global_schedule": 0.5662035942077637, "l2_grads": 1.5181008577346802, "l2_params": 305.447509765625, "l2_updates": 0.6141707301139832, "training_loss": 3.694239616394043, "uptime": 20908.39900359098, "examples_seen": 57804800.0, "progress": 0.5063824824851764, "epoch": 45.57462224692614, "img/sec/core": 190.0081943666866, "core_hours_Tesla V100-SXM2-32GB": 84.67878324777845, "core_hours": 84.67878324777845}
{"step": 56500, "global_schedule": 0.5654363632202148, "l2_grads": 1.5832487344741821, "l2_params": 305.3668212890625, "l2_updates": 0.6157792210578918, "training_loss": 2.3127572536468506, "uptime": 20925.27686981298, "examples_seen": 57856000.0, "progress": 0.5068310054988922, "epoch": 45.6149894942662, "img/sec/core": 189.59742647023666, "core_hours_Tesla V100-SXM2-32GB": 84.75379598654288, "core_hours": 84.75379598654288}
{"step": 56550, "global_schedule": 0.5646690130233765, "l2_grads": 1.3764127492904663, "l2_params": 305.2779846191406, "l2_updates": 0.5971426963806152, "training_loss": 4.655908584594727, "uptime": 20942.11786540196, "examples_seen": 57907200.0, "progress": 0.5072795285126079, "epoch": 45.655356741606255, "img/sec/core": 190.01251933667803, "core_hours_Tesla V100-SXM2-32GB": 84.82864485582725, "core_hours": 84.82864485582725}
{"step": 56600, "global_schedule": 0.563901424407959, "l2_grads": 1.6140801906585693, "l2_params": 305.1798400878906, "l2_updates": 0.616364598274231, "training_loss": 2.422741651535034, "uptime": 20958.98600359395, "examples_seen": 57958400.0, "progress": 0.5077280515263238, "epoch": 45.69572398894631, "img/sec/core": 189.70676926987707, "core_hours_Tesla V100-SXM2-32GB": 84.90361435890276, "core_hours": 84.90361435890276}
{"step": 56650, "global_schedule": 0.5631337761878967, "l2_grads": 1.4827464818954468, "l2_params": 305.1182556152344, "l2_updates": 0.6130415797233582, "training_loss": 2.7415707111358643, "uptime": 20975.863161313988, "examples_seen": 58009600.0, "progress": 0.5081765745400396, "epoch": 45.73609123628637, "img/sec/core": 189.60538575761254, "core_hours_Tesla V100-SXM2-32GB": 84.9786239487696, "core_hours": 84.9786239487696}
{"step": 56700, "global_schedule": 0.5623658895492554, "l2_grads": 1.4248312711715698, "l2_params": 305.02740478515625, "l2_updates": 0.6064403653144836, "training_loss": 3.000354290008545, "uptime": 20992.690745280997, "examples_seen": 58060800.0, "progress": 0.5086250975537555, "epoch": 45.77645848362643, "img/sec/core": 190.16395973858118, "core_hours_Tesla V100-SXM2-32GB": 85.05341321084519, "core_hours": 85.05341321084519}
{"step": 56750, "global_schedule": 0.5615979433059692, "l2_grads": 1.637160301208496, "l2_params": 304.9461364746094, "l2_updates": 0.6107062101364136, "training_loss": 2.380781412124634, "uptime": 21009.584361116984, "examples_seen": 58112000.0, "progress": 0.5090736205674713, "epoch": 45.816825730966485, "img/sec/core": 189.42066820197252, "core_hours_Tesla V100-SXM2-32GB": 85.12849594789401, "core_hours": 85.12849594789401}
{"step": 56800, "global_schedule": 0.560829758644104, "l2_grads": 1.5061181783676147, "l2_params": 304.8584289550781, "l2_updates": 0.6075848937034607, "training_loss": 2.404953956604004, "uptime": 21026.450841791986, "examples_seen": 58163200.0, "progress": 0.5095221435811872, "epoch": 45.85719297830655, "img/sec/core": 189.72541229319629, "core_hours_Tesla V100-SXM2-32GB": 85.20345808422736, "core_hours": 85.20345808422736}
{"step": 56850, "global_schedule": 0.5600614547729492, "l2_grads": 1.3439583778381348, "l2_params": 304.7743225097656, "l2_updates": 0.606910765171051, "training_loss": 2.894188404083252, "uptime": 21043.312264484004, "examples_seen": 58214400.0, "progress": 0.509970666594903, "epoch": 45.89756022564661, "img/sec/core": 189.78232492296303, "core_hours_Tesla V100-SXM2-32GB": 85.27839774063634, "core_hours": 85.27839774063634}
{"step": 56900, "global_schedule": 0.5592930316925049, "l2_grads": 1.5830341577529907, "l2_params": 304.6783142089844, "l2_updates": 0.5948189496994019, "training_loss": 2.454720973968506, "uptime": 21060.183124429954, "examples_seen": 58265600.0, "progress": 0.5104191896086189, "epoch": 45.937927472986665, "img/sec/core": 189.6761641227576, "core_hours_Tesla V100-SXM2-32GB": 85.3533793403961, "core_hours": 85.3533793403961}
{"step": 56950, "global_schedule": 0.558524489402771, "l2_grads": 1.3864398002624512, "l2_params": 304.58197021484375, "l2_updates": 0.6018280982971191, "training_loss": 4.304353713989258, "uptime": 21077.048321851995, "examples_seen": 58316800.0, "progress": 0.5108677126223347, "epoch": 45.97829472032672, "img/sec/core": 189.73984827583024, "core_hours_Tesla V100-SXM2-32GB": 85.42833577338295, "core_hours": 85.42833577338295}
{"step": 57000, "global_schedule": 0.5577557682991028, "l2_grads": 1.4458507299423218, "l2_params": 304.4881591796875, "l2_updates": 0.5958211421966553, "training_loss": 4.379544258117676, "uptime": 21093.90906341799, "examples_seen": 58368000.0, "progress": 0.5113162356360504, "epoch": 46.01866196766678, "img/sec/core": 189.78999158934323, "core_hours_Tesla V100-SXM2-32GB": 85.50327240256516, "core_hours": 85.50327240256516}
{"step": 57050, "global_schedule": 0.556986927986145, "l2_grads": 1.2940278053283691, "l2_params": 304.4224548339844, "l2_updates": 0.6084461212158203, "training_loss": 4.682967185974121, "uptime": 21111.30765828298, "examples_seen": 58419200.0, "progress": 0.5117647586497663, "epoch": 46.05902921500684, "img/sec/core": 189.59924752764232, "core_hours_Tesla V100-SXM2-32GB": 85.57828442084939, "core_hours": 85.57828442084939}
{"step": 57100, "global_schedule": 0.5562179088592529, "l2_grads": 1.4585508108139038, "l2_params": 304.34814453125, "l2_updates": 0.6097527146339417, "training_loss": 2.4970476627349854, "uptime": 21128.17399797798, "examples_seen": 58470400.0, "progress": 0.5122132816634821, "epoch": 46.099396462346895, "img/sec/core": 189.72699814345054, "core_hours_Tesla V100-SXM2-32GB": 85.65324593060495, "core_hours": 85.65324593060495}
{"step": 57150, "global_schedule": 0.5554487705230713, "l2_grads": 1.441231608390808, "l2_params": 304.2701416015625, "l2_updates": 0.5947101712226868, "training_loss": 4.0431437492370605, "uptime": 21145.04784982797, "examples_seen": 58521600.0, "progress": 0.512661804677198, "epoch": 46.13976370968696, "img/sec/core": 189.6425326267261, "core_hours_Tesla V100-SXM2-32GB": 85.72824082771601, "core_hours": 85.72824082771601}
{"step": 57200, "global_schedule": 0.5546795129776001, "l2_grads": 1.6516598463058472, "l2_params": 304.2044372558594, "l2_updates": 0.6019457578659058, "training_loss": 2.3934435844421387, "uptime": 21161.92770434497, "examples_seen": 58572800.0, "progress": 0.5131103276909138, "epoch": 46.18013095702702, "img/sec/core": 189.57509359913917, "core_hours_Tesla V100-SXM2-32GB": 85.80326240334712, "core_hours": 85.80326240334712}
{"step": 57250, "global_schedule": 0.5539101362228394, "l2_grads": 1.5395562648773193, "l2_params": 304.1240539550781, "l2_updates": 0.6065751314163208, "training_loss": 2.4229111671447754, "uptime": 21178.81759245397, "examples_seen": 58624000.0, "progress": 0.5135588507046297, "epoch": 46.220498204367075, "img/sec/core": 189.46247478661667, "core_hours_Tesla V100-SXM2-32GB": 85.87832857272045, "core_hours": 85.87832857272045}
{"step": 57300, "global_schedule": 0.5531406402587891, "l2_grads": 1.5129408836364746, "l2_params": 304.0326232910156, "l2_updates": 0.5889766812324524, "training_loss": 4.806497573852539, "uptime": 21195.68891836499, "examples_seen": 58675200.0, "progress": 0.5140073737183455, "epoch": 46.26086545170713, "img/sec/core": 189.6709255026192, "core_hours_Tesla V100-SXM2-32GB": 85.9533122434361, "core_hours": 85.9533122434361}
{"step": 57350, "global_schedule": 0.5523709654808044, "l2_grads": 1.578624963760376, "l2_params": 303.9429626464844, "l2_updates": 0.6008204221725464, "training_loss": 2.4183850288391113, "uptime": 21212.577993176004, "examples_seen": 58726400.0, "progress": 0.5144558967320613, "epoch": 46.30123269904719, "img/sec/core": 189.4715984035591, "core_hours_Tesla V100-SXM2-32GB": 86.02837479815172, "core_hours": 86.02837479815172}
{"step": 57400, "global_schedule": 0.5516011714935303, "l2_grads": 1.595244288444519, "l2_params": 303.8558349609375, "l2_updates": 0.6052985787391663, "training_loss": 2.218616247177124, "uptime": 21229.46310716099, "examples_seen": 58777600.0, "progress": 0.5149044197457772, "epoch": 46.34159994638725, "img/sec/core": 189.516043708397, "core_hours_Tesla V100-SXM2-32GB": 86.10341974919609, "core_hours": 86.10341974919609}
{"step": 57450, "global_schedule": 0.5508313179016113, "l2_grads": 1.5418593883514404, "l2_params": 303.7725524902344, "l2_updates": 0.5938324928283691, "training_loss": 2.628298759460449, "uptime": 21246.33387969999, "examples_seen": 58828800.0, "progress": 0.515352942759493, "epoch": 46.381967193727306, "img/sec/core": 189.677146829111, "core_hours_Tesla V100-SXM2-32GB": 86.17840096048053, "core_hours": 86.17840096048053}
{"step": 57500, "global_schedule": 0.5500612854957581, "l2_grads": 1.7153023481369019, "l2_params": 303.67730712890625, "l2_updates": 0.5875210165977478, "training_loss": 2.3517370223999023, "uptime": 21263.208138908958, "examples_seen": 58880000.0, "progress": 0.5158014657732088, "epoch": 46.42233444106736, "img/sec/core": 189.63795449456407, "core_hours_Tesla V100-SXM2-32GB": 86.25339766807595, "core_hours": 86.25339766807595, "minival/prec@1": 0.6856072432094911, "minival/loss": 1.3166572697044274, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.912366029981058, "real/prec@1": 0.7277579691269722, "real/loss": 2.129143111286383, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.1346966670244, "train/prec@1": 0.7099090660734496, "train/loss": 1.1976635144651344, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.547186215000693, "v2/prec@1": 0.5296, "v2/loss": 2.0994830078125, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.348380877985619, "val/prec@1": 0.65146, "val/loss": 1.4606420385742187, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.305257503001485}
{"step": 57550, "global_schedule": 0.5492911338806152, "l2_grads": 1.5749220848083496, "l2_params": 303.5915832519531, "l2_updates": 0.6021054983139038, "training_loss": 2.826474905014038, "uptime": 21316.37624524499, "examples_seen": 58931200.0, "progress": 0.5162499887869246, "epoch": 46.46270168840743, "img/sec/core": 189.1452887914713, "core_hours_Tesla V100-SXM2-32GB": 86.32858971918701, "core_hours": 86.32858971918701}
{"step": 57600, "global_schedule": 0.5485209226608276, "l2_grads": 1.631441354751587, "l2_params": 303.5121154785156, "l2_updates": 0.578307032585144, "training_loss": 2.213198184967041, "uptime": 21333.26140131295, "examples_seen": 58982400.0, "progress": 0.5166985118006405, "epoch": 46.503068935747486, "img/sec/core": 189.51557137643644, "core_hours_Tesla V100-SXM2-32GB": 86.40363485726682, "core_hours": 86.40363485726682}
{"step": 57650, "global_schedule": 0.5477505326271057, "l2_grads": 1.3882694244384766, "l2_params": 303.4223937988281, "l2_updates": 0.5934940576553345, "training_loss": 3.830087184906006, "uptime": 21350.141628314974, "examples_seen": 59033600.0, "progress": 0.5171470348143563, "epoch": 46.54343618308754, "img/sec/core": 189.5709103684609, "core_hours_Tesla V100-SXM2-32GB": 86.47865808838694, "core_hours": 86.47865808838694}
{"step": 57700, "global_schedule": 0.5469800233840942, "l2_grads": 1.7708295583724976, "l2_params": 303.3442687988281, "l2_updates": 0.5759347677230835, "training_loss": 2.301316022872925, "uptime": 21367.024406968965, "examples_seen": 59084800.0, "progress": 0.5175955578280722, "epoch": 46.5838034304276, "img/sec/core": 189.54225874681237, "core_hours_Tesla V100-SXM2-32GB": 86.55369266018245, "core_hours": 86.55369266018245}
{"step": 57750, "global_schedule": 0.546209454536438, "l2_grads": 1.4087055921554565, "l2_params": 303.2436828613281, "l2_updates": 0.5778045058250427, "training_loss": 3.8006515502929688, "uptime": 21383.892943368992, "examples_seen": 59136000.0, "progress": 0.518044080841788, "epoch": 46.62417067776766, "img/sec/core": 189.70229094653084, "core_hours_Tesla V100-SXM2-32GB": 86.62866393307146, "core_hours": 86.62866393307146}
{"step": 57800, "global_schedule": 0.5454387068748474, "l2_grads": 1.631637454032898, "l2_params": 303.1522521972656, "l2_updates": 0.5966692566871643, "training_loss": 2.5091772079467773, "uptime": 21400.773817224952, "examples_seen": 59187200.0, "progress": 0.5184926038555038, "epoch": 46.664537925107716, "img/sec/core": 189.5636462486913, "core_hours_Tesla V100-SXM2-32GB": 86.70369003909795, "core_hours": 86.70369003909795}
{"step": 57850, "global_schedule": 0.5446678996086121, "l2_grads": 1.6438874006271362, "l2_params": 303.06903076171875, "l2_updates": 0.5851090550422668, "training_loss": 2.59394907951355, "uptime": 21417.655485331954, "examples_seen": 59238400.0, "progress": 0.5189411268692197, "epoch": 46.70490517244777, "img/sec/core": 189.5547276322018, "core_hours_Tesla V100-SXM2-32GB": 86.77871967512907, "core_hours": 86.77871967512907}
{"step": 57900, "global_schedule": 0.5438969731330872, "l2_grads": 1.3907253742218018, "l2_params": 302.9826965332031, "l2_updates": 0.5893722176551819, "training_loss": 3.5826072692871094, "uptime": 21434.54889643495, "examples_seen": 59289600.0, "progress": 0.5193896498829355, "epoch": 46.74527241978784, "img/sec/core": 189.42296381057923, "core_hours_Tesla V100-SXM2-32GB": 86.85380150225349, "core_hours": 86.85380150225349}
{"step": 57950, "global_schedule": 0.5431259870529175, "l2_grads": 1.5570406913757324, "l2_params": 302.903564453125, "l2_updates": 0.5975256562232971, "training_loss": 2.38059139251709, "uptime": 21451.430922927975, "examples_seen": 59340800.0, "progress": 0.5198381728966514, "epoch": 46.785639667127896, "img/sec/core": 189.5507036031501, "core_hours_Tesla V100-SXM2-32GB": 86.9288327311114, "core_hours": 86.9288327311114}
{"step": 58000, "global_schedule": 0.5423548221588135, "l2_grads": 1.509867548942566, "l2_params": 302.8223571777344, "l2_updates": 0.578299880027771, "training_loss": 4.513884544372559, "uptime": 21468.307426810963, "examples_seen": 59392000.0, "progress": 0.5202866959103671, "epoch": 46.82600691446795, "img/sec/core": 189.61273153414865, "core_hours_Tesla V100-SXM2-32GB": 87.00383941503578, "core_hours": 87.00383941503578}
{"step": 58050, "global_schedule": 0.5415835380554199, "l2_grads": 1.5357557535171509, "l2_params": 302.7278747558594, "l2_updates": 0.5816565155982971, "training_loss": 2.314182996749878, "uptime": 21485.70243476797, "examples_seen": 59443200.0, "progress": 0.520735218924083, "epoch": 46.86637416180801, "img/sec/core": 189.5807862717625, "core_hours_Tesla V100-SXM2-32GB": 87.07885873794245, "core_hours": 87.07885873794245}
{"step": 58100, "global_schedule": 0.5408121943473816, "l2_grads": 1.5988073348999023, "l2_params": 302.6283874511719, "l2_updates": 0.5916268229484558, "training_loss": 2.207132577896118, "uptime": 21502.608992277004, "examples_seen": 59494400.0, "progress": 0.5211837419377988, "epoch": 46.90674140914807, "img/sec/core": 189.27567000495696, "core_hours_Tesla V100-SXM2-32GB": 87.15399899353817, "core_hours": 87.15399899353817}
{"step": 58150, "global_schedule": 0.5400407910346985, "l2_grads": 1.5005040168762207, "l2_params": 302.5556640625, "l2_updates": 0.5882490873336792, "training_loss": 2.6995534896850586, "uptime": 21519.477596477955, "examples_seen": 59545600.0, "progress": 0.5216322649515147, "epoch": 46.947108656488126, "img/sec/core": 189.70152846550965, "core_hours_Tesla V100-SXM2-32GB": 87.22897056776462, "core_hours": 87.22897056776462}
{"step": 58200, "global_schedule": 0.539269208908081, "l2_grads": 1.6364132165908813, "l2_params": 302.4793701171875, "l2_updates": 0.5844878554344177, "training_loss": 2.3694708347320557, "uptime": 21536.34648102295, "examples_seen": 59596800.0, "progress": 0.5220807879652305, "epoch": 46.987475903828184, "img/sec/core": 189.69837581522773, "core_hours_Tesla V100-SXM2-32GB": 87.3039433879646, "core_hours": 87.3039433879646}
{"step": 58250, "global_schedule": 0.5384976267814636, "l2_grads": 1.4525946378707886, "l2_params": 302.3878479003906, "l2_updates": 0.5820039510726929, "training_loss": 2.8355777263641357, "uptime": 21553.21294570499, "examples_seen": 59648000.0, "progress": 0.5225293109789463, "epoch": 47.02784315116825, "img/sec/core": 189.72559219286236, "core_hours_Tesla V100-SXM2-32GB": 87.3789054532181, "core_hours": 87.3789054532181}
{"step": 58300, "global_schedule": 0.5377259254455566, "l2_grads": 1.3744977712631226, "l2_params": 302.3121337890625, "l2_updates": 0.5803694725036621, "training_loss": 4.726423263549805, "uptime": 21570.101017155976, "examples_seen": 59699200.0, "progress": 0.5229778339926622, "epoch": 47.068210398508306, "img/sec/core": 189.48285535664283, "core_hours_Tesla V100-SXM2-32GB": 87.4539635485558, "core_hours": 87.4539635485558}
{"step": 58350, "global_schedule": 0.5369541049003601, "l2_grads": 1.5279302597045898, "l2_params": 302.2317810058594, "l2_updates": 0.5788824558258057, "training_loss": 2.260167360305786, "uptime": 21586.964620382, "examples_seen": 59750400.0, "progress": 0.523426357006378, "epoch": 47.108577645848364, "img/sec/core": 189.75778527933116, "core_hours_Tesla V100-SXM2-32GB": 87.52891289622704, "core_hours": 87.52891289622704}
{"step": 58400, "global_schedule": 0.5361822247505188, "l2_grads": 1.6449931859970093, "l2_params": 302.1537780761719, "l2_updates": 0.584260880947113, "training_loss": 2.404815196990967, "uptime": 21603.84954170999, "examples_seen": 59801600.0, "progress": 0.5238748800200939, "epoch": 47.14894489318842, "img/sec/core": 189.51820608695303, "core_hours_Tesla V100-SXM2-32GB": 87.60395699101811, "core_hours": 87.60395699101811}
{"step": 58450, "global_schedule": 0.5354102253913879, "l2_grads": 1.6251471042633057, "l2_params": 302.07666015625, "l2_updates": 0.5829998850822449, "training_loss": 2.3499858379364014, "uptime": 21620.70481962897, "examples_seen": 59852800.0, "progress": 0.5243234030338096, "epoch": 47.18931214052848, "img/sec/core": 189.8515121128357, "core_hours_Tesla V100-SXM2-32GB": 87.67886933732467, "core_hours": 87.67886933732467}
{"step": 58500, "global_schedule": 0.5346381664276123, "l2_grads": 1.5440071821212769, "l2_params": 301.9802551269531, "l2_updates": 0.5789586901664734, "training_loss": 2.3783602714538574, "uptime": 21637.565614186984, "examples_seen": 59904000.0, "progress": 0.5247719260475255, "epoch": 47.229679387868536, "img/sec/core": 189.78939509578464, "core_hours_Tesla V100-SXM2-32GB": 87.75380620202696, "core_hours": 87.75380620202696}
{"step": 58550, "global_schedule": 0.5338659882545471, "l2_grads": 1.6079596281051636, "l2_params": 301.8911437988281, "l2_updates": 0.5705162882804871, "training_loss": 2.2744107246398926, "uptime": 21654.45200949296, "examples_seen": 59955200.0, "progress": 0.5252204490612413, "epoch": 47.270046635208594, "img/sec/core": 189.50166344070544, "core_hours_Tesla V100-SXM2-32GB": 87.8288568478313, "core_hours": 87.8288568478313}
{"step": 58600, "global_schedule": 0.5330937504768372, "l2_grads": 1.4668998718261719, "l2_params": 301.79095458984375, "l2_updates": 0.5760279297828674, "training_loss": 3.76162052154541, "uptime": 21671.297512875986, "examples_seen": 60006400.0, "progress": 0.5256689720749572, "epoch": 47.31041388254866, "img/sec/core": 189.961672693295, "core_hours_Tesla V100-SXM2-32GB": 87.90372575175587, "core_hours": 87.90372575175587}
{"step": 58650, "global_schedule": 0.5323214530944824, "l2_grads": 1.5176856517791748, "l2_params": 301.68377685546875, "l2_updates": 0.5608223080635071, "training_loss": 4.689838409423828, "uptime": 21688.187718776986, "examples_seen": 60057600.0, "progress": 0.526117495088673, "epoch": 47.350781129888716, "img/sec/core": 189.45891001900662, "core_hours_Tesla V100-SXM2-32GB": 87.97879333353808, "core_hours": 87.97879333353808}
{"step": 58700, "global_schedule": 0.5315490961074829, "l2_grads": 1.585952639579773, "l2_params": 301.5862731933594, "l2_updates": 0.5582394003868103, "training_loss": 4.749842166900635, "uptime": 21705.06268444797, "examples_seen": 60108800.0, "progress": 0.5265660181023888, "epoch": 47.391148377228774, "img/sec/core": 189.63001539625407, "core_hours_Tesla V100-SXM2-32GB": 88.05379318096468, "core_hours": 88.05379318096468}
{"step": 58750, "global_schedule": 0.5307766199111938, "l2_grads": 1.5205588340759277, "l2_params": 301.4947509765625, "l2_updates": 0.5603581666946411, "training_loss": 4.618302822113037, "uptime": 21721.938586187956, "examples_seen": 60160000.0, "progress": 0.5270145411161047, "epoch": 47.43151562456883, "img/sec/core": 189.6194970380662, "core_hours_Tesla V100-SXM2-32GB": 88.12879718869794, "core_hours": 88.12879718869794}
{"step": 58800, "global_schedule": 0.53000408411026, "l2_grads": 1.752030849456787, "l2_params": 301.4221496582031, "l2_updates": 0.5806198716163635, "training_loss": 2.339531898498535, "uptime": 21738.788937153004, "examples_seen": 60211200.0, "progress": 0.5274630641298205, "epoch": 47.47188287190889, "img/sec/core": 189.90702369569462, "core_hours_Tesla V100-SXM2-32GB": 88.2036876374315, "core_hours": 88.2036876374315}
{"step": 58850, "global_schedule": 0.5292314887046814, "l2_grads": 1.5946688652038574, "l2_params": 301.3324279785156, "l2_updates": 0.5747492909431458, "training_loss": 2.3517568111419678, "uptime": 21755.66088970995, "examples_seen": 60262400.0, "progress": 0.5279115871435364, "epoch": 47.51225011924895, "img/sec/core": 189.66388088155492, "core_hours_Tesla V100-SXM2-32GB": 88.27867409324016, "core_hours": 88.27867409324016}
{"step": 58900, "global_schedule": 0.5284587740898132, "l2_grads": 1.4284406900405884, "l2_params": 301.2476501464844, "l2_updates": 0.5688567757606506, "training_loss": 3.970306396484375, "uptime": 21772.532736431982, "examples_seen": 60313600.0, "progress": 0.5283601101572521, "epoch": 47.552617366589004, "img/sec/core": 189.66507061858252, "core_hours_Tesla V100-SXM2-32GB": 88.35366007867141, "core_hours": 88.35366007867141}
{"step": 58950, "global_schedule": 0.5276860594749451, "l2_grads": 1.4640581607818604, "l2_params": 301.1565246582031, "l2_updates": 0.5672692060470581, "training_loss": 4.1217570304870605, "uptime": 21789.395754902973, "examples_seen": 60364800.0, "progress": 0.528808633170968, "epoch": 47.59298461392907, "img/sec/core": 189.76436546665036, "core_hours_Tesla V100-SXM2-32GB": 88.42860682743137, "core_hours": 88.42860682743137}
{"step": 59000, "global_schedule": 0.5269132256507874, "l2_grads": 1.4471038579940796, "l2_params": 301.0590515136719, "l2_updates": 0.5721775889396667, "training_loss": 4.305671215057373, "uptime": 21806.280675749993, "examples_seen": 60416000.0, "progress": 0.5292571561846838, "epoch": 47.63335186126913, "img/sec/core": 189.51821148541202, "core_hours_Tesla V100-SXM2-32GB": 88.50365092008478, "core_hours": 88.50365092008478}
{"step": 59050, "global_schedule": 0.5261403918266296, "l2_grads": 1.6514980792999268, "l2_params": 300.96258544921875, "l2_updates": 0.5624080300331116, "training_loss": 2.5257396697998047, "uptime": 21823.94427128695, "examples_seen": 60467200.0, "progress": 0.5297056791983996, "epoch": 47.673719108609184, "img/sec/core": 189.89293501641492, "core_hours_Tesla V100-SXM2-32GB": 88.57854692514675, "core_hours": 88.57854692514675}
{"step": 59100, "global_schedule": 0.5253674387931824, "l2_grads": 1.7015937566757202, "l2_params": 300.872314453125, "l2_updates": 0.5641830563545227, "training_loss": 2.2106974124908447, "uptime": 21840.812238438986, "examples_seen": 60518400.0, "progress": 0.5301542022121155, "epoch": 47.71408635594924, "img/sec/core": 189.70869288262844, "core_hours_Tesla V100-SXM2-32GB": 88.6535156680447, "core_hours": 88.6535156680447}
{"step": 59150, "global_schedule": 0.5245944857597351, "l2_grads": 1.4904602766036987, "l2_params": 300.7949523925781, "l2_updates": 0.5730878114700317, "training_loss": 2.5355541706085205, "uptime": 21857.680406528, "examples_seen": 60569600.0, "progress": 0.5306027252258313, "epoch": 47.7544536032893, "img/sec/core": 189.70643303489106, "core_hours_Tesla V100-SXM2-32GB": 88.72848530399588, "core_hours": 88.72848530399588}
{"step": 59200, "global_schedule": 0.5238214135169983, "l2_grads": 1.5845082998275757, "l2_params": 300.7092590332031, "l2_updates": 0.5637711882591248, "training_loss": 3.1175894737243652, "uptime": 21874.53467044595, "examples_seen": 60620800.0, "progress": 0.5310512482395472, "epoch": 47.79482085062936, "img/sec/core": 189.86293412623468, "core_hours_Tesla V100-SXM2-32GB": 88.80339314363121, "core_hours": 88.80339314363121}
{"step": 59250, "global_schedule": 0.5230483412742615, "l2_grads": 1.5746442079544067, "l2_params": 300.6200866699219, "l2_updates": 0.5630395412445068, "training_loss": 2.3097984790802, "uptime": 21891.411297349958, "examples_seen": 60672000.0, "progress": 0.531499771253263, "epoch": 47.835188097969414, "img/sec/core": 189.611349365103, "core_hours_Tesla V100-SXM2-32GB": 88.87840037431569, "core_hours": 88.87840037431569}
{"step": 59300, "global_schedule": 0.5222751498222351, "l2_grads": 1.633867859840393, "l2_params": 300.5411071777344, "l2_updates": 0.5651152729988098, "training_loss": 2.184403419494629, "uptime": 21908.279884018004, "examples_seen": 60723200.0, "progress": 0.5319482942669789, "epoch": 47.87555534530948, "img/sec/core": 189.70172563785042, "core_hours_Tesla V100-SXM2-32GB": 88.95337187061811, "core_hours": 88.95337187061811}
{"step": 59350, "global_schedule": 0.521501898765564, "l2_grads": 1.6739801168441772, "l2_params": 300.4422912597656, "l2_updates": 0.5621345043182373, "training_loss": 2.3884072303771973, "uptime": 21925.11988352897, "examples_seen": 60774400.0, "progress": 0.5323968172806947, "epoch": 47.91592259264954, "img/sec/core": 190.02375848742864, "core_hours_Tesla V100-SXM2-32GB": 89.02821631288906, "core_hours": 89.02821631288906}
{"step": 59400, "global_schedule": 0.5207286477088928, "l2_grads": 1.4626154899597168, "l2_params": 300.3567199707031, "l2_updates": 0.5594987273216248, "training_loss": 3.33747935295105, "uptime": 21941.993111790973, "examples_seen": 60825600.0, "progress": 0.5328453402944106, "epoch": 47.956289839989594, "img/sec/core": 189.64954129174725, "core_hours_Tesla V100-SXM2-32GB": 89.10320843849796, "core_hours": 89.10320843849796}
{"step": 59450, "global_schedule": 0.5199553370475769, "l2_grads": 1.6284043788909912, "l2_params": 300.2703552246094, "l2_updates": 0.56600421667099, "training_loss": 2.4884204864501953, "uptime": 21958.871875251003, "examples_seen": 60876800.0, "progress": 0.5332938633081263, "epoch": 47.99665708732965, "img/sec/core": 189.5873478870503, "core_hours_Tesla V100-SXM2-32GB": 89.178225164987, "core_hours": 89.178225164987}
{"step": 59500, "global_schedule": 0.5191819667816162, "l2_grads": 1.7111068964004517, "l2_params": 300.1968688964844, "l2_updates": 0.5683639645576477, "training_loss": 2.229971408843994, "uptime": 21975.740782848967, "examples_seen": 60928000.0, "progress": 0.5337423863218421, "epoch": 48.03702433466971, "img/sec/core": 189.69811657432297, "core_hours_Tesla V100-SXM2-32GB": 89.25319808764462, "core_hours": 89.25319808764462}
{"step": 59550, "global_schedule": 0.5184085369110107, "l2_grads": 1.6029577255249023, "l2_params": 300.0926208496094, "l2_updates": 0.5636590123176575, "training_loss": 4.847917079925537, "uptime": 21992.619270930998, "examples_seen": 60979200.0, "progress": 0.534190909335558, "epoch": 48.07739158200977, "img/sec/core": 189.59044106602786, "core_hours_Tesla V100-SXM2-32GB": 89.32821359023141, "core_hours": 89.32821359023141}
{"step": 59600, "global_schedule": 0.5176350474357605, "l2_grads": 1.6572301387786865, "l2_params": 300.0117492675781, "l2_updates": 0.5479713082313538, "training_loss": 2.243572950363159, "uptime": 22009.48968693998, "examples_seen": 61030400.0, "progress": 0.5346394323492738, "epoch": 48.117758829349825, "img/sec/core": 189.68115536071866, "core_hours_Tesla V100-SXM2-32GB": 89.403193216938, "core_hours": 89.403193216938}
{"step": 59650, "global_schedule": 0.5168615579605103, "l2_grads": 1.6338722705841064, "l2_params": 299.9271545410156, "l2_updates": 0.5564932227134705, "training_loss": 2.254453182220459, "uptime": 22026.33093687496, "examples_seen": 61081600.0, "progress": 0.5350879553629897, "epoch": 48.15812607668988, "img/sec/core": 190.0096496610692, "core_hours_Tesla V100-SXM2-32GB": 89.47804321664903, "core_hours": 89.47804321664903}
{"step": 59700, "global_schedule": 0.5160880088806152, "l2_grads": 1.7101986408233643, "l2_params": 299.8310241699219, "l2_updates": 0.5592057704925537, "training_loss": 2.2369704246520996, "uptime": 22043.189744127973, "examples_seen": 61132800.0, "progress": 0.5355364783767055, "epoch": 48.19849332402995, "img/sec/core": 189.81176734365178, "core_hours_Tesla V100-SXM2-32GB": 89.55297124888463, "core_hours": 89.55297124888463}
{"step": 59750, "global_schedule": 0.5153144001960754, "l2_grads": 1.480621099472046, "l2_params": 299.7582702636719, "l2_updates": 0.563949704170227, "training_loss": 3.242694854736328, "uptime": 22060.055426742998, "examples_seen": 61184000.0, "progress": 0.5359850013904214, "epoch": 48.238860571370004, "img/sec/core": 189.73438982832266, "core_hours_Tesla V100-SXM2-32GB": 89.62792983828474, "core_hours": 89.62792983828474}
{"step": 59800, "global_schedule": 0.5145407915115356, "l2_grads": 1.621728777885437, "l2_params": 299.6694641113281, "l2_updates": 0.5620017051696777, "training_loss": 2.1932718753814697, "uptime": 22076.89807522198, "examples_seen": 61235200.0, "progress": 0.5364335244041372, "epoch": 48.27922781871006, "img/sec/core": 189.9938720441368, "core_hours_Tesla V100-SXM2-32GB": 89.70278605374689, "core_hours": 89.70278605374689}
{"step": 59850, "global_schedule": 0.5137671232223511, "l2_grads": 1.4015341997146606, "l2_params": 299.5744934082031, "l2_updates": 0.5526585578918457, "training_loss": 3.6064579486846924, "uptime": 22093.773661134997, "examples_seen": 61286400.0, "progress": 0.5368820474178531, "epoch": 48.31959506605012, "img/sec/core": 189.6230457711998, "core_hours_Tesla V100-SXM2-32GB": 89.77778865780473, "core_hours": 89.77778865780473}
{"step": 59900, "global_schedule": 0.5129934549331665, "l2_grads": 1.3953688144683838, "l2_params": 299.4986267089844, "l2_updates": 0.5566349029541016, "training_loss": 3.8453593254089355, "uptime": 22110.634048611973, "examples_seen": 61337600.0, "progress": 0.5373305704315688, "epoch": 48.35996231339018, "img/sec/core": 189.79397741420894, "core_hours_Tesla V100-SXM2-32GB": 89.85272371325797, "core_hours": 89.85272371325797}
{"step": 59950, "global_schedule": 0.5122197270393372, "l2_grads": 1.666443109512329, "l2_params": 299.420654296875, "l2_updates": 0.5639898777008057, "training_loss": 2.33034086227417, "uptime": 22127.479076890973, "examples_seen": 61388800.0, "progress": 0.5377790934452846, "epoch": 48.400329560730235, "img/sec/core": 189.9670304495312, "core_hours_Tesla V100-SXM2-32GB": 89.92759050560907, "core_hours": 89.92759050560907}
{"step": 60000, "global_schedule": 0.5114459991455078, "l2_grads": 1.6405391693115234, "l2_params": 299.3470458984375, "l2_updates": 0.5534558296203613, "training_loss": 2.2857508659362793, "uptime": 22144.358356132987, "examples_seen": 61440000.0, "progress": 0.5382276164590005, "epoch": 48.44069680807029, "img/sec/core": 189.5815546457102, "core_hours_Tesla V100-SXM2-32GB": 90.00260952446247, "core_hours": 90.00260952446247, "minival/prec@1": 0.6952076178582579, "minival/loss": 1.2567232139699354, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.877439920033794, "real/prec@1": 0.7369814462924611, "real/loss": 2.0794097081367293, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.149004417005926, "train/prec@1": 0.722788120048394, "train/loss": 1.1220182295180183, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.601436612952966, "v2/prec@1": 0.5403, "v2/loss": 2.0606457397460938, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3453118169563822, "val/prec@1": 0.66166, "val/loss": 1.4035690112304688, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.314909086970147}
{"step": 60050, "global_schedule": 0.5106722116470337, "l2_grads": 1.6414984464645386, "l2_params": 299.25823974609375, "l2_updates": 0.556515097618103, "training_loss": 2.302733898162842, "uptime": 22198.08185161295, "examples_seen": 61491200.0, "progress": 0.5386761394727163, "epoch": 48.48106405541036, "img/sec/core": 189.04011292800934, "core_hours_Tesla V100-SXM2-32GB": 90.0778434100222, "core_hours": 90.0778434100222}
{"step": 60100, "global_schedule": 0.5098984241485596, "l2_grads": 1.6516692638397217, "l2_params": 299.18377685546875, "l2_updates": 0.5571080446243286, "training_loss": 2.428730010986328, "uptime": 22214.943355428986, "examples_seen": 61542400.0, "progress": 0.5391246624864322, "epoch": 48.521431302750415, "img/sec/core": 189.78141184280574, "core_hours_Tesla V100-SXM2-32GB": 90.15278342698235, "core_hours": 90.15278342698235}
{"step": 60150, "global_schedule": 0.5091245770454407, "l2_grads": 1.5558311939239502, "l2_params": 299.0953063964844, "l2_updates": 0.5477028489112854, "training_loss": 2.406132221221924, "uptime": 22231.82482299197, "examples_seen": 61593600.0, "progress": 0.539573185500148, "epoch": 48.56179855009047, "img/sec/core": 189.55697945459966, "core_hours_Tesla V100-SXM2-32GB": 90.22781217170673, "core_hours": 90.22781217170673}
{"step": 60200, "global_schedule": 0.508350670337677, "l2_grads": 1.652297019958496, "l2_params": 299.0014953613281, "l2_updates": 0.548511803150177, "training_loss": 2.3226466178894043, "uptime": 22248.703112079995, "examples_seen": 61644800.0, "progress": 0.5400217085138639, "epoch": 48.60216579743053, "img/sec/core": 189.59267632584977, "core_hours_Tesla V100-SXM2-32GB": 90.30282678987572, "core_hours": 90.30282678987572}
{"step": 60250, "global_schedule": 0.5075768232345581, "l2_grads": 1.5165354013442993, "l2_params": 298.9124450683594, "l2_updates": 0.5406985878944397, "training_loss": 3.147496461868286, "uptime": 22265.54988486896, "examples_seen": 61696000.0, "progress": 0.5404702315275797, "epoch": 48.64253304477059, "img/sec/core": 189.94735906309327, "core_hours_Tesla V100-SXM2-32GB": 90.37770133560447, "core_hours": 90.37770133560447}
{"step": 60300, "global_schedule": 0.5068029165267944, "l2_grads": 1.669579267501831, "l2_params": 298.822509765625, "l2_updates": 0.5455359220504761, "training_loss": 2.3488802909851074, "uptime": 22282.435758220963, "examples_seen": 61747200.0, "progress": 0.5409187545412956, "epoch": 48.682900292110645, "img/sec/core": 189.50752106762965, "core_hours_Tesla V100-SXM2-32GB": 90.45274966161335, "core_hours": 90.45274966161335}
{"step": 60350, "global_schedule": 0.5060290098190308, "l2_grads": 1.6396617889404297, "l2_params": 298.73675537109375, "l2_updates": 0.5401087999343872, "training_loss": 4.796647071838379, "uptime": 22299.29647504096, "examples_seen": 61798400.0, "progress": 0.5413672775550114, "epoch": 48.7232675394507, "img/sec/core": 189.79027013874943, "core_hours_Tesla V100-SXM2-32GB": 90.52768618081335, "core_hours": 90.52768618081335}
{"step": 60400, "global_schedule": 0.5052551031112671, "l2_grads": 1.470625877380371, "l2_params": 298.64068603515625, "l2_updates": 0.5501924753189087, "training_loss": 4.095247268676758, "uptime": 22316.161608062976, "examples_seen": 61849600.0, "progress": 0.5418158005687271, "epoch": 48.76363478679077, "img/sec/core": 189.7405728032266, "core_hours_Tesla V100-SXM2-32GB": 90.60264232757785, "core_hours": 90.60264232757785}
{"step": 60450, "global_schedule": 0.5044811964035034, "l2_grads": 1.6055614948272705, "l2_params": 298.5499572753906, "l2_updates": 0.5581844449043274, "training_loss": 2.339430093765259, "uptime": 22333.034070555994, "examples_seen": 61900800.0, "progress": 0.542264323582443, "epoch": 48.804002034130825, "img/sec/core": 189.65814867415745, "core_hours_Tesla V100-SXM2-32GB": 90.67763104976906, "core_hours": 90.67763104976906}
{"step": 60500, "global_schedule": 0.503707230091095, "l2_grads": 1.4109585285186768, "l2_params": 298.4626159667969, "l2_updates": 0.5445730686187744, "training_loss": 3.277602195739746, "uptime": 22349.90600158798, "examples_seen": 61952000.0, "progress": 0.5427128465961588, "epoch": 48.84436928147088, "img/sec/core": 189.66412285193013, "core_hours_Tesla V100-SXM2-32GB": 90.75261740991121, "core_hours": 90.75261740991121}
{"step": 60550, "global_schedule": 0.5029332637786865, "l2_grads": 1.63065767288208, "l2_params": 298.36767578125, "l2_updates": 0.5336358547210693, "training_loss": 2.479321002960205, "uptime": 22366.765188763966, "examples_seen": 62003200.0, "progress": 0.5431613696098747, "epoch": 48.88473652881094, "img/sec/core": 189.80748992206136, "core_hours_Tesla V100-SXM2-32GB": 90.82754713069338, "core_hours": 90.82754713069338}
{"step": 60600, "global_schedule": 0.5021593570709229, "l2_grads": 1.6017295122146606, "l2_params": 298.28155517578125, "l2_updates": 0.5495850443840027, "training_loss": 2.33042573928833, "uptime": 22383.619427661004, "examples_seen": 62054400.0, "progress": 0.5436098926235905, "epoch": 48.925103776151, "img/sec/core": 189.8632159867121, "core_hours_Tesla V100-SXM2-32GB": 90.90245485912465, "core_hours": 90.90245485912465}
{"step": 60650, "global_schedule": 0.5013853907585144, "l2_grads": 1.4717057943344116, "l2_params": 298.18621826171875, "l2_updates": 0.5330904722213745, "training_loss": 4.4418158531188965, "uptime": 22400.485177546972, "examples_seen": 62105600.0, "progress": 0.5440584156373064, "epoch": 48.965471023491055, "img/sec/core": 189.73363305133955, "core_hours_Tesla V100-SXM2-32GB": 90.97741374750673, "core_hours": 90.97741374750673}
{"step": 60700, "global_schedule": 0.500611424446106, "l2_grads": 1.6080905199050903, "l2_params": 298.09771728515625, "l2_updates": 0.5435307025909424, "training_loss": 2.212716817855835, "uptime": 22417.35299146996, "examples_seen": 62156800.0, "progress": 0.5445069386510222, "epoch": 49.00583827083111, "img/sec/core": 189.71041621693496, "core_hours_Tesla V100-SXM2-32GB": 91.05238180938667, "core_hours": 91.05238180938667}
{"step": 60750, "global_schedule": 0.4998374283313751, "l2_grads": 1.5127513408660889, "l2_params": 298.0050354003906, "l2_updates": 0.5332714319229126, "training_loss": 4.543831825256348, "uptime": 22434.235981591977, "examples_seen": 62208000.0, "progress": 0.5449554616647381, "epoch": 49.04620551817118, "img/sec/core": 189.53988463376993, "core_hours_Tesla V100-SXM2-32GB": 91.1274173210401, "core_hours": 91.1274173210401}
{"step": 60800, "global_schedule": 0.49906352162361145, "l2_grads": 1.7397024631500244, "l2_params": 297.9232482910156, "l2_updates": 0.5366344451904297, "training_loss": 3.962902307510376, "uptime": 22451.101248049003, "examples_seen": 62259200.0, "progress": 0.5454039846784539, "epoch": 49.086572765511235, "img/sec/core": 189.73907160933126, "core_hours_Tesla V100-SXM2-32GB": 91.20237406084908, "core_hours": 91.20237406084908}
{"step": 60850, "global_schedule": 0.4982894957065582, "l2_grads": 1.6353622674942017, "l2_params": 297.81298828125, "l2_updates": 0.5410531759262085, "training_loss": 2.453279495239258, "uptime": 22467.973379540956, "examples_seen": 62310400.0, "progress": 0.5458525076921696, "epoch": 49.12694001285129, "img/sec/core": 189.66186942806848, "core_hours_Tesla V100-SXM2-32GB": 91.27736131192442, "core_hours": 91.27736131192442}
{"step": 60900, "global_schedule": 0.49751561880111694, "l2_grads": 1.6578869819641113, "l2_params": 297.7345275878906, "l2_updates": 0.5445851683616638, "training_loss": 2.3430304527282715, "uptime": 22484.844294447976, "examples_seen": 62361600.0, "progress": 0.5463010307058855, "epoch": 49.16730726019135, "img/sec/core": 189.6755462069498, "core_hours_Tesla V100-SXM2-32GB": 91.35234315595564, "core_hours": 91.35234315595564}
{"step": 60950, "global_schedule": 0.4967415928840637, "l2_grads": 1.6488317251205444, "l2_params": 297.6480712890625, "l2_updates": 0.530074417591095, "training_loss": 2.5867197513580322, "uptime": 22501.722010875004, "examples_seen": 62412800.0, "progress": 0.5467495537196013, "epoch": 49.20767450753141, "img/sec/core": 189.59910920623082, "core_hours_Tesla V100-SXM2-32GB": 91.42735522896466, "core_hours": 91.42735522896466}
{"step": 61000, "global_schedule": 0.49596771597862244, "l2_grads": 1.398563265800476, "l2_params": 297.5533447265625, "l2_updates": 0.5332615375518799, "training_loss": 3.6472630500793457, "uptime": 22518.597260659968, "examples_seen": 62464000.0, "progress": 0.5471980767333172, "epoch": 49.248041754871466, "img/sec/core": 189.62682275976096, "core_hours_Tesla V100-SXM2-32GB": 91.50235633912006, "core_hours": 91.50235633912006}
{"step": 61050, "global_schedule": 0.4951937198638916, "l2_grads": 1.5180058479309082, "l2_params": 297.4787902832031, "l2_updates": 0.5345906019210815, "training_loss": 4.710230350494385, "uptime": 22535.988567088963, "examples_seen": 62515200.0, "progress": 0.547646599747033, "epoch": 49.28840900221152, "img/sec/core": 189.70176641651386, "core_hours_Tesla V100-SXM2-32GB": 91.57732781930646, "core_hours": 91.57732781930646}
{"step": 61100, "global_schedule": 0.4944198429584503, "l2_grads": 1.5670887231826782, "l2_params": 297.3999328613281, "l2_updates": 0.5311426520347595, "training_loss": 2.5268054008483887, "uptime": 22552.856672419002, "examples_seen": 62566400.0, "progress": 0.5480951227607489, "epoch": 49.32877624955159, "img/sec/core": 189.70713885106125, "core_hours_Tesla V100-SXM2-32GB": 91.65229717632884, "core_hours": 91.65229717632884}
{"step": 61150, "global_schedule": 0.49364587664604187, "l2_grads": 1.6279213428497314, "l2_params": 297.31646728515625, "l2_updates": 0.5346667170524597, "training_loss": 2.552338123321533, "uptime": 22569.715664903983, "examples_seen": 62617600.0, "progress": 0.5485436457744647, "epoch": 49.369143496891645, "img/sec/core": 189.80968185678304, "core_hours_Tesla V100-SXM2-32GB": 91.72722603181765, "core_hours": 91.72722603181765}
{"step": 61200, "global_schedule": 0.492872029542923, "l2_grads": 1.4130064249038696, "l2_params": 297.2328186035156, "l2_updates": 0.5380489826202393, "training_loss": 4.032074451446533, "uptime": 22586.58837456, "examples_seen": 62668800.0, "progress": 0.5489921687881805, "epoch": 49.4095107442317, "img/sec/core": 189.65537043178395, "core_hours_Tesla V100-SXM2-32GB": 91.80221585251107, "core_hours": 91.80221585251107}
{"step": 61250, "global_schedule": 0.4920980930328369, "l2_grads": 1.5893720388412476, "l2_params": 297.1439514160156, "l2_updates": 0.5330819487571716, "training_loss": 2.8454537391662598, "uptime": 22603.442548978957, "examples_seen": 62720000.0, "progress": 0.5494406918018964, "epoch": 49.44987799157176, "img/sec/core": 189.86394233589718, "core_hours_Tesla V100-SXM2-32GB": 91.8771232943731, "core_hours": 91.8771232943731}
{"step": 61300, "global_schedule": 0.49132418632507324, "l2_grads": 1.5541833639144897, "l2_params": 297.0569152832031, "l2_updates": 0.5382959842681885, "training_loss": 2.515303134918213, "uptime": 22620.323940416973, "examples_seen": 62771200.0, "progress": 0.5498892148156121, "epoch": 49.49024523891182, "img/sec/core": 189.55783424308896, "core_hours_Tesla V100-SXM2-32GB": 91.95215170076428, "core_hours": 91.95215170076428}
{"step": 61350, "global_schedule": 0.4905503988265991, "l2_grads": 1.6339362859725952, "l2_params": 296.9804382324219, "l2_updates": 0.5390374064445496, "training_loss": 2.4017086029052734, "uptime": 22637.206858432968, "examples_seen": 62822400.0, "progress": 0.550337737829328, "epoch": 49.530612486251876, "img/sec/core": 189.54069414826256, "core_hours_Tesla V100-SXM2-32GB": 92.02718689194647, "core_hours": 92.02718689194647}
{"step": 61400, "global_schedule": 0.48977652192115784, "l2_grads": 1.7291181087493896, "l2_params": 296.8941345214844, "l2_updates": 0.5321174263954163, "training_loss": 2.23980450630188, "uptime": 22654.054539378965, "examples_seen": 62873600.0, "progress": 0.5507862608430438, "epoch": 49.57097973359193, "img/sec/core": 189.93712014473388, "core_hours_Tesla V100-SXM2-32GB": 92.10206547392868, "core_hours": 92.10206547392868}
{"step": 61450, "global_schedule": 0.4890027940273285, "l2_grads": 1.664229154586792, "l2_params": 296.80035400390625, "l2_updates": 0.5297836065292358, "training_loss": 2.297335624694824, "uptime": 22670.934406140994, "examples_seen": 62924800.0, "progress": 0.5512347838567597, "epoch": 49.611346980932, "img/sec/core": 189.57495607716749, "core_hours_Tesla V100-SXM2-32GB": 92.17708710398215, "core_hours": 92.17708710398215}
{"step": 61500, "global_schedule": 0.488228976726532, "l2_grads": 1.7604936361312866, "l2_params": 296.70855712890625, "l2_updates": 0.5246245861053467, "training_loss": 2.3634562492370605, "uptime": 22687.784675780975, "examples_seen": 62976000.0, "progress": 0.5516833068704755, "epoch": 49.651714228272056, "img/sec/core": 189.90794025083696, "core_hours_Tesla V100-SXM2-32GB": 92.25197719127095, "core_hours": 92.25197719127095}
{"step": 61550, "global_schedule": 0.487455278635025, "l2_grads": 1.601189374923706, "l2_params": 296.6364440917969, "l2_updates": 0.5234653353691101, "training_loss": 2.888997793197632, "uptime": 22704.631523491, "examples_seen": 63027200.0, "progress": 0.5521318298841914, "epoch": 49.69208147561211, "img/sec/core": 189.94651433192337, "core_hours_Tesla V100-SXM2-32GB": 92.32685206998217, "core_hours": 92.32685206998217}
{"step": 61600, "global_schedule": 0.48668158054351807, "l2_grads": 1.6789432764053345, "l2_params": 296.5468444824219, "l2_updates": 0.5278023481369019, "training_loss": 2.3595757484436035, "uptime": 22721.508788164996, "examples_seen": 63078400.0, "progress": 0.5525803528979072, "epoch": 49.73244872295217, "img/sec/core": 189.60418419759807, "core_hours_Tesla V100-SXM2-32GB": 92.40186213519993, "core_hours": 92.40186213519993}
{"step": 61650, "global_schedule": 0.4859079122543335, "l2_grads": 1.5003770589828491, "l2_params": 296.4739685058594, "l2_updates": 0.5272362232208252, "training_loss": 4.599471569061279, "uptime": 22738.35498702497, "examples_seen": 63129600.0, "progress": 0.553028875911623, "epoch": 49.77281597029223, "img/sec/core": 189.9538303327956, "core_hours_Tesla V100-SXM2-32GB": 92.47673413013315, "core_hours": 92.47673413013315}
{"step": 61700, "global_schedule": 0.4851342737674713, "l2_grads": 1.5915879011154175, "l2_params": 296.37957763671875, "l2_updates": 0.5250977873802185, "training_loss": 2.8253414630889893, "uptime": 22755.237893124984, "examples_seen": 63180800.0, "progress": 0.5534773989253389, "epoch": 49.813183217632286, "img/sec/core": 189.54082792637837, "core_hours_Tesla V100-SXM2-32GB": 92.55176926835543, "core_hours": 92.55176926835543}
{"step": 61750, "global_schedule": 0.4843606650829315, "l2_grads": 1.6953706741333008, "l2_params": 296.2878723144531, "l2_updates": 0.5234089493751526, "training_loss": 2.206754684448242, "uptime": 22772.107215366967, "examples_seen": 63232000.0, "progress": 0.5539259219390547, "epoch": 49.85355046497234, "img/sec/core": 189.69345383872061, "core_hours_Tesla V100-SXM2-32GB": 92.62674403387535, "core_hours": 92.62674403387535}
{"step": 61800, "global_schedule": 0.4835870862007141, "l2_grads": 1.7424167394638062, "l2_params": 296.18670654296875, "l2_updates": 0.5170203447341919, "training_loss": 2.376396656036377, "uptime": 22788.95602172299, "examples_seen": 63283200.0, "progress": 0.5543744449527706, "epoch": 49.8939177123124, "img/sec/core": 189.924433362387, "core_hours_Tesla V100-SXM2-32GB": 92.70162761767989, "core_hours": 92.70162761767989}
{"step": 61850, "global_schedule": 0.4828135669231415, "l2_grads": 1.6485693454742432, "l2_params": 296.1007385253906, "l2_updates": 0.5050463080406189, "training_loss": 4.521457672119141, "uptime": 22805.834583975957, "examples_seen": 63334400.0, "progress": 0.5548229679664863, "epoch": 49.934284959652466, "img/sec/core": 189.58960793222738, "core_hours_Tesla V100-SXM2-32GB": 92.77664344991531, "core_hours": 92.77664344991531}
{"step": 61900, "global_schedule": 0.48204007744789124, "l2_grads": 1.7276310920715332, "l2_params": 295.9941101074219, "l2_updates": 0.515562117099762, "training_loss": 2.2339553833007812, "uptime": 22822.693638172, "examples_seen": 63385600.0, "progress": 0.5552714909802022, "epoch": 49.97465220699252, "img/sec/core": 189.8089870753787, "core_hours_Tesla V100-SXM2-32GB": 92.85157257967552, "core_hours": 92.85157257967552}
{"step": 61950, "global_schedule": 0.4812666177749634, "l2_grads": 1.637738585472107, "l2_params": 295.90484619140625, "l2_updates": 0.5257070660591125, "training_loss": 2.2589874267578125, "uptime": 22839.570669551962, "examples_seen": 63436800.0, "progress": 0.555720013993918, "epoch": 50.01501945433258, "img/sec/core": 189.6068051280306, "core_hours_Tesla V100-SXM2-32GB": 92.92658160803089, "core_hours": 92.92658160803089}
{"step": 62000, "global_schedule": 0.4804932177066803, "l2_grads": 1.6654911041259766, "l2_params": 295.8207092285156, "l2_updates": 0.5229262709617615, "training_loss": 2.2930359840393066, "uptime": 22856.44169768796, "examples_seen": 63488000.0, "progress": 0.5561685370076339, "epoch": 50.05538670167264, "img/sec/core": 189.6742732099667, "core_hours_Tesla V100-SXM2-32GB": 93.00156395530198, "core_hours": 93.00156395530198}
{"step": 62050, "global_schedule": 0.479719877243042, "l2_grads": 1.6191567182540894, "l2_params": 295.7393798828125, "l2_updates": 0.5216959118843079, "training_loss": 2.207406997680664, "uptime": 22874.06339533499, "examples_seen": 63539200.0, "progress": 0.5566170600213497, "epoch": 50.095753949012696, "img/sec/core": 189.70408294517037, "core_hours_Tesla V100-SXM2-32GB": 93.07653451999107, "core_hours": 93.07653451999107}
{"step": 62100, "global_schedule": 0.4789465665817261, "l2_grads": 1.6512374877929688, "l2_params": 295.6495361328125, "l2_updates": 0.517855703830719, "training_loss": 2.3965282440185547, "uptime": 22890.895131642, "examples_seen": 63590400.0, "progress": 0.5570655830350655, "epoch": 50.136121196352754, "img/sec/core": 190.1170468472374, "core_hours_Tesla V100-SXM2-32GB": 93.1513422369111, "core_hours": 93.1513422369111}
{"step": 62150, "global_schedule": 0.47817331552505493, "l2_grads": 1.5170048475265503, "l2_params": 295.5483703613281, "l2_updates": 0.5032479166984558, "training_loss": 3.305360794067383, "uptime": 22907.75983210496, "examples_seen": 63641600.0, "progress": 0.5575141060487814, "epoch": 50.17648844369281, "img/sec/core": 189.74543941815855, "core_hours_Tesla V100-SXM2-32GB": 93.22629646119093, "core_hours": 93.22629646119093}
{"step": 62200, "global_schedule": 0.47740012407302856, "l2_grads": 1.5632710456848145, "l2_params": 295.4604797363281, "l2_updates": 0.5163577795028687, "training_loss": 3.391831398010254, "uptime": 22924.639536628965, "examples_seen": 63692800.0, "progress": 0.5579626290624972, "epoch": 50.216855691032876, "img/sec/core": 189.57677816273244, "core_hours_Tesla V100-SXM2-32GB": 93.30131737018651, "core_hours": 93.30131737018651}
{"step": 62250, "global_schedule": 0.4766269624233246, "l2_grads": 1.6342610120773315, "l2_params": 295.3678894042969, "l2_updates": 0.5222213864326477, "training_loss": 2.5225918292999268, "uptime": 22941.504170937988, "examples_seen": 63744000.0, "progress": 0.5584111520762131, "epoch": 50.257222938372934, "img/sec/core": 189.74618372175837, "core_hours_Tesla V100-SXM2-32GB": 93.37627130044883, "core_hours": 93.37627130044883}
{"step": 62300, "global_schedule": 0.4758538603782654, "l2_grads": 1.4520106315612793, "l2_params": 295.2678527832031, "l2_updates": 0.5125961899757385, "training_loss": 2.6757805347442627, "uptime": 22958.36112377199, "examples_seen": 63795200.0, "progress": 0.5588596750899288, "epoch": 50.29759018571299, "img/sec/core": 189.83264837435195, "core_hours_Tesla V100-SXM2-32GB": 93.45119109082218, "core_hours": 93.45119109082218}
{"step": 62350, "global_schedule": 0.47508084774017334, "l2_grads": 1.7436696290969849, "l2_params": 295.17791748046875, "l2_updates": 0.5080747604370117, "training_loss": 4.757720947265625, "uptime": 22975.210448846978, "examples_seen": 63846400.0, "progress": 0.5593081981036447, "epoch": 50.33795743305305, "img/sec/core": 189.91858639786562, "core_hours_Tesla V100-SXM2-32GB": 93.52607698004434, "core_hours": 93.52607698004434}
{"step": 62400, "global_schedule": 0.4743078649044037, "l2_grads": 1.4669474363327026, "l2_params": 295.08660888671875, "l2_updates": 0.5205287933349609, "training_loss": 4.6965532302856445, "uptime": 22992.06479053799, "examples_seen": 63897600.0, "progress": 0.5597567211173605, "epoch": 50.378324680393106, "img/sec/core": 189.86205801836448, "core_hours_Tesla V100-SXM2-32GB": 93.60098516533772, "core_hours": 93.60098516533772}
{"step": 62450, "global_schedule": 0.4735349416732788, "l2_grads": 1.4738813638687134, "l2_params": 294.9940490722656, "l2_updates": 0.5113641619682312, "training_loss": 3.380338668823242, "uptime": 23008.926940139965, "examples_seen": 63948800.0, "progress": 0.5602052441310764, "epoch": 50.418691927733164, "img/sec/core": 189.77414360176502, "core_hours_Tesla V100-SXM2-32GB": 93.67592805245762, "core_hours": 93.67592805245762}
{"step": 62500, "global_schedule": 0.4727621078491211, "l2_grads": 1.6699477434158325, "l2_params": 294.9146728515625, "l2_updates": 0.5099348425865173, "training_loss": 2.1264665126800537, "uptime": 23025.813025839976, "examples_seen": 64000000.0, "progress": 0.5606537671447922, "epoch": 50.45905917507322, "img/sec/core": 189.50513794904748, "core_hours_Tesla V100-SXM2-32GB": 93.75097732223544, "core_hours": 93.75097732223544, "minival/prec@1": 0.7059787699032157, "minival/loss": 1.1847260159847701, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.898523796990048, "real/prec@1": 0.7497491299613553, "real/loss": 1.9979737584351716, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.114131508977152, "train/prec@1": 0.7311790188502517, "train/loss": 1.0424546567170023, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.56453482399229, "v2/prec@1": 0.5459, "v2/loss": 1.9799359375, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3281623519724235, "val/prec@1": 0.67316, "val/loss": 1.3305270336914063, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.34979283704888}
{"step": 62550, "global_schedule": 0.47198939323425293, "l2_grads": 1.674625039100647, "l2_params": 294.8213806152344, "l2_updates": 0.5142439603805542, "training_loss": 2.3014090061187744, "uptime": 23078.965273418988, "examples_seen": 64051200.0, "progress": 0.561102290158508, "epoch": 50.499426422413286, "img/sec/core": 189.40458900819806, "core_hours_Tesla V100-SXM2-32GB": 93.82606643331083, "core_hours": 93.82606643331083}
{"step": 62600, "global_schedule": 0.47121661901474, "l2_grads": 1.6182509660720825, "l2_params": 294.7299499511719, "l2_updates": 0.5142106413841248, "training_loss": 2.8591670989990234, "uptime": 23095.844348603976, "examples_seen": 64102400.0, "progress": 0.5615508131722239, "epoch": 50.539793669753344, "img/sec/core": 189.58384656322707, "core_hours_Tesla V100-SXM2-32GB": 93.9010845452441, "core_hours": 93.9010845452441}
{"step": 62650, "global_schedule": 0.4704440236091614, "l2_grads": 1.5600414276123047, "l2_params": 294.643310546875, "l2_updates": 0.508822500705719, "training_loss": 3.877324342727661, "uptime": 23112.72557749698, "examples_seen": 64153600.0, "progress": 0.5619993361859397, "epoch": 50.5801609170934, "img/sec/core": 189.55965944670217, "core_hours_Tesla V100-SXM2-32GB": 93.97611222921302, "core_hours": 93.97611222921302}
{"step": 62700, "global_schedule": 0.469671368598938, "l2_grads": 1.6877182722091675, "l2_params": 294.558837890625, "l2_updates": 0.5095267295837402, "training_loss": 2.2546603679656982, "uptime": 23129.579502321954, "examples_seen": 64204800.0, "progress": 0.5624478591996556, "epoch": 50.62052816443346, "img/sec/core": 189.86675407846406, "core_hours_Tesla V100-SXM2-32GB": 94.05101856176844, "core_hours": 94.05101856176844}
{"step": 62750, "global_schedule": 0.4688989222049713, "l2_grads": 1.547924280166626, "l2_params": 294.4674987792969, "l2_updates": 0.4966326355934143, "training_loss": 4.258721351623535, "uptime": 23146.460967602965, "examples_seen": 64256000.0, "progress": 0.5628963822133713, "epoch": 50.66089541177352, "img/sec/core": 189.55700507820092, "core_hours_Tesla V100-SXM2-32GB": 94.12604729635072, "core_hours": 94.12604729635072}
{"step": 62800, "global_schedule": 0.46812644600868225, "l2_grads": 1.5358620882034302, "l2_params": 294.39093017578125, "l2_updates": 0.50333571434021, "training_loss": 3.4998273849487305, "uptime": 23163.31795460597, "examples_seen": 64307200.0, "progress": 0.5633449052270872, "epoch": 50.701262659113574, "img/sec/core": 189.83226358480968, "core_hours_Tesla V100-SXM2-32GB": 94.2009672385863, "core_hours": 94.2009672385863}
{"step": 62850, "global_schedule": 0.4673541486263275, "l2_grads": 1.4643715620040894, "l2_params": 294.3077087402344, "l2_updates": 0.5043631196022034, "training_loss": 3.8850860595703125, "uptime": 23180.17277700198, "examples_seen": 64358400.0, "progress": 0.563793428240803, "epoch": 50.74162990645363, "img/sec/core": 189.85664309091658, "core_hours_Tesla V100-SXM2-32GB": 94.27587756034633, "core_hours": 94.27587756034633}
{"step": 62900, "global_schedule": 0.4665818214416504, "l2_grads": 1.5563876628875732, "l2_params": 294.2226867675781, "l2_updates": 0.5162892937660217, "training_loss": 3.1073386669158936, "uptime": 23197.053440089978, "examples_seen": 64409600.0, "progress": 0.5642419512545188, "epoch": 50.7819971537937, "img/sec/core": 189.56601309547995, "core_hours_Tesla V100-SXM2-32GB": 94.35090272962633, "core_hours": 94.35090272962633}
{"step": 62950, "global_schedule": 0.4658096730709076, "l2_grads": 1.651452898979187, "l2_params": 294.13427734375, "l2_updates": 0.5058859586715698, "training_loss": 2.4495487213134766, "uptime": 23213.90941351495, "examples_seen": 64460800.0, "progress": 0.5646904742682347, "epoch": 50.822364401133754, "img/sec/core": 189.84367851809833, "core_hours_Tesla V100-SXM2-32GB": 94.42581816707066, "core_hours": 94.42581816707066}
{"step": 63000, "global_schedule": 0.4650374948978424, "l2_grads": 1.744890570640564, "l2_params": 294.0380554199219, "l2_updates": 0.5010397434234619, "training_loss": 2.2164933681488037, "uptime": 23230.781720531988, "examples_seen": 64512000.0, "progress": 0.5651389972819505, "epoch": 50.86273164847381, "img/sec/core": 189.65989634781738, "core_hours_Tesla V100-SXM2-32GB": 94.5008061982575, "core_hours": 94.5008061982575}
{"step": 63050, "global_schedule": 0.46426552534103394, "l2_grads": 1.658275842666626, "l2_params": 293.9462890625, "l2_updates": 0.502553403377533, "training_loss": 2.2311933040618896, "uptime": 23248.16613619699, "examples_seen": 64563200.0, "progress": 0.5655875202956664, "epoch": 50.90309889581387, "img/sec/core": 189.57343842228855, "core_hours_Tesla V100-SXM2-32GB": 94.57582842890639, "core_hours": 94.57582842890639}
{"step": 63100, "global_schedule": 0.4634935259819031, "l2_grads": 1.6313470602035522, "l2_params": 293.8524475097656, "l2_updates": 0.506299614906311, "training_loss": 2.7226853370666504, "uptime": 23265.035307979968, "examples_seen": 64614400.0, "progress": 0.5660360433093822, "epoch": 50.94346614315393, "img/sec/core": 189.6951457468017, "core_hours_Tesla V100-SXM2-32GB": 94.65080252571963, "core_hours": 94.65080252571963}
{"step": 63150, "global_schedule": 0.46272173523902893, "l2_grads": 1.6956524848937988, "l2_params": 293.7611999511719, "l2_updates": 0.5016270279884338, "training_loss": 2.2702226638793945, "uptime": 23281.895281869976, "examples_seen": 64665600.0, "progress": 0.5664845663230981, "epoch": 50.983833390493984, "img/sec/core": 189.7986331933996, "core_hours_Tesla V100-SXM2-32GB": 94.72573574300856, "core_hours": 94.72573574300856}
{"step": 63200, "global_schedule": 0.4619499146938324, "l2_grads": 1.880397915840149, "l2_params": 293.6675109863281, "l2_updates": 0.48445579409599304, "training_loss": 2.3387608528137207, "uptime": 23298.772093317006, "examples_seen": 64716800.0, "progress": 0.5669330893368139, "epoch": 51.02420063783404, "img/sec/core": 189.60927602015963, "core_hours_Tesla V100-SXM2-32GB": 94.80074379388424, "core_hours": 94.80074379388424}
{"step": 63250, "global_schedule": 0.4611783027648926, "l2_grads": 1.711737871170044, "l2_params": 293.58349609375, "l2_updates": 0.498162180185318, "training_loss": 2.2225091457366943, "uptime": 23315.641740374966, "examples_seen": 64768000.0, "progress": 0.5673816123505298, "epoch": 51.06456788517411, "img/sec/core": 189.68980139333178, "core_hours_Tesla V100-SXM2-32GB": 94.87572000303072, "core_hours": 94.87572000303072}
{"step": 63300, "global_schedule": 0.46040666103363037, "l2_grads": 1.7760452032089233, "l2_params": 293.49859619140625, "l2_updates": 0.49560603499412537, "training_loss": 2.18953800201416, "uptime": 23332.494204232993, "examples_seen": 64819200.0, "progress": 0.5678301353642455, "epoch": 51.104935132514164, "img/sec/core": 189.88321392991548, "core_hours_Tesla V100-SXM2-32GB": 94.95061984239973, "core_hours": 94.95061984239973}
{"step": 63350, "global_schedule": 0.4596352279186249, "l2_grads": 1.6515872478485107, "l2_params": 293.4046936035156, "l2_updates": 0.5049425363540649, "training_loss": 2.4232518672943115, "uptime": 23349.378744226997, "examples_seen": 64870400.0, "progress": 0.5682786583779613, "epoch": 51.14530237985422, "img/sec/core": 189.52248631804187, "core_hours_Tesla V100-SXM2-32GB": 95.02566224237309, "core_hours": 95.02566224237309}
{"step": 63400, "global_schedule": 0.458863765001297, "l2_grads": 1.6912680864334106, "l2_params": 293.3247985839844, "l2_updates": 0.4896591305732727, "training_loss": 2.2357678413391113, "uptime": 23366.261969730956, "examples_seen": 64921600.0, "progress": 0.5687271813916772, "epoch": 51.18566962719428, "img/sec/core": 189.53724211345104, "core_hours_Tesla V100-SXM2-32GB": 95.10069880016846, "core_hours": 95.10069880016846}
{"step": 63450, "global_schedule": 0.45809242129325867, "l2_grads": 1.6877014636993408, "l2_params": 293.2413024902344, "l2_updates": 0.5030743479728699, "training_loss": 2.2872424125671387, "uptime": 23383.118035801977, "examples_seen": 64972800.0, "progress": 0.569175704405393, "epoch": 51.22603687453434, "img/sec/core": 189.84263507969203, "core_hours_Tesla V100-SXM2-32GB": 95.175614649373, "core_hours": 95.175614649373}
{"step": 63500, "global_schedule": 0.45732128620147705, "l2_grads": 1.6537081003189087, "l2_params": 293.1402893066406, "l2_updates": 0.49570411443710327, "training_loss": 2.430551290512085, "uptime": 23399.997965530958, "examples_seen": 65024000.0, "progress": 0.5696242274191089, "epoch": 51.266404121874395, "img/sec/core": 189.5742489085139, "core_hours_Tesla V100-SXM2-32GB": 95.25063655927958, "core_hours": 95.25063655927958}
{"step": 63550, "global_schedule": 0.45655012130737305, "l2_grads": 1.7347208261489868, "l2_params": 293.0514221191406, "l2_updates": 0.4986932873725891, "training_loss": 2.2026782035827637, "uptime": 23416.84565021796, "examples_seen": 65075200.0, "progress": 0.5700727504328247, "epoch": 51.30677136921445, "img/sec/core": 189.93707796944457, "core_hours_Tesla V100-SXM2-32GB": 95.32551515788849, "core_hours": 95.32551515788849}
{"step": 63600, "global_schedule": 0.45577919483184814, "l2_grads": 1.5346308946609497, "l2_params": 292.9636535644531, "l2_updates": 0.48985618352890015, "training_loss": 3.9777238368988037, "uptime": 23433.703832334955, "examples_seen": 65126400.0, "progress": 0.5705212734465406, "epoch": 51.34713861655452, "img/sec/core": 189.81880595383268, "core_hours_Tesla V100-SXM2-32GB": 95.4004404117418, "core_hours": 95.4004404117418}
{"step": 63650, "global_schedule": 0.45500826835632324, "l2_grads": 1.4987142086029053, "l2_params": 292.861328125, "l2_updates": 0.4889282286167145, "training_loss": 4.526867389678955, "uptime": 23450.557265124982, "examples_seen": 65177600.0, "progress": 0.5709697964602564, "epoch": 51.387505863894575, "img/sec/core": 189.8722972268057, "core_hours_Tesla V100-SXM2-32GB": 95.47534455747524, "core_hours": 95.47534455747524}
{"step": 63700, "global_schedule": 0.45423755049705505, "l2_grads": 1.6907483339309692, "l2_params": 292.7871398925781, "l2_updates": 0.4927525520324707, "training_loss": 2.3358306884765625, "uptime": 23467.425412668963, "examples_seen": 65228800.0, "progress": 0.5714183194739723, "epoch": 51.42787311123463, "img/sec/core": 189.7066640931709, "core_hours_Tesla V100-SXM2-32GB": 95.55031410211517, "core_hours": 95.55031410211517}
{"step": 63750, "global_schedule": 0.45346683263778687, "l2_grads": 1.6978425979614258, "l2_params": 292.69586181640625, "l2_updates": 0.4929673969745636, "training_loss": 2.461930274963379, "uptime": 23484.285988406977, "examples_seen": 65280000.0, "progress": 0.571866842487688, "epoch": 51.46824035857469, "img/sec/core": 189.79185822138356, "core_hours_Tesla V100-SXM2-32GB": 95.6252499942841, "core_hours": 95.6252499942841}
{"step": 63800, "global_schedule": 0.4526963531970978, "l2_grads": 1.6036410331726074, "l2_params": 292.6157531738281, "l2_updates": 0.48962628841400146, "training_loss": 4.144932746887207, "uptime": 23501.15837617498, "examples_seen": 65331200.0, "progress": 0.5723153655014038, "epoch": 51.50860760591475, "img/sec/core": 189.65898863874295, "core_hours_Tesla V100-SXM2-32GB": 95.70023838436413, "core_hours": 95.70023838436413}
{"step": 63850, "global_schedule": 0.4519258439540863, "l2_grads": 1.6273324489593506, "l2_params": 292.51904296875, "l2_updates": 0.4945744574069977, "training_loss": 2.282270669937134, "uptime": 23518.032910723006, "examples_seen": 65382400.0, "progress": 0.5727638885151197, "epoch": 51.548974853254805, "img/sec/core": 189.63486020265168, "core_hours_Tesla V100-SXM2-32GB": 95.77523631568869, "core_hours": 95.77523631568869}
{"step": 63900, "global_schedule": 0.45115557312965393, "l2_grads": 1.6614001989364624, "l2_params": 292.4266052246094, "l2_updates": 0.49223828315734863, "training_loss": 2.169889450073242, "uptime": 23534.88400232297, "examples_seen": 65433600.0, "progress": 0.5732124115288355, "epoch": 51.58934210059486, "img/sec/core": 189.898676950201, "core_hours_Tesla V100-SXM2-32GB": 95.85013005613297, "core_hours": 95.85013005613297}
{"step": 63950, "global_schedule": 0.45038533210754395, "l2_grads": 1.725905179977417, "l2_params": 292.33856201171875, "l2_updates": 0.49018394947052, "training_loss": 2.0909037590026855, "uptime": 23551.77045924496, "examples_seen": 65484800.0, "progress": 0.5736609345425514, "epoch": 51.62970934793492, "img/sec/core": 189.50097197910767, "core_hours_Tesla V100-SXM2-32GB": 95.92518097578626, "core_hours": 95.92518097578626}
{"step": 64000, "global_schedule": 0.4496152997016907, "l2_grads": 1.7378346920013428, "l2_params": 292.2462158203125, "l2_updates": 0.48073452711105347, "training_loss": 2.2124199867248535, "uptime": 23568.618388804956, "examples_seen": 65536000.0, "progress": 0.5741094575562672, "epoch": 51.670076595274985, "img/sec/core": 189.9343173654933, "core_hours_Tesla V100-SXM2-32GB": 96.00006066271958, "core_hours": 96.00006066271958}
{"step": 64050, "global_schedule": 0.4488452672958374, "l2_grads": 1.656581163406372, "l2_params": 292.1628723144531, "l2_updates": 0.4850621521472931, "training_loss": 2.5546998977661133, "uptime": 23585.983432092995, "examples_seen": 65587200.0, "progress": 0.5745579805699831, "epoch": 51.71044384261504, "img/sec/core": 189.84783613072977, "core_hours_Tesla V100-SXM2-32GB": 96.07497445953751, "core_hours": 96.07497445953751}
{"step": 64100, "global_schedule": 0.44807547330856323, "l2_grads": 1.7329787015914917, "l2_params": 292.0652160644531, "l2_updates": 0.4959966540336609, "training_loss": 2.1069517135620117, "uptime": 23602.86626327096, "examples_seen": 65638400.0, "progress": 0.5750065035836989, "epoch": 51.7508110899551, "img/sec/core": 189.54166906416143, "core_hours_Tesla V100-SXM2-32GB": 96.15000926477292, "core_hours": 96.15000926477292}
{"step": 64150, "global_schedule": 0.44730570912361145, "l2_grads": 1.5421804189682007, "l2_params": 291.97796630859375, "l2_updates": 0.48607978224754333, "training_loss": 4.58195686340332, "uptime": 23619.714067984954, "examples_seen": 65689600.0, "progress": 0.5754550265974148, "epoch": 51.79117833729516, "img/sec/core": 189.9357248212872, "core_hours_Tesla V100-SXM2-32GB": 96.2248883968351, "core_hours": 96.2248883968351}
{"step": 64200, "global_schedule": 0.44653618335723877, "l2_grads": 1.510441541671753, "l2_params": 291.9035949707031, "l2_updates": 0.4780445396900177, "training_loss": 3.122523784637451, "uptime": 23636.606027750997, "examples_seen": 65740800.0, "progress": 0.5759035496111305, "epoch": 51.831545584635215, "img/sec/core": 189.43923880477732, "core_hours_Tesla V100-SXM2-32GB": 96.29996377357308, "core_hours": 96.29996377357308}
{"step": 64250, "global_schedule": 0.4457666575908661, "l2_grads": 1.8138588666915894, "l2_params": 291.8229675292969, "l2_updates": 0.4796641170978546, "training_loss": 2.323911666870117, "uptime": 23653.491417853977, "examples_seen": 65792000.0, "progress": 0.5763520726248463, "epoch": 51.87191283197527, "img/sec/core": 189.5129446512049, "core_hours_Tesla V100-SXM2-32GB": 96.37500995180855, "core_hours": 96.37500995180855}
{"step": 64300, "global_schedule": 0.4449973702430725, "l2_grads": 1.5212472677230835, "l2_params": 291.7200012207031, "l2_updates": 0.4903554320335388, "training_loss": 3.1426992416381836, "uptime": 23670.349828114966, "examples_seen": 65843200.0, "progress": 0.5768005956385622, "epoch": 51.91228007931533, "img/sec/core": 189.81623714573246, "core_hours_Tesla V100-SXM2-32GB": 96.44993621963516, "core_hours": 96.44993621963516}
{"step": 64350, "global_schedule": 0.4442281126976013, "l2_grads": 1.6381511688232422, "l2_params": 291.6331787109375, "l2_updates": 0.49074944853782654, "training_loss": 2.164649724960327, "uptime": 23687.231773509004, "examples_seen": 65894400.0, "progress": 0.577249118652278, "epoch": 51.952647326655395, "img/sec/core": 189.55161418364455, "core_hours_Tesla V100-SXM2-32GB": 96.5249670880531, "core_hours": 96.5249670880531}
{"step": 64400, "global_schedule": 0.44345909357070923, "l2_grads": 1.589409589767456, "l2_params": 291.54449462890625, "l2_updates": 0.473825603723526, "training_loss": 4.1047539710998535, "uptime": 23704.106835615006, "examples_seen": 65945600.0, "progress": 0.5776976416659939, "epoch": 51.99301457399545, "img/sec/core": 189.62893172770816, "core_hours_Tesla V100-SXM2-32GB": 96.59996736407977, "core_hours": 96.59996736407977}
{"step": 64450, "global_schedule": 0.4426901042461395, "l2_grads": 1.6485974788665771, "l2_params": 291.4674987792969, "l2_updates": 0.4808233380317688, "training_loss": 4.765459060668945, "uptime": 23721.002821889997, "examples_seen": 65996800.0, "progress": 0.5781461646797097, "epoch": 52.03338182133551, "img/sec/core": 189.39409324311598, "core_hours_Tesla V100-SXM2-32GB": 96.67506063641308, "core_hours": 96.67506063641308}
{"step": 64500, "global_schedule": 0.4419213533401489, "l2_grads": 1.592551350593567, "l2_params": 291.3789978027344, "l2_updates": 0.47056934237480164, "training_loss": 3.9285600185394287, "uptime": 23737.891992766003, "examples_seen": 66048000.0, "progress": 0.5785946876934256, "epoch": 52.07374906867557, "img/sec/core": 189.4705206959697, "core_hours_Tesla V100-SXM2-32GB": 96.75012361808422, "core_hours": 96.75012361808422}
{"step": 64550, "global_schedule": 0.4411526620388031, "l2_grads": 1.6456375122070312, "l2_params": 291.2881774902344, "l2_updates": 0.48024457693099976, "training_loss": 2.9749460220336914, "uptime": 23754.769060055958, "examples_seen": 66099200.0, "progress": 0.5790432107071414, "epoch": 52.114116316015625, "img/sec/core": 189.60640169423934, "core_hours_Tesla V100-SXM2-32GB": 96.82513280603958, "core_hours": 96.82513280603958}
{"step": 64600, "global_schedule": 0.4403842091560364, "l2_grads": 1.6087322235107422, "l2_params": 291.2021179199219, "l2_updates": 0.4736020267009735, "training_loss": 3.4798390865325928, "uptime": 23771.63853840297, "examples_seen": 66150400.0, "progress": 0.5794917337208573, "epoch": 52.15448356335568, "img/sec/core": 189.69169847309783, "core_hours_Tesla V100-SXM2-32GB": 96.90010826535963, "core_hours": 96.90010826535963}
{"step": 64650, "global_schedule": 0.43961575627326965, "l2_grads": 1.7352062463760376, "l2_params": 291.1112976074219, "l2_updates": 0.47871989011764526, "training_loss": 2.301335573196411, "uptime": 23788.53955222899, "examples_seen": 66201600.0, "progress": 0.5799402567345731, "epoch": 52.19485081069574, "img/sec/core": 189.33775410995878, "core_hours_Tesla V100-SXM2-32GB": 96.97522388236416, "core_hours": 96.97522388236416}
{"step": 64700, "global_schedule": 0.4388476014137268, "l2_grads": 1.789732575416565, "l2_params": 291.01092529296875, "l2_updates": 0.47157996892929077, "training_loss": 2.2405169010162354, "uptime": 23805.41253524, "examples_seen": 66252800.0, "progress": 0.5803887797482888, "epoch": 52.235218058035805, "img/sec/core": 189.6522978724033, "core_hours_Tesla V100-SXM2-32GB": 97.05021491796865, "core_hours": 97.05021491796865}
{"step": 64750, "global_schedule": 0.43807944655418396, "l2_grads": 1.7139383554458618, "l2_params": 290.9225158691406, "l2_updates": 0.4686836302280426, "training_loss": 2.1435279846191406, "uptime": 23822.289117523003, "examples_seen": 66304000.0, "progress": 0.5808373027620047, "epoch": 52.27558530537586, "img/sec/core": 189.6118506898682, "core_hours_Tesla V100-SXM2-32GB": 97.12522195033755, "core_hours": 97.12522195033755}
{"step": 64800, "global_schedule": 0.437311589717865, "l2_grads": 1.6166694164276123, "l2_params": 290.8542785644531, "l2_updates": 0.4735998213291168, "training_loss": 2.8739428520202637, "uptime": 23839.176344788983, "examples_seen": 66355200.0, "progress": 0.5812858257757205, "epoch": 52.31595255271592, "img/sec/core": 189.492327520616, "core_hours_Tesla V100-SXM2-32GB": 97.2002762937419, "core_hours": 97.2002762937419}
{"step": 64850, "global_schedule": 0.436543732881546, "l2_grads": 1.5506556034088135, "l2_params": 290.76263427734375, "l2_updates": 0.47268620133399963, "training_loss": 3.7538256645202637, "uptime": 23856.069522798993, "examples_seen": 66406400.0, "progress": 0.5817343487894364, "epoch": 52.35631980005598, "img/sec/core": 189.42557747889825, "core_hours_Tesla V100-SXM2-32GB": 97.2753570848975, "core_hours": 97.2753570848975}
{"step": 64900, "global_schedule": 0.4357761740684509, "l2_grads": 1.7352931499481201, "l2_params": 290.6624450683594, "l2_updates": 0.4745950698852539, "training_loss": 2.568117141723633, "uptime": 23872.938589800964, "examples_seen": 66457600.0, "progress": 0.5821828718031522, "epoch": 52.396687047396036, "img/sec/core": 189.6963240246796, "core_hours_Tesla V100-SXM2-32GB": 97.35033071601738, "core_hours": 97.35033071601738}
{"step": 64950, "global_schedule": 0.4350086748600006, "l2_grads": 1.598301887512207, "l2_params": 290.57281494140625, "l2_updates": 0.4811418056488037, "training_loss": 2.8175411224365234, "uptime": 23889.820423953002, "examples_seen": 66508800.0, "progress": 0.5826313948168681, "epoch": 52.43705429473609, "img/sec/core": 189.5528632245005, "core_hours_Tesla V100-SXM2-32GB": 97.42536109002643, "core_hours": 97.42536109002643}
{"step": 65000, "global_schedule": 0.4342413544654846, "l2_grads": 1.7025432586669922, "l2_params": 290.487060546875, "l2_updates": 0.47219958901405334, "training_loss": 2.1832690238952637, "uptime": 23906.69739418698, "examples_seen": 66560000.0, "progress": 0.5830799178305839, "epoch": 52.47742154207615, "img/sec/core": 189.6074920815799, "core_hours_Tesla V100-SXM2-32GB": 97.5003698466219, "core_hours": 97.5003698466219, "minival/prec@1": 0.7104277240087418, "minival/loss": 1.1894993920494459, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.8841775459586643, "real/prec@1": 0.7564959327027777, "real/loss": 1.9902764325321394, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.166456514038146, "train/prec@1": 0.7398040822698357, "train/loss": 1.0402896904030705, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.631489782012068, "v2/prec@1": 0.5522, "v2/loss": 1.9793887329101563, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.37678378802957, "val/prec@1": 0.68114, "val/loss": 1.3259506201171876, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.289532133960165}
{"step": 65050, "global_schedule": 0.43347418308258057, "l2_grads": 1.4791467189788818, "l2_params": 290.397216796875, "l2_updates": 0.4700824022293091, "training_loss": 4.016301155090332, "uptime": 23960.562637913972, "examples_seen": 66611200.0, "progress": 0.5835284408442997, "epoch": 52.517788789416215, "img/sec/core": 188.90583572802302, "core_hours_Tesla V100-SXM2-32GB": 97.57565720959515, "core_hours": 97.57565720959515}
{"step": 65100, "global_schedule": 0.43270719051361084, "l2_grads": 1.5619031190872192, "l2_params": 290.30780029296875, "l2_updates": 0.4598393738269806, "training_loss": 3.669994831085205, "uptime": 23977.43842996197, "examples_seen": 66662400.0, "progress": 0.5839769638580156, "epoch": 52.55815603675627, "img/sec/core": 189.62072955737472, "core_hours_Tesla V100-SXM2-32GB": 97.65066072980848, "core_hours": 97.65066072980848}
{"step": 65150, "global_schedule": 0.43194034695625305, "l2_grads": 1.7072516679763794, "l2_params": 290.2156066894531, "l2_updates": 0.4777649939060211, "training_loss": 2.4266767501831055, "uptime": 23994.29991155595, "examples_seen": 66713600.0, "progress": 0.5844254868717313, "epoch": 52.59852328409633, "img/sec/core": 189.78166195920102, "core_hours_Tesla V100-SXM2-32GB": 97.72560064800395, "core_hours": 97.72560064800395}
{"step": 65200, "global_schedule": 0.4311736822128296, "l2_grads": 1.7310163974761963, "l2_params": 290.1249694824219, "l2_updates": 0.46305468678474426, "training_loss": 2.2230048179626465, "uptime": 24011.175079436973, "examples_seen": 66764800.0, "progress": 0.5848740098854472, "epoch": 52.63889053143639, "img/sec/core": 189.62774311707537, "core_hours_Tesla V100-SXM2-32GB": 97.80060139414181, "core_hours": 97.80060139414181}
{"step": 65250, "global_schedule": 0.43040716648101807, "l2_grads": 1.6297107934951782, "l2_params": 290.0465087890625, "l2_updates": 0.45853185653686523, "training_loss": 4.138426780700684, "uptime": 24028.049626692955, "examples_seen": 66816000.0, "progress": 0.585322532899163, "epoch": 52.679257778776446, "img/sec/core": 189.63471739163674, "core_hours_Tesla V100-SXM2-32GB": 97.87559938194617, "core_hours": 97.87559938194617}
{"step": 65300, "global_schedule": 0.4296407997608185, "l2_grads": 1.6557245254516602, "l2_params": 289.96319580078125, "l2_updates": 0.4645213484764099, "training_loss": 2.5904159545898438, "uptime": 24044.93146544299, "examples_seen": 66867200.0, "progress": 0.5857710559128789, "epoch": 52.7196250261165, "img/sec/core": 189.5528115972072, "core_hours_Tesla V100-SXM2-32GB": 97.95062977639078, "core_hours": 97.95062977639078}
{"step": 65350, "global_schedule": 0.4288746118545532, "l2_grads": 1.7117586135864258, "l2_params": 289.8643493652344, "l2_updates": 0.4540080726146698, "training_loss": 2.089487075805664, "uptime": 24061.793332383968, "examples_seen": 66918400.0, "progress": 0.5862195789265947, "epoch": 52.75999227345656, "img/sec/core": 189.77732484790783, "core_hours_Tesla V100-SXM2-32GB": 98.02557140723957, "core_hours": 98.02557140723957}
{"step": 65400, "global_schedule": 0.4281086027622223, "l2_grads": 1.7072577476501465, "l2_params": 289.7618408203125, "l2_updates": 0.467536598443985, "training_loss": 2.223205089569092, "uptime": 24078.651053336973, "examples_seen": 66969600.0, "progress": 0.5866681019403106, "epoch": 52.800359520796626, "img/sec/core": 189.82399868409246, "core_hours_Tesla V100-SXM2-32GB": 98.10049461147516, "core_hours": 98.10049461147516}
{"step": 65450, "global_schedule": 0.4273427724838257, "l2_grads": 1.7795928716659546, "l2_params": 289.6728820800781, "l2_updates": 0.4579128623008728, "training_loss": 2.212526798248291, "uptime": 24095.520129970973, "examples_seen": 67020800.0, "progress": 0.5871166249540264, "epoch": 52.84072676813668, "img/sec/core": 189.69621571048114, "core_hours_Tesla V100-SXM2-32GB": 98.17546828540405, "core_hours": 98.17546828540405}
{"step": 65500, "global_schedule": 0.426577091217041, "l2_grads": 1.5544337034225464, "l2_params": 289.5861511230469, "l2_updates": 0.4572382867336273, "training_loss": 3.540496349334717, "uptime": 24112.392639531987, "examples_seen": 67072000.0, "progress": 0.5875651479677422, "epoch": 52.88109401547674, "img/sec/core": 189.65761959881178, "core_hours_Tesla V100-SXM2-32GB": 98.25045721678633, "core_hours": 98.25045721678633}
{"step": 65550, "global_schedule": 0.42581161856651306, "l2_grads": 1.6235475540161133, "l2_params": 289.496826171875, "l2_updates": 0.46511298418045044, "training_loss": 2.859628200531006, "uptime": 24129.26034362195, "examples_seen": 67123200.0, "progress": 0.5880136709814581, "epoch": 52.9214612628168, "img/sec/core": 189.7116515047227, "core_hours_Tesla V100-SXM2-32GB": 98.32542479051949, "core_hours": 98.32542479051949}
{"step": 65600, "global_schedule": 0.42504632472991943, "l2_grads": 1.737924575805664, "l2_params": 289.4012145996094, "l2_updates": 0.4530887007713318, "training_loss": 4.473932266235352, "uptime": 24146.123580393963, "examples_seen": 67174400.0, "progress": 0.5884621939951739, "epoch": 52.961828510156856, "img/sec/core": 189.76190889467236, "core_hours_Tesla V100-SXM2-32GB": 98.40037250950623, "core_hours": 98.40037250950623}
{"step": 65650, "global_schedule": 0.42428117990493774, "l2_grads": 1.7393897771835327, "l2_params": 289.3134460449219, "l2_updates": 0.459546834230423, "training_loss": 2.170011281967163, "uptime": 24162.985342400963, "examples_seen": 67225600.0, "progress": 0.5889107170088898, "epoch": 53.002195757496914, "img/sec/core": 189.77850586857795, "core_hours_Tesla V100-SXM2-32GB": 98.47531367398179, "core_hours": 98.47531367398179}
{"step": 65700, "global_schedule": 0.4235161542892456, "l2_grads": 1.620046615600586, "l2_params": 289.2258605957031, "l2_updates": 0.45331767201423645, "training_loss": 2.373847007751465, "uptime": 24179.861604346952, "examples_seen": 67276800.0, "progress": 0.5893592400226055, "epoch": 53.04256300483697, "img/sec/core": 189.6154498100001, "core_hours_Tesla V100-SXM2-32GB": 98.55031928263061, "core_hours": 98.55031928263061}
{"step": 65750, "global_schedule": 0.42275145649909973, "l2_grads": 1.6236008405685425, "l2_params": 289.1409912109375, "l2_updates": 0.4545418620109558, "training_loss": 2.810154676437378, "uptime": 24196.72882321599, "examples_seen": 67328000.0, "progress": 0.5898077630363214, "epoch": 53.082930252177036, "img/sec/core": 189.71710895823387, "core_hours_Tesla V100-SXM2-32GB": 98.62528469982635, "core_hours": 98.62528469982635}
{"step": 65800, "global_schedule": 0.42198681831359863, "l2_grads": 1.8431652784347534, "l2_params": 289.0490417480469, "l2_updates": 0.4549700617790222, "training_loss": 2.245148181915283, "uptime": 24213.606927630957, "examples_seen": 67379200.0, "progress": 0.5902562860500372, "epoch": 53.12329749951709, "img/sec/core": 189.59475076849395, "core_hours_Tesla V100-SXM2-32GB": 98.70029849722619, "core_hours": 98.70029849722619}
{"step": 65850, "global_schedule": 0.4212225079536438, "l2_grads": 1.6537036895751953, "l2_params": 288.97119140625, "l2_updates": 0.45884576439857483, "training_loss": 3.885260581970215, "uptime": 24230.47603996296, "examples_seen": 67430400.0, "progress": 0.5907048090637531, "epoch": 53.16366474685715, "img/sec/core": 189.69581428000248, "core_hours_Tesla V100-SXM2-32GB": 98.77527232981286, "core_hours": 98.77527232981286}
{"step": 65900, "global_schedule": 0.42045822739601135, "l2_grads": 1.8213742971420288, "l2_params": 288.8749084472656, "l2_updates": 0.4595366418361664, "training_loss": 2.2776496410369873, "uptime": 24247.354813854967, "examples_seen": 67481600.0, "progress": 0.5911533320774689, "epoch": 53.20403199419721, "img/sec/core": 189.5872307120195, "core_hours_Tesla V100-SXM2-32GB": 98.85028910266624, "core_hours": 98.85028910266624}
{"step": 65950, "global_schedule": 0.41969427466392517, "l2_grads": 1.8037786483764648, "l2_params": 288.7926330566406, "l2_updates": 0.4424515664577484, "training_loss": 2.1767687797546387, "uptime": 24264.238501239975, "examples_seen": 67532800.0, "progress": 0.5916018550911847, "epoch": 53.244399241537266, "img/sec/core": 189.53205701032687, "core_hours_Tesla V100-SXM2-32GB": 98.92532771326628, "core_hours": 98.92532771326628}
{"step": 66000, "global_schedule": 0.41893038153648376, "l2_grads": 1.674518346786499, "l2_params": 288.6923522949219, "l2_updates": 0.45003947615623474, "training_loss": 4.692806720733643, "uptime": 24281.127230141952, "examples_seen": 67584000.0, "progress": 0.5920503781049006, "epoch": 53.284766488877324, "img/sec/core": 189.47547909454929, "core_hours_Tesla V100-SXM2-32GB": 99.00038873060839, "core_hours": 99.00038873060839}
{"step": 66050, "global_schedule": 0.4181668162345886, "l2_grads": 1.6346334218978882, "l2_params": 288.602783203125, "l2_updates": 0.4495474398136139, "training_loss": 3.0626180171966553, "uptime": 24298.764775393996, "examples_seen": 67635200.0, "progress": 0.5924989011186164, "epoch": 53.32513373621738, "img/sec/core": 189.77093921111748, "core_hours_Tesla V100-SXM2-32GB": 99.07533288318173, "core_hours": 99.07533288318173}
{"step": 66100, "global_schedule": 0.41740334033966064, "l2_grads": 1.7906864881515503, "l2_params": 288.52056884765625, "l2_updates": 0.4509662985801697, "training_loss": 2.1801552772521973, "uptime": 24315.622511984955, "examples_seen": 67686400.0, "progress": 0.5929474241323323, "epoch": 53.36550098355744, "img/sec/core": 189.82382259527418, "core_hours_Tesla V100-SXM2-32GB": 99.15025615691931, "core_hours": 99.15025615691931}
{"step": 66150, "global_schedule": 0.41664016246795654, "l2_grads": 1.7734471559524536, "l2_params": 288.42718505859375, "l2_updates": 0.4442000091075897, "training_loss": 4.577991485595703, "uptime": 24332.489759460965, "examples_seen": 67737600.0, "progress": 0.593395947146048, "epoch": 53.405868230897504, "img/sec/core": 189.71678719668824, "core_hours_Tesla V100-SXM2-32GB": 99.22522170125714, "core_hours": 99.22522170125714}
{"step": 66200, "global_schedule": 0.4158770740032196, "l2_grads": 1.833275556564331, "l2_params": 288.33514404296875, "l2_updates": 0.45668885111808777, "training_loss": 2.3374011516571045, "uptime": 24349.356350699964, "examples_seen": 67788800.0, "progress": 0.5938444701597639, "epoch": 53.44623547823756, "img/sec/core": 189.72416860384828, "core_hours_Tesla V100-SXM2-32GB": 99.30018432898602, "core_hours": 99.30018432898602}
{"step": 66250, "global_schedule": 0.41511428356170654, "l2_grads": 1.7980455160140991, "l2_params": 288.2348327636719, "l2_updates": 0.45380207896232605, "training_loss": 2.2751526832580566, "uptime": 24366.22338240198, "examples_seen": 67840000.0, "progress": 0.5942929931734797, "epoch": 53.48660272557762, "img/sec/core": 189.71921417671254, "core_hours_Tesla V100-SXM2-32GB": 99.3751489143283, "core_hours": 99.3751489143283}
{"step": 66300, "global_schedule": 0.41435161232948303, "l2_grads": 1.7400140762329102, "l2_params": 288.14605712890625, "l2_updates": 0.43553945422172546, "training_loss": 4.56214714050293, "uptime": 24383.116328779957, "examples_seen": 67891200.0, "progress": 0.5947415161871956, "epoch": 53.526969972917676, "img/sec/core": 189.4281748370114, "core_hours_Tesla V100-SXM2-32GB": 99.45022867600822, "core_hours": 99.45022867600822}
{"step": 66350, "global_schedule": 0.4135892391204834, "l2_grads": 1.6589593887329102, "l2_params": 288.0528869628906, "l2_updates": 0.44372332096099854, "training_loss": 2.5292325019836426, "uptime": 24399.96203726495, "examples_seen": 67942400.0, "progress": 0.5951900392009114, "epoch": 53.567337220257734, "img/sec/core": 189.9593598482654, "core_hours_Tesla V100-SXM2-32GB": 99.52509849149709, "core_hours": 99.52509849149709}
{"step": 66400, "global_schedule": 0.4128269553184509, "l2_grads": 1.639290452003479, "l2_params": 287.9547119140625, "l2_updates": 0.43979743123054504, "training_loss": 3.0275917053222656, "uptime": 24416.832805863, "examples_seen": 67993600.0, "progress": 0.5956385622146272, "epoch": 53.60770446759779, "img/sec/core": 189.67719113699698, "core_hours_Tesla V100-SXM2-32GB": 99.60007968526618, "core_hours": 99.60007968526618}
{"step": 66450, "global_schedule": 0.4120650291442871, "l2_grads": 1.7570500373840332, "l2_params": 287.8694152832031, "l2_updates": 0.44907858967781067, "training_loss": 2.2712135314941406, "uptime": 24433.696634856984, "examples_seen": 68044800.0, "progress": 0.5960870852283431, "epoch": 53.64807171493785, "img/sec/core": 189.75524485817976, "core_hours_Tesla V100-SXM2-32GB": 99.67503003635056, "core_hours": 99.67503003635056}
{"step": 66500, "global_schedule": 0.41130316257476807, "l2_grads": 1.7242567539215088, "l2_params": 287.7770690917969, "l2_updates": 0.441745400428772, "training_loss": 2.25346040725708, "uptime": 24450.57529679098, "examples_seen": 68096000.0, "progress": 0.5965356082420589, "epoch": 53.688438962277914, "img/sec/core": 189.58848826487122, "core_hours_Tesla V100-SXM2-32GB": 99.75004631161276, "core_hours": 99.75004631161276}
{"step": 66550, "global_schedule": 0.4105416238307953, "l2_grads": 1.7270005941390991, "l2_params": 287.6883544921875, "l2_updates": 0.44212278723716736, "training_loss": 2.0641307830810547, "uptime": 24467.446741818974, "examples_seen": 68147200.0, "progress": 0.5969841312557748, "epoch": 53.72880620961797, "img/sec/core": 189.66958637450523, "core_hours_Tesla V100-SXM2-32GB": 99.82503051173718, "core_hours": 99.82503051173718}
{"step": 66600, "global_schedule": 0.40978020429611206, "l2_grads": 1.7863717079162598, "l2_params": 287.6007385253906, "l2_updates": 0.44025981426239014, "training_loss": 2.2073357105255127, "uptime": 24484.306508723996, "examples_seen": 68198400.0, "progress": 0.5974326542694905, "epoch": 53.76917345695803, "img/sec/core": 189.8009633245247, "core_hours_Tesla V100-SXM2-32GB": 99.89996280909283, "core_hours": 99.89996280909283}
{"step": 66650, "global_schedule": 0.4090191125869751, "l2_grads": 1.7448203563690186, "l2_params": 287.50628662109375, "l2_updates": 0.4423699378967285, "training_loss": 2.06449818611145, "uptime": 24501.17681951396, "examples_seen": 68249600.0, "progress": 0.5978811772832064, "epoch": 53.80954070429809, "img/sec/core": 189.68233838962288, "core_hours_Tesla V100-SXM2-32GB": 99.97494196815934, "core_hours": 99.97494196815934}
{"step": 66700, "global_schedule": 0.4082581102848053, "l2_grads": 1.6306147575378418, "l2_params": 287.4222106933594, "l2_updates": 0.44047972559928894, "training_loss": 4.0894598960876465, "uptime": 24518.05082000798, "examples_seen": 68300800.0, "progress": 0.5983297002969222, "epoch": 53.849907951638144, "img/sec/core": 189.64086205486467, "core_hours_Tesla V100-SXM2-32GB": 100.04993752591054, "core_hours": 100.04993752591054}
{"step": 66750, "global_schedule": 0.40749746561050415, "l2_grads": 1.7757190465927124, "l2_params": 287.3262023925781, "l2_updates": 0.44190600514411926, "training_loss": 2.3473453521728516, "uptime": 24534.906168674002, "examples_seen": 68352000.0, "progress": 0.598778223310638, "epoch": 53.8902751989782, "img/sec/core": 189.85071524805545, "core_hours_Tesla V100-SXM2-32GB": 100.12485018664842, "core_hours": 100.12485018664842}
{"step": 66800, "global_schedule": 0.40673691034317017, "l2_grads": 1.8264137506484985, "l2_params": 287.2408142089844, "l2_updates": 0.4372616410255432, "training_loss": 2.190422773361206, "uptime": 24551.756589847966, "examples_seen": 68403200.0, "progress": 0.5992267463243539, "epoch": 53.93064244631826, "img/sec/core": 189.90623242963542, "core_hours_Tesla V100-SXM2-32GB": 100.19974094742159, "core_hours": 100.19974094742159}
{"step": 66850, "global_schedule": 0.40597668290138245, "l2_grads": 1.6103368997573853, "l2_params": 287.1578369140625, "l2_updates": 0.43676942586898804, "training_loss": 4.010396957397461, "uptime": 24568.608675864, "examples_seen": 68454400.0, "progress": 0.5996752693380697, "epoch": 53.971009693658324, "img/sec/core": 189.88747131691125, "core_hours_Tesla V100-SXM2-32GB": 100.27463910749286, "core_hours": 100.27463910749286}
{"step": 66900, "global_schedule": 0.4052165746688843, "l2_grads": 1.788910150527954, "l2_params": 287.0711364746094, "l2_updates": 0.4325239956378937, "training_loss": 2.2951903343200684, "uptime": 24585.474613089988, "examples_seen": 68505600.0, "progress": 0.6001237923517856, "epoch": 54.01137694099838, "img/sec/core": 189.73152556678468, "core_hours_Tesla V100-SXM2-32GB": 100.34959882849724, "core_hours": 100.34959882849724}
{"step": 66950, "global_schedule": 0.40445682406425476, "l2_grads": 1.6328837871551514, "l2_params": 286.9840393066406, "l2_updates": 0.44101810455322266, "training_loss": 4.410321235656738, "uptime": 24602.331580042955, "examples_seen": 68556800.0, "progress": 0.6005723153655014, "epoch": 54.05174418833844, "img/sec/core": 189.83248937535538, "core_hours_Tesla V100-SXM2-32GB": 100.42451868162154, "core_hours": 100.42451868162154}
{"step": 67000, "global_schedule": 0.4036971926689148, "l2_grads": 1.5935479402542114, "l2_params": 286.902099609375, "l2_updates": 0.44141966104507446, "training_loss": 4.483743667602539, "uptime": 24619.196957762993, "examples_seen": 68608000.0, "progress": 0.6010208383792173, "epoch": 54.0921114356785, "img/sec/core": 189.73781987687383, "core_hours_Tesla V100-SXM2-32GB": 100.49947591593282, "core_hours": 100.49947591593282}
{"step": 67050, "global_schedule": 0.4029378890991211, "l2_grads": 1.678886890411377, "l2_params": 286.8101806640625, "l2_updates": 0.44133442640304565, "training_loss": 2.0511579513549805, "uptime": 24636.566676821967, "examples_seen": 68659200.0, "progress": 0.601469361392933, "epoch": 54.132478683018554, "img/sec/core": 189.5790846669202, "core_hours_Tesla V100-SXM2-32GB": 100.57449591219037, "core_hours": 100.57449591219037}
{"step": 67100, "global_schedule": 0.40217870473861694, "l2_grads": 1.763814091682434, "l2_params": 286.71697998046875, "l2_updates": 0.4400878846645355, "training_loss": 2.074815511703491, "uptime": 24653.423730749986, "examples_seen": 68710400.0, "progress": 0.601917884406649, "epoch": 54.17284593035861, "img/sec/core": 189.83150992244904, "core_hours_Tesla V100-SXM2-32GB": 100.64941615187045, "core_hours": 100.64941615187045}
{"step": 67150, "global_schedule": 0.40141984820365906, "l2_grads": 1.6888796091079712, "l2_params": 286.6222839355469, "l2_updates": 0.440341979265213, "training_loss": 4.385763645172119, "uptime": 24670.301585646986, "examples_seen": 68761600.0, "progress": 0.6023664074203647, "epoch": 54.21321317769867, "img/sec/core": 189.59755368964122, "core_hours_Tesla V100-SXM2-32GB": 100.72442884030156, "core_hours": 100.72442884030156}
{"step": 67200, "global_schedule": 0.4006611406803131, "l2_grads": 1.8954877853393555, "l2_params": 286.5411071777344, "l2_updates": 0.43145260214805603, "training_loss": 2.388012409210205, "uptime": 24687.177932502003, "examples_seen": 68812800.0, "progress": 0.6028149304340805, "epoch": 54.253580425038734, "img/sec/core": 189.61449580829898, "core_hours_Tesla V100-SXM2-32GB": 100.79943482632387, "core_hours": 100.79943482632387}
{"step": 67250, "global_schedule": 0.3999027907848358, "l2_grads": 1.723536491394043, "l2_params": 286.4524230957031, "l2_updates": 0.4347180128097534, "training_loss": 2.189682722091675, "uptime": 24704.050120186992, "examples_seen": 68864000.0, "progress": 0.6032634534477964, "epoch": 54.29394767237879, "img/sec/core": 189.6612377568014, "core_hours_Tesla V100-SXM2-32GB": 100.87442232714604, "core_hours": 100.87442232714604}
{"step": 67300, "global_schedule": 0.3991445302963257, "l2_grads": 1.7066764831542969, "l2_params": 286.36883544921875, "l2_updates": 0.4315582513809204, "training_loss": 3.8863677978515625, "uptime": 24720.92443220096, "examples_seen": 68915200.0, "progress": 0.6037119764615122, "epoch": 54.33431491971885, "img/sec/core": 189.63736105808712, "core_hours_Tesla V100-SXM2-32GB": 100.94941926943035, "core_hours": 100.94941926943035}
{"step": 67350, "global_schedule": 0.3983866572380066, "l2_grads": 1.6388654708862305, "l2_params": 286.2739562988281, "l2_updates": 0.43245604634284973, "training_loss": 2.9067513942718506, "uptime": 24737.79896998295, "examples_seen": 68966400.0, "progress": 0.6041604994752281, "epoch": 54.37468216705891, "img/sec/core": 189.63482385964468, "core_hours_Tesla V100-SXM2-32GB": 101.02441721512807, "core_hours": 101.02441721512807}
{"step": 67400, "global_schedule": 0.39762890338897705, "l2_grads": 1.7489997148513794, "l2_params": 286.1879577636719, "l2_updates": 0.4339201748371124, "training_loss": 2.2427215576171875, "uptime": 24754.674031094997, "examples_seen": 69017600.0, "progress": 0.6046090224889439, "epoch": 54.415049414398965, "img/sec/core": 189.62894289699742, "core_hours_Tesla V100-SXM2-32GB": 101.09941748673717, "core_hours": 101.09941748673717}
{"step": 67450, "global_schedule": 0.39687153697013855, "l2_grads": 1.8016246557235718, "l2_params": 286.1084289550781, "l2_updates": 0.4368562400341034, "training_loss": 2.185126781463623, "uptime": 24771.566339818004, "examples_seen": 69068800.0, "progress": 0.6050575455026598, "epoch": 54.45541666173902, "img/sec/core": 189.4353254177558, "core_hours_Tesla V100-SXM2-32GB": 101.17449441439499, "core_hours": 101.17449441439499}
{"step": 67500, "global_schedule": 0.3961142599582672, "l2_grads": 1.9011818170547485, "l2_params": 286.003662109375, "l2_updates": 0.4164557158946991, "training_loss": 2.201624870300293, "uptime": 24788.439474102983, "examples_seen": 69120000.0, "progress": 0.6055060685163756, "epoch": 54.49578390907908, "img/sec/core": 189.65059756851414, "core_hours_Tesla V100-SXM2-32GB": 101.24948612232821, "core_hours": 101.24948612232821, "minival/prec@1": 0.7173743365594755, "minival/loss": 1.1634593419346853, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.9058017560164444, "real/prec@1": 0.7604244507547452, "real/loss": 1.9624801281613962, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.1845931619755, "train/prec@1": 0.7480388713265426, "train/loss": 1.009167532784428, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.566378959978465, "v2/prec@1": 0.5565, "v2/loss": 1.9484841918945313, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.341090453963261, "val/prec@1": 0.68402, "val/loss": 1.2986150170898438, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.342969553952571}
{"step": 67551, "global_schedule": 0.3953573703765869, "l2_grads": 1.6195716857910156, "l2_params": 285.9176330566406, "l2_updates": 0.43003049492836, "training_loss": 3.2281529903411865, "uptime": 24841.66756289499, "examples_seen": 69171200.0, "progress": 0.6059545915300915, "epoch": 54.536151156419145, "img/sec/core": 189.51452494067448, "core_hours_Tesla V100-SXM2-32GB": 101.32453167478216, "core_hours": 101.32453167478216}
{"step": 67600, "global_schedule": 0.39460062980651855, "l2_grads": 1.668451189994812, "l2_params": 285.8193664550781, "l2_updates": 0.4254881739616394, "training_loss": 2.6345157623291016, "uptime": 24858.514523827995, "examples_seen": 69222400.0, "progress": 0.6064031145438072, "epoch": 54.5765184037592, "img/sec/core": 189.94523776277572, "core_hours_Tesla V100-SXM2-32GB": 101.39940705670665, "core_hours": 101.39940705670665}
{"step": 67650, "global_schedule": 0.39384421706199646, "l2_grads": 1.794534683227539, "l2_params": 285.73822021484375, "l2_updates": 0.43456515669822693, "training_loss": 2.1344780921936035, "uptime": 24875.38945801597, "examples_seen": 69273600.0, "progress": 0.606851637557523, "epoch": 54.61688565109926, "img/sec/core": 189.63036918274463, "core_hours_Tesla V100-SXM2-32GB": 101.47440676420875, "core_hours": 101.47440676420875}
{"step": 67700, "global_schedule": 0.3930879831314087, "l2_grads": 1.883678913116455, "l2_params": 285.6534729003906, "l2_updates": 0.4273354411125183, "training_loss": 2.3071951866149902, "uptime": 24892.243203054997, "examples_seen": 69324800.0, "progress": 0.6073001605712389, "epoch": 54.65725289843932, "img/sec/core": 189.86877946650378, "core_hours_Tesla V100-SXM2-32GB": 101.54931229771555, "core_hours": 101.54931229771555}
{"step": 67750, "global_schedule": 0.3923320770263672, "l2_grads": 1.5786486864089966, "l2_params": 285.55535888671875, "l2_updates": 0.4207765460014343, "training_loss": 3.424917221069336, "uptime": 24909.115145596967, "examples_seen": 69376000.0, "progress": 0.6077486835849547, "epoch": 54.697620145779375, "img/sec/core": 189.6639934636988, "core_hours_Tesla V100-SXM2-32GB": 101.62429870901319, "core_hours": 101.62429870901319}
{"step": 67800, "global_schedule": 0.39157634973526, "l2_grads": 1.6835880279541016, "l2_params": 285.4563293457031, "l2_updates": 0.4303424060344696, "training_loss": 3.4558639526367188, "uptime": 24925.984635056986, "examples_seen": 69427200.0, "progress": 0.6081972065986706, "epoch": 54.73798739311943, "img/sec/core": 189.69157351110024, "core_hours_Tesla V100-SXM2-32GB": 101.6992742177244, "core_hours": 101.6992742177244}
{"step": 67850, "global_schedule": 0.3908209204673767, "l2_grads": 1.745805025100708, "l2_params": 285.3584289550781, "l2_updates": 0.4211302697658539, "training_loss": 2.1303749084472656, "uptime": 24942.824909871968, "examples_seen": 69478400.0, "progress": 0.6086457296123864, "epoch": 54.77835464045949, "img/sec/core": 190.02065198800182, "core_hours_Tesla V100-SXM2-32GB": 101.77411988356876, "core_hours": 101.77411988356876}
{"step": 67900, "global_schedule": 0.3900657892227173, "l2_grads": 1.6931015253067017, "l2_params": 285.26239013671875, "l2_updates": 0.4229886829853058, "training_loss": 4.611380577087402, "uptime": 24959.709553111985, "examples_seen": 69529600.0, "progress": 0.6090942526261023, "epoch": 54.818721887799555, "img/sec/core": 189.52132742822465, "core_hours_Tesla V100-SXM2-32GB": 101.84916274241327, "core_hours": 101.84916274241327}
{"step": 67950, "global_schedule": 0.38931089639663696, "l2_grads": 1.6180760860443115, "l2_params": 285.1762390136719, "l2_updates": 0.4327656924724579, "training_loss": 2.505251884460449, "uptime": 24976.580892420956, "examples_seen": 69580800.0, "progress": 0.6095427756398181, "epoch": 54.85908913513961, "img/sec/core": 189.6707748802402, "core_hours_Tesla V100-SXM2-32GB": 101.92414647267536, "core_hours": 101.92414647267536}
{"step": 68000, "global_schedule": 0.38855624198913574, "l2_grads": 1.7741553783416748, "l2_params": 285.09649658203125, "l2_updates": 0.41355201601982117, "training_loss": 4.489912986755371, "uptime": 24993.450724084978, "examples_seen": 69632000.0, "progress": 0.609991298653534, "epoch": 54.89945638247967, "img/sec/core": 189.68772562352083, "core_hours_Tesla V100-SXM2-32GB": 101.99912350229324, "core_hours": 101.99912350229324}
{"step": 68050, "global_schedule": 0.3878018856048584, "l2_grads": 1.7461873292922974, "l2_params": 285.0106506347656, "l2_updates": 0.41909152269363403, "training_loss": 4.299379348754883, "uptime": 25010.858739655, "examples_seen": 69683200.0, "progress": 0.6104398216672497, "epoch": 54.93982362981973, "img/sec/core": 189.75955956884178, "core_hours_Tesla V100-SXM2-32GB": 102.0740721491732, "core_hours": 102.0740721491732}
{"step": 68100, "global_schedule": 0.38704779744148254, "l2_grads": 1.7787922620773315, "l2_params": 284.91192626953125, "l2_updates": 0.4258500337600708, "training_loss": 2.2605299949645996, "uptime": 25027.73018996499, "examples_seen": 69734400.0, "progress": 0.6108883446809655, "epoch": 54.980190877159785, "img/sec/core": 189.66952699407412, "core_hours_Tesla V100-SXM2-32GB": 102.14905637277316, "core_hours": 102.14905637277316}
{"step": 68150, "global_schedule": 0.3862939774990082, "l2_grads": 1.5910910367965698, "l2_params": 284.8252868652344, "l2_updates": 0.41160300374031067, "training_loss": 4.098543643951416, "uptime": 25044.62006926199, "examples_seen": 69785600.0, "progress": 0.6113368676946814, "epoch": 55.02055812449984, "img/sec/core": 189.46257363535432, "core_hours_Tesla V100-SXM2-32GB": 102.22412250298204, "core_hours": 102.22412250298204}
{"step": 68200, "global_schedule": 0.3855404257774353, "l2_grads": 1.789249300956726, "l2_params": 284.7331848144531, "l2_updates": 0.4219832122325897, "training_loss": 2.0406103134155273, "uptime": 25061.50276962499, "examples_seen": 69836800.0, "progress": 0.6117853907083972, "epoch": 55.0609253718399, "img/sec/core": 189.54313772062193, "core_hours_Tesla V100-SXM2-32GB": 102.2991567268176, "core_hours": 102.2991567268176}
{"step": 68251, "global_schedule": 0.3847871422767639, "l2_grads": 1.641791820526123, "l2_params": 284.6445617675781, "l2_updates": 0.4138590395450592, "training_loss": 3.4974799156188965, "uptime": 25078.366081493965, "examples_seen": 69888000.0, "progress": 0.6122339137221131, "epoch": 55.10129261917996, "img/sec/core": 189.76106383273216, "core_hours_Tesla V100-SXM2-32GB": 102.3741047795686, "core_hours": 102.3741047795686}
{"step": 68300, "global_schedule": 0.3840342164039612, "l2_grads": 1.840545892715454, "l2_params": 284.5609130859375, "l2_updates": 0.4134843349456787, "training_loss": 2.270934581756592, "uptime": 25095.258649493975, "examples_seen": 69939200.0, "progress": 0.6126824367358289, "epoch": 55.14165986652002, "img/sec/core": 189.4324178537014, "core_hours_Tesla V100-SXM2-32GB": 102.44918285956865, "core_hours": 102.44918285956865}
{"step": 68350, "global_schedule": 0.383281409740448, "l2_grads": 1.6957961320877075, "l2_params": 284.46630859375, "l2_updates": 0.4168878197669983, "training_loss": 2.425034761428833, "uptime": 25112.147419130953, "examples_seen": 69990400.0, "progress": 0.6131309597495448, "epoch": 55.18202711386008, "img/sec/core": 189.47502208766693, "core_hours_Tesla V100-SXM2-32GB": 102.52424405795522, "core_hours": 102.52424405795522}
{"step": 68400, "global_schedule": 0.38252902030944824, "l2_grads": 1.9249471426010132, "l2_params": 284.3825378417969, "l2_updates": 0.4137437343597412, "training_loss": 2.200134754180908, "uptime": 25129.03136055899, "examples_seen": 70041600.0, "progress": 0.6135794827632606, "epoch": 55.22239436120014, "img/sec/core": 189.52920522965695, "core_hours_Tesla V100-SXM2-32GB": 102.59928379763538, "core_hours": 102.59928379763538}
{"step": 68450, "global_schedule": 0.3817768096923828, "l2_grads": 1.7314226627349854, "l2_params": 284.2886047363281, "l2_updates": 0.40389397740364075, "training_loss": 4.429388046264648, "uptime": 25145.90236246196, "examples_seen": 70092800.0, "progress": 0.6140280057769765, "epoch": 55.262761608540195, "img/sec/core": 189.67456813795417, "core_hours_Tesla V100-SXM2-32GB": 102.67426602831524, "core_hours": 102.67426602831524}
{"step": 68500, "global_schedule": 0.3810250163078308, "l2_grads": 1.7115639448165894, "l2_params": 284.1986083984375, "l2_updates": 0.416233628988266, "training_loss": 2.023279905319214, "uptime": 25162.77166117, "examples_seen": 70144000.0, "progress": 0.6144765287906923, "epoch": 55.30312885588025, "img/sec/core": 189.69371847534373, "core_hours_Tesla V100-SXM2-32GB": 102.74924068923988, "core_hours": 102.74924068923988}
{"step": 68550, "global_schedule": 0.38027334213256836, "l2_grads": 1.7143967151641846, "l2_params": 284.1141357421875, "l2_updates": 0.4115246534347534, "training_loss": 4.355091094970703, "uptime": 25179.640447841957, "examples_seen": 70195200.0, "progress": 0.614925051804408, "epoch": 55.34349610322031, "img/sec/core": 189.69947644900907, "core_hours_Tesla V100-SXM2-32GB": 102.82421307444858, "core_hours": 102.82421307444858}
{"step": 68600, "global_schedule": 0.37952208518981934, "l2_grads": 1.779004693031311, "l2_params": 284.0248718261719, "l2_updates": 0.4129893481731415, "training_loss": 2.122040033340454, "uptime": 25196.542802320968, "examples_seen": 70246400.0, "progress": 0.6153735748181239, "epoch": 55.38386335056037, "img/sec/core": 189.32273630716685, "core_hours_Tesla V100-SXM2-32GB": 102.89933464991084, "core_hours": 102.89933464991084}
{"step": 68650, "global_schedule": 0.37877100706100464, "l2_grads": 1.738327145576477, "l2_params": 283.9414978027344, "l2_updates": 0.41209304332733154, "training_loss": 2.1409292221069336, "uptime": 25213.420074344962, "examples_seen": 70297600.0, "progress": 0.6158220978318397, "epoch": 55.42423059790043, "img/sec/core": 189.60410162558483, "core_hours_Tesla V100-SXM2-32GB": 102.97434474779526, "core_hours": 102.97434474779526}
{"step": 68700, "global_schedule": 0.37802034616470337, "l2_grads": 1.7599337100982666, "l2_params": 283.84967041015625, "l2_updates": 0.4150678217411041, "training_loss": 2.2119364738464355, "uptime": 25230.287257890974, "examples_seen": 70348800.0, "progress": 0.6162706208455556, "epoch": 55.46459784524049, "img/sec/core": 189.71750626124128, "core_hours_Tesla V100-SXM2-32GB": 103.04931000799975, "core_hours": 103.04931000799975}
{"step": 68750, "global_schedule": 0.3772698640823364, "l2_grads": 1.7147345542907715, "l2_params": 283.7654113769531, "l2_updates": 0.4127611219882965, "training_loss": 2.2792105674743652, "uptime": 25247.135413843964, "examples_seen": 70400000.0, "progress": 0.6167191438592714, "epoch": 55.50496509258055, "img/sec/core": 189.93176516935634, "core_hours_Tesla V100-SXM2-32GB": 103.12419070112416, "core_hours": 103.12419070112416}
{"step": 68800, "global_schedule": 0.3765197694301605, "l2_grads": 1.7318309545516968, "l2_params": 283.6815490722656, "l2_updates": 0.40801557898521423, "training_loss": 4.270578384399414, "uptime": 25264.008106426976, "examples_seen": 70451200.0, "progress": 0.6171676668729873, "epoch": 55.545332339920606, "img/sec/core": 189.65556233874574, "core_hours_Tesla V100-SXM2-32GB": 103.19918044593754, "core_hours": 103.19918044593754}
{"step": 68850, "global_schedule": 0.37576988339424133, "l2_grads": 1.724568247795105, "l2_params": 283.59881591796875, "l2_updates": 0.40785783529281616, "training_loss": 2.0400869846343994, "uptime": 25280.873833887978, "examples_seen": 70502400.0, "progress": 0.6176161898867031, "epoch": 55.58569958726066, "img/sec/core": 189.73388532450565, "core_hours_Tesla V100-SXM2-32GB": 103.2741392346531, "core_hours": 103.2741392346531}
{"step": 68900, "global_schedule": 0.3750203847885132, "l2_grads": 1.7674167156219482, "l2_params": 283.4993896484375, "l2_updates": 0.4127112925052643, "training_loss": 2.402669668197632, "uptime": 25297.744924620958, "examples_seen": 70553600.0, "progress": 0.6180647129004189, "epoch": 55.62606683460072, "img/sec/core": 189.6735694595292, "core_hours_Tesla V100-SXM2-32GB": 103.34912186013301, "core_hours": 103.34912186013301}
{"step": 68950, "global_schedule": 0.37427109479904175, "l2_grads": 1.6450763940811157, "l2_params": 283.4052429199219, "l2_updates": 0.3999689519405365, "training_loss": 4.185168266296387, "uptime": 25314.62932336895, "examples_seen": 70604800.0, "progress": 0.6185132359141348, "epoch": 55.66643408194078, "img/sec/core": 189.52407176361666, "core_hours_Tesla V100-SXM2-32GB": 103.42416363234632, "core_hours": 103.42416363234632}
{"step": 69000, "global_schedule": 0.37352219223976135, "l2_grads": 1.7115576267242432, "l2_params": 283.32232666015625, "l2_updates": 0.40171805024147034, "training_loss": 3.265559196472168, "uptime": 25331.493887811957, "examples_seen": 70656000.0, "progress": 0.6189617589278505, "epoch": 55.70680132928084, "img/sec/core": 189.74696979659498, "core_hours_Tesla V100-SXM2-32GB": 103.49911725209303, "core_hours": 103.49911725209303}
{"step": 69050, "global_schedule": 0.37277349829673767, "l2_grads": 1.6039282083511353, "l2_params": 283.2217102050781, "l2_updates": 0.40522441267967224, "training_loss": 3.1808547973632812, "uptime": 25348.92897357, "examples_seen": 70707200.0, "progress": 0.6194102819415664, "epoch": 55.7471685766209, "img/sec/core": 189.7316151560105, "core_hours_Tesla V100-SXM2-32GB": 103.57407693770223, "core_hours": 103.57407693770223}
{"step": 69100, "global_schedule": 0.37202519178390503, "l2_grads": 1.8882126808166504, "l2_params": 283.1430358886719, "l2_updates": 0.40548568964004517, "training_loss": 2.2163825035095215, "uptime": 25365.788493866974, "examples_seen": 70758400.0, "progress": 0.6198588049552822, "epoch": 55.78753582396096, "img/sec/core": 189.8037395864943, "core_hours_Tesla V100-SXM2-32GB": 103.6490081390221, "core_hours": 103.6490081390221}
{"step": 69150, "global_schedule": 0.3712771236896515, "l2_grads": 1.801463007926941, "l2_params": 283.0565185546875, "l2_updates": 0.4027225971221924, "training_loss": 2.0764474868774414, "uptime": 25382.66208976897, "examples_seen": 70809600.0, "progress": 0.6203073279689981, "epoch": 55.827903071301016, "img/sec/core": 189.6454092290508, "core_hours_Tesla V100-SXM2-32GB": 103.72400189858654, "core_hours": 103.72400189858654}
{"step": 69200, "global_schedule": 0.3705294728279114, "l2_grads": 1.7654767036437988, "l2_params": 282.97467041015625, "l2_updates": 0.40419262647628784, "training_loss": 2.316094398498535, "uptime": 25399.520993019978, "examples_seen": 70860800.0, "progress": 0.6207558509827139, "epoch": 55.86827031864107, "img/sec/core": 189.8106865171671, "core_hours_Tesla V100-SXM2-32GB": 103.7989303574799, "core_hours": 103.7989303574799}
{"step": 69250, "global_schedule": 0.3697819709777832, "l2_grads": 1.774693250656128, "l2_params": 282.8824462890625, "l2_updates": 0.4029729962348938, "training_loss": 2.2458457946777344, "uptime": 25416.39721530996, "examples_seen": 70912000.0, "progress": 0.6212043739964298, "epoch": 55.90863756598113, "img/sec/core": 189.61589537129552, "core_hours_Tesla V100-SXM2-32GB": 103.87393578987982, "core_hours": 103.87393578987982}
{"step": 69300, "global_schedule": 0.36903494596481323, "l2_grads": 1.8146857023239136, "l2_params": 282.7875671386719, "l2_updates": 0.40092986822128296, "training_loss": 2.277240514755249, "uptime": 25433.248142584984, "examples_seen": 70963200.0, "progress": 0.6216528970101456, "epoch": 55.94900481332119, "img/sec/core": 189.90052878235758, "core_hours_Tesla V100-SXM2-32GB": 103.94882879999105, "core_hours": 103.94882879999105}
{"step": 69350, "global_schedule": 0.3682880997657776, "l2_grads": 1.6367878913879395, "l2_params": 282.705322265625, "l2_updates": 0.3945598006248474, "training_loss": 3.651383876800537, "uptime": 25450.116088560957, "examples_seen": 71014400.0, "progress": 0.6221014200238614, "epoch": 55.98937206066125, "img/sec/core": 189.7089310434172, "core_hours_Tesla V100-SXM2-32GB": 104.02379744877315, "core_hours": 104.02379744877315}
{"step": 69400, "global_schedule": 0.36754167079925537, "l2_grads": 1.8255794048309326, "l2_params": 282.6086730957031, "l2_updates": 0.39964812994003296, "training_loss": 2.068286895751953, "uptime": 25466.98185311799, "examples_seen": 71065600.0, "progress": 0.6225499430375773, "epoch": 56.02973930800131, "img/sec/core": 189.7334680072526, "core_hours_Tesla V100-SXM2-32GB": 104.09875640235995, "core_hours": 104.09875640235995}
{"step": 69450, "global_schedule": 0.36679548025131226, "l2_grads": 1.8194911479949951, "l2_params": 282.51922607421875, "l2_updates": 0.408390611410141, "training_loss": 2.115497350692749, "uptime": 25483.83432325197, "examples_seen": 71116800.0, "progress": 0.622998466051293, "epoch": 56.07010655534137, "img/sec/core": 189.88314321639118, "core_hours_Tesla V100-SXM2-32GB": 104.17365626962209, "core_hours": 104.17365626962209}
{"step": 69500, "global_schedule": 0.36604970693588257, "l2_grads": 1.8032699823379517, "l2_params": 282.4411926269531, "l2_updates": 0.39580535888671875, "training_loss": 4.545413494110107, "uptime": 25500.713510003, "examples_seen": 71168000.0, "progress": 0.623446989065009, "epoch": 56.110473802681426, "img/sec/core": 189.5825934744602, "core_hours_Tesla V100-SXM2-32GB": 104.24867487740444, "core_hours": 104.24867487740444}
{"step": 69550, "global_schedule": 0.3653041124343872, "l2_grads": 1.9666447639465332, "l2_params": 282.35272216796875, "l2_updates": 0.3846537172794342, "training_loss": 2.0915300846099854, "uptime": 25517.576822314004, "examples_seen": 71219200.0, "progress": 0.6238955120787247, "epoch": 56.150841050021484, "img/sec/core": 189.761058858627, "core_hours_Tesla V100-SXM2-32GB": 104.32362293212002, "core_hours": 104.32362293212002}
{"step": 69600, "global_schedule": 0.36455899477005005, "l2_grads": 1.676929235458374, "l2_params": 282.2587585449219, "l2_updates": 0.39895379543304443, "training_loss": 4.456624984741211, "uptime": 25534.423080345965, "examples_seen": 71270400.0, "progress": 0.6243440350924406, "epoch": 56.19120829736154, "img/sec/core": 189.95316312553797, "core_hours_Tesla V100-SXM2-32GB": 104.39849519003984, "core_hours": 104.39849519003984}
{"step": 69650, "global_schedule": 0.3638140559196472, "l2_grads": 1.6985682249069214, "l2_params": 282.1737365722656, "l2_updates": 0.40139782428741455, "training_loss": 3.18381929397583, "uptime": 25551.285083636, "examples_seen": 71321600.0, "progress": 0.6247925581061564, "epoch": 56.2315755447016, "img/sec/core": 189.77579027581396, "core_hours_Tesla V100-SXM2-32GB": 104.47343742688444, "core_hours": 104.47343742688444}
{"step": 69700, "global_schedule": 0.3630695939064026, "l2_grads": 1.8031262159347534, "l2_params": 282.0863037109375, "l2_updates": 0.3903128504753113, "training_loss": 2.0981173515319824, "uptime": 25568.144734020985, "examples_seen": 71372800.0, "progress": 0.6252410811198723, "epoch": 56.27194279204166, "img/sec/core": 189.8022750726833, "core_hours_Tesla V100-SXM2-32GB": 104.54836920637327, "core_hours": 104.54836920637327}
{"step": 69750, "global_schedule": 0.3623253107070923, "l2_grads": 1.6666587591171265, "l2_params": 281.9951477050781, "l2_updates": 0.39088815450668335, "training_loss": 4.097579479217529, "uptime": 25585.007558817975, "examples_seen": 71424000.0, "progress": 0.6256896041335881, "epoch": 56.31231003938172, "img/sec/core": 189.7665449605568, "core_hours_Tesla V100-SXM2-32GB": 104.6233150943599, "core_hours": 104.6233150943599}
{"step": 69800, "global_schedule": 0.3615814745426178, "l2_grads": 1.6246891021728516, "l2_params": 281.90045166015625, "l2_updates": 0.39280882477760315, "training_loss": 2.664900779724121, "uptime": 25601.88100949698, "examples_seen": 71475200.0, "progress": 0.6261381271473039, "epoch": 56.35267728672178, "img/sec/core": 189.6470414306802, "core_hours_Tesla V100-SXM2-32GB": 104.6983082084888, "core_hours": 104.6983082084888}
{"step": 69850, "global_schedule": 0.3608378767967224, "l2_grads": 1.541180968284607, "l2_params": 281.8094177246094, "l2_updates": 0.3870430290699005, "training_loss": 3.388698101043701, "uptime": 25618.740922605968, "examples_seen": 71526400.0, "progress": 0.6265866501610198, "epoch": 56.393044534061836, "img/sec/core": 189.7993174291219, "core_hours_Tesla V100-SXM2-32GB": 104.77324115563987, "core_hours": 104.77324115563987}
{"step": 69900, "global_schedule": 0.36009472608566284, "l2_grads": 1.7623326778411865, "l2_params": 281.7129211425781, "l2_updates": 0.3858564794063568, "training_loss": 2.6272263526916504, "uptime": 25635.610127997992, "examples_seen": 71577600.0, "progress": 0.6270351731747356, "epoch": 56.433411781401894, "img/sec/core": 189.69476781123328, "core_hours_Tesla V100-SXM2-32GB": 104.84821540182664, "core_hours": 104.84821540182664}
{"step": 69950, "global_schedule": 0.3593517541885376, "l2_grads": 1.8171793222427368, "l2_params": 281.62249755859375, "l2_updates": 0.3970443308353424, "training_loss": 2.2385339736938477, "uptime": 25652.463961656962, "examples_seen": 71628800.0, "progress": 0.6274836961884515, "epoch": 56.47377902874195, "img/sec/core": 189.86778110847757, "core_hours_Tesla V100-SXM2-32GB": 104.92312132919983, "core_hours": 104.92312132919983}
{"step": 70000, "global_schedule": 0.3586091697216034, "l2_grads": 1.7218706607818604, "l2_params": 281.53997802734375, "l2_updates": 0.3866593539714813, "training_loss": 2.728565216064453, "uptime": 25669.325717500993, "examples_seen": 71680000.0, "progress": 0.6279322192021672, "epoch": 56.51414627608201, "img/sec/core": 189.77857523259, "core_hours_Tesla V100-SXM2-32GB": 104.99806246628441, "core_hours": 104.99806246628441, "minival/prec@1": 0.7225257571027162, "minival/loss": 1.1153669544878582, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.876395897998009, "real/prec@1": 0.768772551615176, "real/loss": 1.9123820908733347, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.176025903027039, "train/prec@1": 0.7569761542364282, "train/loss": 0.9589456480736616, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.589222846028861, "v2/prec@1": 0.5693, "v2/loss": 1.8972238891601563, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.392605041968636, "val/prec@1": 0.6914, "val/loss": 1.2556964208984376, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.20829896099167}
{"step": 70050, "global_schedule": 0.3578670024871826, "l2_grads": 1.8262490034103394, "l2_params": 281.4571838378906, "l2_updates": 0.3779314160346985, "training_loss": 4.052490234375, "uptime": 25723.308450965967, "examples_seen": 71731200.0, "progress": 0.6283807422158831, "epoch": 56.554513523422074, "img/sec/core": 188.84968262322408, "core_hours_Tesla V100-SXM2-32GB": 105.07337221541752, "core_hours": 105.07337221541752}
{"step": 70100, "global_schedule": 0.35712510347366333, "l2_grads": 1.7807788848876953, "l2_params": 281.3681335449219, "l2_updates": 0.39433571696281433, "training_loss": 2.103264808654785, "uptime": 25740.206509427982, "examples_seen": 71782400.0, "progress": 0.6288292652295989, "epoch": 56.59488077076213, "img/sec/core": 189.3708680907498, "core_hours_Tesla V100-SXM2-32GB": 105.14847469747092, "core_hours": 105.14847469747092}
{"step": 70151, "global_schedule": 0.35638362169265747, "l2_grads": 1.6835265159606934, "l2_params": 281.28369140625, "l2_updates": 0.3842867612838745, "training_loss": 2.778837203979492, "uptime": 25757.08883071295, "examples_seen": 71833600.0, "progress": 0.6292777882433148, "epoch": 56.63524801810219, "img/sec/core": 189.5473937490679, "core_hours_Tesla V100-SXM2-32GB": 105.22350723651522, "core_hours": 105.22350723651522}
{"step": 70200, "global_schedule": 0.3556423783302307, "l2_grads": 1.7898979187011719, "l2_params": 281.1865539550781, "l2_updates": 0.3827177584171295, "training_loss": 2.176971912384033, "uptime": 25773.977592374955, "examples_seen": 71884800.0, "progress": 0.6297263112570306, "epoch": 56.67561526544225, "img/sec/core": 189.47511155889603, "core_hours_Tesla V100-SXM2-32GB": 105.29856839945747, "core_hours": 105.29856839945747}
{"step": 70250, "global_schedule": 0.35490161180496216, "l2_grads": 1.9028784036636353, "l2_params": 281.08740234375, "l2_updates": 0.3817620277404785, "training_loss": 2.172069549560547, "uptime": 25790.878026789986, "examples_seen": 71936000.0, "progress": 0.6301748342707464, "epoch": 56.715982512782304, "img/sec/core": 189.34424532626286, "core_hours_Tesla V100-SXM2-32GB": 105.37368144130205, "core_hours": 105.37368144130205}
{"step": 70300, "global_schedule": 0.3541610836982727, "l2_grads": 1.9258722066879272, "l2_params": 281.0008850097656, "l2_updates": 0.3893491327762604, "training_loss": 2.1335337162017822, "uptime": 25807.758980454004, "examples_seen": 71987200.0, "progress": 0.6306233572844623, "epoch": 56.75634976012236, "img/sec/core": 189.56275004893763, "core_hours_Tesla V100-SXM2-32GB": 105.44870790203102, "core_hours": 105.44870790203102}
{"step": 70350, "global_schedule": 0.3534209728240967, "l2_grads": 1.6681816577911377, "l2_params": 280.91357421875, "l2_updates": 0.38496777415275574, "training_loss": 2.792727470397949, "uptime": 25824.647933575965, "examples_seen": 72038400.0, "progress": 0.6310718802981781, "epoch": 56.79671700746242, "img/sec/core": 189.47296359292787, "core_hours_Tesla V100-SXM2-32GB": 105.5237699159064, "core_hours": 105.5237699159064}
{"step": 70400, "global_schedule": 0.35268115997314453, "l2_grads": 1.9292467832565308, "l2_params": 280.8157043457031, "l2_updates": 0.38198718428611755, "training_loss": 2.1119158267974854, "uptime": 25841.54118676798, "examples_seen": 72089600.0, "progress": 0.631520403311894, "epoch": 56.83708425480248, "img/sec/core": 189.42473445627667, "core_hours_Tesla V100-SXM2-32GB": 105.59885104120424, "core_hours": 105.59885104120424}
{"step": 70451, "global_schedule": 0.3519417643547058, "l2_grads": 1.909091591835022, "l2_params": 280.7174377441406, "l2_updates": 0.38137540221214294, "training_loss": 2.0726733207702637, "uptime": 25858.415374648, "examples_seen": 72140800.0, "progress": 0.6319689263256097, "epoch": 56.87745150214254, "img/sec/core": 189.6387561139332, "core_hours_Tesla V100-SXM2-32GB": 105.67384743178212, "core_hours": 105.67384743178212}
{"step": 70500, "global_schedule": 0.3512026369571686, "l2_grads": 1.8340004682540894, "l2_params": 280.6409606933594, "l2_updates": 0.38419291377067566, "training_loss": 2.0336668491363525, "uptime": 25875.300561744953, "examples_seen": 72192000.0, "progress": 0.6324174493393256, "epoch": 56.9178187494826, "img/sec/core": 189.5152231139709, "core_hours_Tesla V100-SXM2-32GB": 105.74889270776858, "core_hours": 105.74889270776858}
{"step": 70550, "global_schedule": 0.35046398639678955, "l2_grads": 1.9173110723495483, "l2_params": 280.5487365722656, "l2_updates": 0.38241204619407654, "training_loss": 2.229771137237549, "uptime": 25892.195039677958, "examples_seen": 72243200.0, "progress": 0.6328659723530414, "epoch": 56.95818599682266, "img/sec/core": 189.41100238134595, "core_hours_Tesla V100-SXM2-32GB": 105.82397927635971, "core_hours": 105.82397927635971}
{"step": 70600, "global_schedule": 0.34972554445266724, "l2_grads": 1.5936769247055054, "l2_params": 280.46209716796875, "l2_updates": 0.3810517191886902, "training_loss": 2.7875688076019287, "uptime": 25909.082972873992, "examples_seen": 72294400.0, "progress": 0.6333144953667572, "epoch": 56.998553244162714, "img/sec/core": 189.48440657921608, "core_hours_Tesla V100-SXM2-32GB": 105.89903675723097, "core_hours": 105.89903675723097}
{"step": 70650, "global_schedule": 0.3489876091480255, "l2_grads": 1.755733609199524, "l2_params": 280.3666687011719, "l2_updates": 0.38290756940841675, "training_loss": 1.8965861797332764, "uptime": 25925.95295202697, "examples_seen": 72345600.0, "progress": 0.6337630183804731, "epoch": 57.03892049150277, "img/sec/core": 189.6860672429921, "core_hours_Tesla V100-SXM2-32GB": 105.97401444235533, "core_hours": 105.97401444235533}
{"step": 70700, "global_schedule": 0.34824997186660767, "l2_grads": 1.881118893623352, "l2_params": 280.2851867675781, "l2_updates": 0.3751516044139862, "training_loss": 2.052729606628418, "uptime": 25942.842175059952, "examples_seen": 72396800.0, "progress": 0.6342115413941889, "epoch": 57.07928773884283, "img/sec/core": 189.46993557674256, "core_hours_Tesla V100-SXM2-32GB": 106.04907765583523, "core_hours": 106.04907765583523}
{"step": 70750, "global_schedule": 0.34751269221305847, "l2_grads": 1.8391480445861816, "l2_params": 280.1994934082031, "l2_updates": 0.3765993118286133, "training_loss": 2.06638240814209, "uptime": 25959.71755218599, "examples_seen": 72448000.0, "progress": 0.6346600644079048, "epoch": 57.11965498618289, "img/sec/core": 189.6253918416152, "core_hours_Tesla V100-SXM2-32GB": 106.12407933195095, "core_hours": 106.12407933195095}
{"step": 70800, "global_schedule": 0.34677577018737793, "l2_grads": 1.8751219511032104, "l2_params": 280.11138916015625, "l2_updates": 0.3764103055000305, "training_loss": 2.0996925830841064, "uptime": 25976.612277127977, "examples_seen": 72499200.0, "progress": 0.6351085874216206, "epoch": 57.16002223352295, "img/sec/core": 189.4082331016412, "core_hours_Tesla V100-SXM2-32GB": 106.19916699835979, "core_hours": 106.19916699835979}
{"step": 70850, "global_schedule": 0.3460392355918884, "l2_grads": 1.8880101442337036, "l2_params": 280.0321350097656, "l2_updates": 0.3737840950489044, "training_loss": 2.068985939025879, "uptime": 25993.48660049698, "examples_seen": 72550400.0, "progress": 0.6355571104353365, "epoch": 57.20038948086301, "img/sec/core": 189.63723344771427, "core_hours_Tesla V100-SXM2-32GB": 106.27416399111092, "core_hours": 106.27416399111092}
{"step": 70900, "global_schedule": 0.3453030586242676, "l2_grads": 1.8320778608322144, "l2_params": 279.95452880859375, "l2_updates": 0.38358059525489807, "training_loss": 2.0270166397094727, "uptime": 26010.367404803983, "examples_seen": 72601600.0, "progress": 0.6360056334490523, "epoch": 57.24075672820307, "img/sec/core": 189.5644272514106, "core_hours_Tesla V100-SXM2-32GB": 106.34918978803093, "core_hours": 106.34918978803093}
{"step": 70950, "global_schedule": 0.3445672392845154, "l2_grads": 1.8323590755462646, "l2_params": 279.86309814453125, "l2_updates": 0.3819687068462372, "training_loss": 2.0699009895324707, "uptime": 26027.24304530496, "examples_seen": 72652800.0, "progress": 0.6364541564627682, "epoch": 57.281123975543125, "img/sec/core": 189.62243239388198, "core_hours_Tesla V100-SXM2-32GB": 106.42419263470194, "core_hours": 106.42419263470194}
{"step": 71000, "global_schedule": 0.3438318371772766, "l2_grads": 1.939685583114624, "l2_params": 279.7806091308594, "l2_updates": 0.3746809959411621, "training_loss": 2.0312347412109375, "uptime": 26044.145936695975, "examples_seen": 72704000.0, "progress": 0.6369026794764839, "epoch": 57.32149122288318, "img/sec/core": 189.31672256386756, "core_hours_Tesla V100-SXM2-32GB": 106.49931659643978, "core_hours": 106.49931659643978}
{"step": 71050, "global_schedule": 0.3430967628955841, "l2_grads": 1.6807557344436646, "l2_params": 279.6897277832031, "l2_updates": 0.3715146780014038, "training_loss": 3.279789686203003, "uptime": 26061.512474373973, "examples_seen": 72755200.0, "progress": 0.6373512024901997, "epoch": 57.36185847022324, "img/sec/core": 189.5870351806774, "core_hours_Tesla V100-SXM2-32GB": 106.574333446662, "core_hours": 106.574333446662}
{"step": 71100, "global_schedule": 0.34236207604408264, "l2_grads": 1.6453635692596436, "l2_params": 279.59527587890625, "l2_updates": 0.3708374798297882, "training_loss": 2.9555373191833496, "uptime": 26078.391336437955, "examples_seen": 72806400.0, "progress": 0.6377997255039156, "epoch": 57.4022257175633, "img/sec/core": 189.58624034427166, "core_hours_Tesla V100-SXM2-32GB": 106.64935061139082, "core_hours": 106.64935061139082}
{"step": 71150, "global_schedule": 0.3416277766227722, "l2_grads": 1.8995546102523804, "l2_params": 279.5060729980469, "l2_updates": 0.3651953339576721, "training_loss": 2.0971901416778564, "uptime": 26095.266898249974, "examples_seen": 72857600.0, "progress": 0.6382482485176314, "epoch": 57.44259296490336, "img/sec/core": 189.62331658320457, "core_hours_Tesla V100-SXM2-32GB": 106.72435310833312, "core_hours": 106.72435310833312}
{"step": 71200, "global_schedule": 0.34089386463165283, "l2_grads": 1.8986561298370361, "l2_params": 279.4112243652344, "l2_updates": 0.3687991499900818, "training_loss": 2.135136604309082, "uptime": 26112.146010971977, "examples_seen": 72908800.0, "progress": 0.6386967715313473, "epoch": 57.48296021224342, "img/sec/core": 189.58342495269994, "core_hours_Tesla V100-SXM2-32GB": 106.79937138709758, "core_hours": 106.79937138709758}
{"step": 71250, "global_schedule": 0.3401603102684021, "l2_grads": 1.6999038457870483, "l2_params": 279.3271484375, "l2_updates": 0.37456196546554565, "training_loss": 2.6639533042907715, "uptime": 26129.045849924965, "examples_seen": 72960000.0, "progress": 0.6391452945450631, "epoch": 57.52332745958348, "img/sec/core": 189.35091682836625, "core_hours_Tesla V100-SXM2-32GB": 106.87448178244419, "core_hours": 106.87448178244419}
{"step": 71300, "global_schedule": 0.3394271433353424, "l2_grads": 1.751025676727295, "l2_params": 279.2433776855469, "l2_updates": 0.3671736717224121, "training_loss": 3.2209439277648926, "uptime": 26145.923304440978, "examples_seen": 73011200.0, "progress": 0.639593817558779, "epoch": 57.563694706923535, "img/sec/core": 189.60205148021876, "core_hours_Tesla V100-SXM2-32GB": 106.94949269140423, "core_hours": 106.94949269140423}
{"step": 71350, "global_schedule": 0.33869436383247375, "l2_grads": 1.8253042697906494, "l2_params": 279.1548767089844, "l2_updates": 0.3671415150165558, "training_loss": 2.0812110900878906, "uptime": 26162.803033075994, "examples_seen": 73062400.0, "progress": 0.6400423405724948, "epoch": 57.60406195426359, "img/sec/core": 189.57650737119792, "core_hours_Tesla V100-SXM2-32GB": 107.02451370755986, "core_hours": 107.02451370755986}
{"step": 71400, "global_schedule": 0.33796197175979614, "l2_grads": 1.7329243421554565, "l2_params": 279.0669250488281, "l2_updates": 0.3630622327327728, "training_loss": 3.073535203933716, "uptime": 26179.70575200295, "examples_seen": 73113600.0, "progress": 0.6404908635862107, "epoch": 57.64442920160365, "img/sec/core": 189.3186542253271, "core_hours_Tesla V100-SXM2-32GB": 107.09963690279078, "core_hours": 107.09963690279078}
{"step": 71450, "global_schedule": 0.33722996711730957, "l2_grads": 1.7303777933120728, "l2_params": 278.981201171875, "l2_updates": 0.3679471015930176, "training_loss": 4.216803550720215, "uptime": 26196.577790503972, "examples_seen": 73164800.0, "progress": 0.6409393865999264, "epoch": 57.68479644894371, "img/sec/core": 189.66291475720772, "core_hours_Tesla V100-SXM2-32GB": 107.1746237405731, "core_hours": 107.1746237405731}
{"step": 71500, "global_schedule": 0.3364983797073364, "l2_grads": 1.7825238704681396, "l2_params": 278.9118957519531, "l2_updates": 0.359736829996109, "training_loss": 2.327606678009033, "uptime": 26213.46095630998, "examples_seen": 73216000.0, "progress": 0.6413879096136422, "epoch": 57.72516369628377, "img/sec/core": 189.5379123067813, "core_hours_Tesla V100-SXM2-32GB": 107.24966003304425, "core_hours": 107.24966003304425}
{"step": 71550, "global_schedule": 0.3357672095298767, "l2_grads": 1.7606194019317627, "l2_params": 278.82525634765625, "l2_updates": 0.3667553663253784, "training_loss": 2.345890522003174, "uptime": 26230.354561154963, "examples_seen": 73267200.0, "progress": 0.6418364326273581, "epoch": 57.76553094362383, "img/sec/core": 189.42079143932895, "core_hours_Tesla V100-SXM2-32GB": 107.32474272124416, "core_hours": 107.32474272124416}
{"step": 71600, "global_schedule": 0.33503633737564087, "l2_grads": 1.742759346961975, "l2_params": 278.7353820800781, "l2_updates": 0.36246034502983093, "training_loss": 3.9729747772216797, "uptime": 26247.24518417596, "examples_seen": 73318400.0, "progress": 0.6422849556410739, "epoch": 57.80589819096389, "img/sec/core": 189.4542312632216, "core_hours_Tesla V100-SXM2-32GB": 107.39981215689305, "core_hours": 107.39981215689305}
{"step": 71650, "global_schedule": 0.33430594205856323, "l2_grads": 1.8516123294830322, "l2_params": 278.6488952636719, "l2_updates": 0.3654775321483612, "training_loss": 2.099024772644043, "uptime": 26264.108391040005, "examples_seen": 73369600.0, "progress": 0.6427334786547898, "epoch": 57.846265438303945, "img/sec/core": 189.7622454494801, "core_hours_Tesla V100-SXM2-32GB": 107.47475974295547, "core_hours": 107.47475974295547}
{"step": 71700, "global_schedule": 0.3335758447647095, "l2_grads": 1.794475793838501, "l2_params": 278.5570983886719, "l2_updates": 0.36253997683525085, "training_loss": 2.1593222618103027, "uptime": 26281.01009877195, "examples_seen": 73420800.0, "progress": 0.6431820016685056, "epoch": 57.886632685644, "img/sec/core": 189.32998077774323, "core_hours_Tesla V100-SXM2-32GB": 107.54987844398633, "core_hours": 107.54987844398633}
{"step": 71750, "global_schedule": 0.3328462839126587, "l2_grads": 1.8705207109451294, "l2_params": 278.4740905761719, "l2_updates": 0.3682876229286194, "training_loss": 2.099679708480835, "uptime": 26297.893496375997, "examples_seen": 73472000.0, "progress": 0.6436305246822215, "epoch": 57.92699993298406, "img/sec/core": 189.53531007483954, "core_hours_Tesla V100-SXM2-32GB": 107.62491576667098, "core_hours": 107.62491576667098}
{"step": 71800, "global_schedule": 0.3321169912815094, "l2_grads": 1.850559115409851, "l2_params": 278.3880920410156, "l2_updates": 0.3591814637184143, "training_loss": 2.1418771743774414, "uptime": 26314.77697672398, "examples_seen": 73523200.0, "progress": 0.6440790476959373, "epoch": 57.96736718032412, "img/sec/core": 189.53438118474787, "core_hours_Tesla V100-SXM2-32GB": 107.69995345710647, "core_hours": 107.69995345710647}
{"step": 71850, "global_schedule": 0.3313882052898407, "l2_grads": 1.903460144996643, "l2_params": 278.2936096191406, "l2_updates": 0.3588204085826874, "training_loss": 2.1402530670166016, "uptime": 26331.659665265994, "examples_seen": 73574400.0, "progress": 0.6445275707096532, "epoch": 58.00773442766418, "img/sec/core": 189.5432704356719, "core_hours_Tesla V100-SXM2-32GB": 107.7749876284043, "core_hours": 107.7749876284043}
{"step": 71900, "global_schedule": 0.3306597173213959, "l2_grads": 1.839287281036377, "l2_params": 278.2113037109375, "l2_updates": 0.3551962375640869, "training_loss": 2.3647658824920654, "uptime": 26348.546860625967, "examples_seen": 73625600.0, "progress": 0.644976093723369, "epoch": 58.04810167500424, "img/sec/core": 189.4926855399974, "core_hours_Tesla V100-SXM2-32GB": 107.85004183000419, "core_hours": 107.85004183000419}
{"step": 71950, "global_schedule": 0.32993173599243164, "l2_grads": 1.7523301839828491, "l2_params": 278.1295166015625, "l2_updates": 0.3580946922302246, "training_loss": 3.377866268157959, "uptime": 26365.429054201, "examples_seen": 73676800.0, "progress": 0.6454246167370847, "epoch": 58.0884689223443, "img/sec/core": 189.54882763178483, "core_hours_Tesla V100-SXM2-32GB": 107.92507380144879, "core_hours": 107.92507380144879}
{"step": 72000, "global_schedule": 0.32920408248901367, "l2_grads": 1.910938024520874, "l2_params": 278.0434265136719, "l2_updates": 0.3565269112586975, "training_loss": 2.2417337894439697, "uptime": 26382.31421614095, "examples_seen": 73728000.0, "progress": 0.6458731397508006, "epoch": 58.128836169684355, "img/sec/core": 189.51550547044613, "core_hours_Tesla V100-SXM2-32GB": 108.00011896562633, "core_hours": 108.00011896562633}
{"step": 72050, "global_schedule": 0.3284769356250763, "l2_grads": 1.852442979812622, "l2_params": 277.9670104980469, "l2_updates": 0.34867486357688904, "training_loss": 3.63423228263855, "uptime": 26399.691481694987, "examples_seen": 73779200.0, "progress": 0.6463216627645164, "epoch": 58.16920341702441, "img/sec/core": 189.9682508568187, "core_hours_Tesla V100-SXM2-32GB": 108.07498527701297, "core_hours": 108.07498527701297}
{"step": 72100, "global_schedule": 0.3277500867843628, "l2_grads": 1.9760254621505737, "l2_params": 277.8769226074219, "l2_updates": 0.355815589427948, "training_loss": 2.127987861633301, "uptime": 26416.557145397994, "examples_seen": 73830400.0, "progress": 0.6467701857782323, "epoch": 58.20957066436447, "img/sec/core": 189.73460258367646, "core_hours_Tesla V100-SXM2-32GB": 108.14994378235967, "core_hours": 108.14994378235967}
{"step": 72150, "global_schedule": 0.32702362537384033, "l2_grads": 1.8059629201889038, "l2_params": 277.7828674316406, "l2_updates": 0.3588017523288727, "training_loss": 2.6392741203308105, "uptime": 26433.406127001974, "examples_seen": 73881600.0, "progress": 0.6472187087919481, "epoch": 58.24993791170453, "img/sec/core": 189.92245793918468, "core_hours_Tesla V100-SXM2-32GB": 108.22482814504403, "core_hours": 108.22482814504403}
{"step": 72200, "global_schedule": 0.32629773020744324, "l2_grads": 1.8941481113433838, "l2_params": 277.70538330078125, "l2_updates": 0.3542446196079254, "training_loss": 2.1379895210266113, "uptime": 26450.27010467497, "examples_seen": 73932800.0, "progress": 0.647667231805664, "epoch": 58.29030515904459, "img/sec/core": 189.75357190633335, "core_hours_Tesla V100-SXM2-32GB": 108.29977915692402, "core_hours": 108.29977915692402}
{"step": 72250, "global_schedule": 0.32557213306427, "l2_grads": 1.8779773712158203, "l2_params": 277.6210632324219, "l2_updates": 0.3464699983596802, "training_loss": 4.479169845581055, "uptime": 26467.134055566974, "examples_seen": 73984000.0, "progress": 0.6481157548193798, "epoch": 58.33067240638465, "img/sec/core": 189.7538732467248, "core_hours_Tesla V100-SXM2-32GB": 108.37473004977736, "core_hours": 108.37473004977736}
{"step": 72300, "global_schedule": 0.3248470425605774, "l2_grads": 1.8020386695861816, "l2_params": 277.5352783203125, "l2_updates": 0.35356035828590393, "training_loss": 2.3408679962158203, "uptime": 26483.98296159698, "examples_seen": 74035200.0, "progress": 0.6485642778330957, "epoch": 58.37103965372471, "img/sec/core": 189.92330981615615, "core_hours_Tesla V100-SXM2-32GB": 108.44961407657738, "core_hours": 108.44961407657738}
{"step": 72350, "global_schedule": 0.32412227988243103, "l2_grads": 1.6881743669509888, "l2_params": 277.44488525390625, "l2_updates": 0.35419249534606934, "training_loss": 2.6140706539154053, "uptime": 26500.834111512988, "examples_seen": 74086400.0, "progress": 0.6490128008468115, "epoch": 58.411406901064765, "img/sec/core": 189.89801977608676, "core_hours_Tesla V100-SXM2-32GB": 108.52450807620409, "core_hours": 108.52450807620409}
{"step": 72400, "global_schedule": 0.32339805364608765, "l2_grads": 1.945620059967041, "l2_params": 277.355224609375, "l2_updates": 0.35098737478256226, "training_loss": 2.170407295227051, "uptime": 26517.70444309496, "examples_seen": 74137600.0, "progress": 0.6494613238605272, "epoch": 58.45177414840482, "img/sec/core": 189.68210461372308, "core_hours_Tesla V100-SXM2-32GB": 108.59948732767953, "core_hours": 108.59948732767953}
{"step": 72450, "global_schedule": 0.32267409563064575, "l2_grads": 1.9418549537658691, "l2_params": 277.2710266113281, "l2_updates": 0.352504700422287, "training_loss": 2.135040521621704, "uptime": 26534.564151398954, "examples_seen": 74188800.0, "progress": 0.6499098468742431, "epoch": 58.49214139574488, "img/sec/core": 189.8016230353228, "core_hours_Tesla V100-SXM2-32GB": 108.67441936458616, "core_hours": 108.67441936458616}
{"step": 72500, "global_schedule": 0.3219507336616516, "l2_grads": 1.895585536956787, "l2_params": 277.18359375, "l2_updates": 0.34823495149612427, "training_loss": 2.8032419681549072, "uptime": 26551.41047492699, "examples_seen": 74240000.0, "progress": 0.6503583698879589, "epoch": 58.53250864308494, "img/sec/core": 189.9524246150498, "core_hours_Tesla V100-SXM2-32GB": 108.74929191359965, "core_hours": 108.74929191359965, "minival/prec@1": 0.7339993755853887, "minival/loss": 1.0815809799513518, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.898391594993882, "real/prec@1": 0.7710357196233747, "real/loss": 1.8915067955714433, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.177427757997066, "train/prec@1": 0.7644303945673808, "train/loss": 0.9200904316037366, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.620409401017241, "v2/prec@1": 0.5703, "v2/loss": 1.8771148803710938, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.374917541979812, "val/prec@1": 0.6967, "val/loss": 1.222492255859375, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.32831717497902}
{"step": 72550, "global_schedule": 0.32122766971588135, "l2_grads": 1.8645570278167725, "l2_params": 277.0932312011719, "l2_updates": 0.3472767770290375, "training_loss": 4.144314765930176, "uptime": 26604.73535077198, "examples_seen": 74291200.0, "progress": 0.6508068929016748, "epoch": 58.572875890424996, "img/sec/core": 189.08726039410635, "core_hours_Tesla V100-SXM2-32GB": 108.82450704016387, "core_hours": 108.82450704016387}
{"step": 72600, "global_schedule": 0.3205051124095917, "l2_grads": 1.9468353986740112, "l2_params": 277.0057373046875, "l2_updates": 0.3480894863605499, "training_loss": 2.0654256343841553, "uptime": 26621.59067673399, "examples_seen": 74342400.0, "progress": 0.6512554159153906, "epoch": 58.61324313776506, "img/sec/core": 189.85097097573535, "core_hours_Tesla V100-SXM2-32GB": 108.89941959999503, "core_hours": 108.89941959999503}
{"step": 72650, "global_schedule": 0.31978291273117065, "l2_grads": 1.9182215929031372, "l2_params": 276.9205017089844, "l2_updates": 0.34414011240005493, "training_loss": 2.2094533443450928, "uptime": 26638.455150283, "examples_seen": 74393600.0, "progress": 0.6517039389291065, "epoch": 58.65361038510512, "img/sec/core": 189.74799247072087, "core_hours_Tesla V100-SXM2-32GB": 108.97437281576839, "core_hours": 108.97437281576839}
{"step": 72700, "global_schedule": 0.3190612196922302, "l2_grads": 1.9494080543518066, "l2_params": 276.83282470703125, "l2_updates": 0.3445012867450714, "training_loss": 2.124250650405884, "uptime": 26655.329946279002, "examples_seen": 74444800.0, "progress": 0.6521524619428223, "epoch": 58.693977632445176, "img/sec/core": 189.63192211379405, "core_hours_Tesla V100-SXM2-32GB": 109.04937190908394, "core_hours": 109.04937190908394}
{"step": 72750, "global_schedule": 0.31833988428115845, "l2_grads": 1.794235110282898, "l2_params": 276.7424621582031, "l2_updates": 0.33981895446777344, "training_loss": 4.168357849121094, "uptime": 26672.19905850198, "examples_seen": 74496000.0, "progress": 0.6526009849565381, "epoch": 58.73434487978523, "img/sec/core": 189.69581550598264, "core_hours_Tesla V100-SXM2-32GB": 109.12434574118608, "core_hours": 109.12434574118608}
{"step": 72800, "global_schedule": 0.31761908531188965, "l2_grads": 1.8151254653930664, "l2_params": 276.64013671875, "l2_updates": 0.34981974959373474, "training_loss": 2.965740203857422, "uptime": 26689.058095049986, "examples_seen": 74547200.0, "progress": 0.653049507970254, "epoch": 58.77471212712529, "img/sec/core": 189.8091857674203, "core_hours_Tesla V100-SXM2-32GB": 109.19927479251055, "core_hours": 109.19927479251055}
{"step": 72850, "global_schedule": 0.3168985843658447, "l2_grads": 1.8487560749053955, "l2_params": 276.57330322265625, "l2_updates": 0.34522438049316406, "training_loss": 4.566970348358154, "uptime": 26705.94048738398, "examples_seen": 74598400.0, "progress": 0.6534980309839697, "epoch": 58.81507937446535, "img/sec/core": 189.54659604470555, "core_hours_Tesla V100-SXM2-32GB": 109.2743076473283, "core_hours": 109.2743076473283}
{"step": 72900, "global_schedule": 0.31617867946624756, "l2_grads": 1.7519348859786987, "l2_params": 276.47796630859375, "l2_updates": 0.34188899397850037, "training_loss": 2.384150743484497, "uptime": 26722.828478852985, "examples_seen": 74649600.0, "progress": 0.6539465539976856, "epoch": 58.855446621805406, "img/sec/core": 189.48375275255214, "core_hours_Tesla V100-SXM2-32GB": 109.34936538719055, "core_hours": 109.34936538719055}
{"step": 72950, "global_schedule": 0.31545907258987427, "l2_grads": 2.047712564468384, "l2_params": 276.38653564453125, "l2_updates": 0.3404981791973114, "training_loss": 2.269578456878662, "uptime": 26739.69965501997, "examples_seen": 74700800.0, "progress": 0.6543950770114014, "epoch": 58.89581386914547, "img/sec/core": 189.67260897093064, "core_hours_Tesla V100-SXM2-32GB": 109.42434839237714, "core_hours": 109.42434839237714}
{"step": 73000, "global_schedule": 0.31474003195762634, "l2_grads": 1.941479206085205, "l2_params": 276.3032531738281, "l2_updates": 0.3424990773200989, "training_loss": 2.0763473510742188, "uptime": 26756.55143048498, "examples_seen": 74752000.0, "progress": 0.6548436000251173, "epoch": 58.93618111648553, "img/sec/core": 189.89097063656135, "core_hours_Tesla V100-SXM2-32GB": 109.49924517222163, "core_hours": 109.49924517222163}
{"step": 73050, "global_schedule": 0.3140213191509247, "l2_grads": 1.9763126373291016, "l2_params": 276.2167053222656, "l2_updates": 0.3325263559818268, "training_loss": 1.9475038051605225, "uptime": 26774.289382245974, "examples_seen": 74803200.0, "progress": 0.6552921230388331, "epoch": 58.976548363825586, "img/sec/core": 189.47193662239943, "core_hours_Tesla V100-SXM2-32GB": 109.57430759294606, "core_hours": 109.57430759294606}
{"step": 73100, "global_schedule": 0.3133031725883484, "l2_grads": 1.786318063735962, "l2_params": 276.1331481933594, "l2_updates": 0.3402946889400482, "training_loss": 2.454038619995117, "uptime": 26791.130635662004, "examples_seen": 74854400.0, "progress": 0.655740646052549, "epoch": 59.01691561116564, "img/sec/core": 190.00961038648222, "core_hours_Tesla V100-SXM2-32GB": 109.64915760812842, "core_hours": 109.64915760812842}
{"step": 73150, "global_schedule": 0.31258535385131836, "l2_grads": 1.777658462524414, "l2_params": 276.05230712890625, "l2_updates": 0.3358986973762512, "training_loss": 3.3921637535095215, "uptime": 26807.99590645096, "examples_seen": 74905600.0, "progress": 0.6561891690662648, "epoch": 59.0572828585057, "img/sec/core": 189.73902287388614, "core_hours_Tesla V100-SXM2-32GB": 109.72411436719044, "core_hours": 109.72411436719044}
{"step": 73200, "global_schedule": 0.3118680715560913, "l2_grads": 2.0125670433044434, "l2_params": 275.9613952636719, "l2_updates": 0.33937808871269226, "training_loss": 1.9990193843841553, "uptime": 26824.863043023972, "examples_seen": 74956800.0, "progress": 0.6566376920799806, "epoch": 59.09765010584576, "img/sec/core": 189.71803460228105, "core_hours_Tesla V100-SXM2-32GB": 109.79907941862604, "core_hours": 109.79907941862604}
{"step": 73250, "global_schedule": 0.3111511468887329, "l2_grads": 1.8928762674331665, "l2_params": 275.8826599121094, "l2_updates": 0.3419386148452759, "training_loss": 2.057063102722168, "uptime": 26841.71277124295, "examples_seen": 75008000.0, "progress": 0.6570862150936965, "epoch": 59.138017353185816, "img/sec/core": 189.91404243516283, "core_hours_Tesla V100-SXM2-32GB": 109.87396709959928, "core_hours": 109.87396709959928}
{"step": 73300, "global_schedule": 0.31043481826782227, "l2_grads": 1.7739510536193848, "l2_params": 275.7920837402344, "l2_updates": 0.33837512135505676, "training_loss": 2.4761338233947754, "uptime": 26858.582520317985, "examples_seen": 75059200.0, "progress": 0.6575347381074123, "epoch": 59.17838460052588, "img/sec/core": 189.68865427498545, "core_hours_Tesla V100-SXM2-32GB": 109.948943762155, "core_hours": 109.948943762155}
{"step": 73350, "global_schedule": 0.3097187876701355, "l2_grads": 1.9285107851028442, "l2_params": 275.7037353515625, "l2_updates": 0.33999907970428467, "training_loss": 1.9996830224990845, "uptime": 26875.443364934996, "examples_seen": 75110400.0, "progress": 0.6579832611211281, "epoch": 59.21875184786594, "img/sec/core": 189.78883162065898, "core_hours_Tesla V100-SXM2-32GB": 110.0238808493417, "core_hours": 110.0238808493417}
{"step": 73400, "global_schedule": 0.3090033531188965, "l2_grads": 1.953817367553711, "l2_params": 275.61444091796875, "l2_updates": 0.33031710982322693, "training_loss": 1.972670555114746, "uptime": 26892.290620907967, "examples_seen": 75161600.0, "progress": 0.6584317841348439, "epoch": 59.259119095205996, "img/sec/core": 189.9419113198012, "core_hours_Tesla V100-SXM2-32GB": 110.0987575425549, "core_hours": 110.0987575425549}
{"step": 73450, "global_schedule": 0.30828824639320374, "l2_grads": 1.823883295059204, "l2_params": 275.53216552734375, "l2_updates": 0.3325617015361786, "training_loss": 4.377138137817383, "uptime": 26909.158051015984, "examples_seen": 75212800.0, "progress": 0.6588803071485598, "epoch": 59.299486342546054, "img/sec/core": 189.71473303920806, "core_hours_Tesla V100-SXM2-32GB": 110.17372389859055, "core_hours": 110.17372389859055}
{"step": 73500, "global_schedule": 0.30757373571395874, "l2_grads": 1.9166346788406372, "l2_params": 275.44866943359375, "l2_updates": 0.33426904678344727, "training_loss": 2.1220109462738037, "uptime": 26926.007073874003, "examples_seen": 75264000.0, "progress": 0.6593288301622756, "epoch": 59.33985358988611, "img/sec/core": 189.92199292298602, "core_hours_Tesla V100-SXM2-32GB": 110.24860844462619, "core_hours": 110.24860844462619}
{"step": 73550, "global_schedule": 0.30685955286026, "l2_grads": 1.804134726524353, "l2_params": 275.3646545410156, "l2_updates": 0.33420827984809875, "training_loss": 2.738433837890625, "uptime": 26942.86324874399, "examples_seen": 75315200.0, "progress": 0.6597773531759915, "epoch": 59.38022083722617, "img/sec/core": 189.84140973156158, "core_hours_Tesla V100-SXM2-32GB": 110.32352477738168, "core_hours": 110.32352477738168}
{"step": 73600, "global_schedule": 0.30614593625068665, "l2_grads": 1.905684232711792, "l2_params": 275.27484130859375, "l2_updates": 0.33308321237564087, "training_loss": 2.142871379852295, "uptime": 26959.72541245597, "examples_seen": 75366400.0, "progress": 0.6602258761897073, "epoch": 59.420588084566226, "img/sec/core": 189.77398480164197, "core_hours_Tesla V100-SXM2-32GB": 110.39846772721269, "core_hours": 110.39846772721269}
{"step": 73650, "global_schedule": 0.30543267726898193, "l2_grads": 1.8079394102096558, "l2_params": 275.18701171875, "l2_updates": 0.3307955861091614, "training_loss": 3.019341230392456, "uptime": 26976.593586992996, "examples_seen": 75417600.0, "progress": 0.6606743992034231, "epoch": 59.46095533190629, "img/sec/core": 189.70636051789614, "core_hours_Tesla V100-SXM2-32GB": 110.47343739182172, "core_hours": 110.47343739182172}
{"step": 73700, "global_schedule": 0.304720014333725, "l2_grads": 1.7325620651245117, "l2_params": 275.10235595703125, "l2_updates": 0.33584970235824585, "training_loss": 3.5514252185821533, "uptime": 26993.468457361974, "examples_seen": 75468800.0, "progress": 0.661122922217139, "epoch": 59.50132257924635, "img/sec/core": 189.63108634497922, "core_hours_Tesla V100-SXM2-32GB": 110.54843681568383, "core_hours": 110.54843681568383}
{"step": 73750, "global_schedule": 0.30400770902633667, "l2_grads": 1.9441149234771729, "l2_params": 275.0176086425781, "l2_updates": 0.3257422149181366, "training_loss": 2.7363710403442383, "uptime": 27010.33664519695, "examples_seen": 75520000.0, "progress": 0.6615714452308548, "epoch": 59.541689826586406, "img/sec/core": 189.70621096387978, "core_hours_Tesla V100-SXM2-32GB": 110.62340653939484, "core_hours": 110.62340653939484}
{"step": 73800, "global_schedule": 0.30329596996307373, "l2_grads": 1.8644249439239502, "l2_params": 274.92242431640625, "l2_updates": 0.33125579357147217, "training_loss": 2.093492031097412, "uptime": 27027.187563935993, "examples_seen": 75571200.0, "progress": 0.6620199682445707, "epoch": 59.582057073926464, "img/sec/core": 189.90062497811536, "core_hours_Tesla V100-SXM2-32GB": 110.69829951156837, "core_hours": 110.69829951156837}
{"step": 73850, "global_schedule": 0.30258458852767944, "l2_grads": 1.9362422227859497, "l2_params": 274.84405517578125, "l2_updates": 0.33032989501953125, "training_loss": 2.113133430480957, "uptime": 27044.04746837099, "examples_seen": 75622400.0, "progress": 0.6624684912582864, "epoch": 59.62242432126652, "img/sec/core": 189.79941507601183, "core_hours_Tesla V100-SXM2-32GB": 110.77323242016836, "core_hours": 110.77323242016836}
{"step": 73900, "global_schedule": 0.3018738031387329, "l2_grads": 1.7868802547454834, "l2_params": 274.7577209472656, "l2_updates": 0.3260550796985626, "training_loss": 4.330741882324219, "uptime": 27060.89569310099, "examples_seen": 75673600.0, "progress": 0.6629170142720023, "epoch": 59.66279156860658, "img/sec/core": 189.93098983909226, "core_hours_Tesla V100-SXM2-32GB": 110.84811341896834, "core_hours": 110.84811341896834}
{"step": 73950, "global_schedule": 0.3011634349822998, "l2_grads": 1.784649133682251, "l2_params": 274.6685485839844, "l2_updates": 0.3241754472255707, "training_loss": 2.896785259246826, "uptime": 27077.747455835983, "examples_seen": 75724800.0, "progress": 0.6633655372857181, "epoch": 59.70315881594664, "img/sec/core": 189.89111408238517, "core_hours_Tesla V100-SXM2-32GB": 110.92301014223499, "core_hours": 110.92301014223499}
{"step": 74000, "global_schedule": 0.3004535436630249, "l2_grads": 1.9567711353302002, "l2_params": 274.5780944824219, "l2_updates": 0.3271840512752533, "training_loss": 1.946613073348999, "uptime": 27094.613982915005, "examples_seen": 75776000.0, "progress": 0.663814060299434, "epoch": 59.7435260632867, "img/sec/core": 189.7248903112933, "core_hours_Tesla V100-SXM2-32GB": 110.99797248480841, "core_hours": 110.99797248480841}
{"step": 74050, "global_schedule": 0.2997440993785858, "l2_grads": 1.8296133279800415, "l2_params": 274.5008544921875, "l2_updates": 0.3298896551132202, "training_loss": 2.452871084213257, "uptime": 27112.02796128695, "examples_seen": 75827200.0, "progress": 0.6642625833131498, "epoch": 59.78389331062676, "img/sec/core": 189.60113759610547, "core_hours_Tesla V100-SXM2-32GB": 111.07298375532368, "core_hours": 111.07298375532368}
{"step": 74100, "global_schedule": 0.2990351617336273, "l2_grads": 1.7428735494613647, "l2_params": 274.41766357421875, "l2_updates": 0.32160454988479614, "training_loss": 2.933717727661133, "uptime": 27128.895754850004, "examples_seen": 75878400.0, "progress": 0.6647111063268656, "epoch": 59.82426055796682, "img/sec/core": 189.71064520310964, "core_hours_Tesla V100-SXM2-32GB": 111.14795172671504, "core_hours": 111.14795172671504}
{"step": 74150, "global_schedule": 0.298326700925827, "l2_grads": 2.057537317276001, "l2_params": 274.33380126953125, "l2_updates": 0.32319000363349915, "training_loss": 2.1712920665740967, "uptime": 27145.76084903098, "examples_seen": 75929600.0, "progress": 0.6651596293405815, "epoch": 59.864627805306874, "img/sec/core": 189.74100978396632, "core_hours_Tesla V100-SXM2-32GB": 111.22290770085269, "core_hours": 111.22290770085269}
{"step": 74200, "global_schedule": 0.2976187467575073, "l2_grads": 1.892822027206421, "l2_params": 274.2416687011719, "l2_updates": 0.32188355922698975, "training_loss": 1.95359468460083, "uptime": 27162.641735018988, "examples_seen": 75980800.0, "progress": 0.6656081523542973, "epoch": 59.90499505264693, "img/sec/core": 189.5635100120457, "core_hours_Tesla V100-SXM2-32GB": 111.2979338607994, "core_hours": 111.2979338607994}
{"step": 74250, "global_schedule": 0.29691123962402344, "l2_grads": 1.8874274492263794, "l2_params": 274.15667724609375, "l2_updates": 0.3184340298175812, "training_loss": 3.8983378410339355, "uptime": 27179.49703768699, "examples_seen": 76032000.0, "progress": 0.6660566753680132, "epoch": 59.94536229998699, "img/sec/core": 189.851233349542, "core_hours_Tesla V100-SXM2-32GB": 111.37284631710163, "core_hours": 111.37284631710163}
{"step": 74300, "global_schedule": 0.29620420932769775, "l2_grads": 1.9715931415557861, "l2_params": 274.0768737792969, "l2_updates": 0.32605159282684326, "training_loss": 2.061328411102295, "uptime": 27196.384449033998, "examples_seen": 76083200.0, "progress": 0.666505198381729, "epoch": 59.98572954732705, "img/sec/core": 189.4902619617243, "core_hours_Tesla V100-SXM2-32GB": 111.44790147864389, "core_hours": 111.44790147864389}
{"step": 74350, "global_schedule": 0.29549771547317505, "l2_grads": 1.948708415031433, "l2_params": 273.99029541015625, "l2_updates": 0.32349714636802673, "training_loss": 2.0430190563201904, "uptime": 27213.26301336399, "examples_seen": 76134400.0, "progress": 0.6669537213954448, "epoch": 60.02609679466711, "img/sec/core": 189.58958460191616, "core_hours_Tesla V100-SXM2-32GB": 111.52291732011052, "core_hours": 111.52291732011052}
{"step": 74400, "global_schedule": 0.29479163885116577, "l2_grads": 1.971563696861267, "l2_params": 273.90802001953125, "l2_updates": 0.3139120638370514, "training_loss": 2.0235390663146973, "uptime": 27230.135952701967, "examples_seen": 76185600.0, "progress": 0.6674022444091606, "epoch": 60.06646404200717, "img/sec/core": 189.65278875848816, "core_hours_Tesla V100-SXM2-32GB": 111.59790816161264, "core_hours": 111.59790816161264}
{"step": 74450, "global_schedule": 0.29408615827560425, "l2_grads": 1.8069976568222046, "l2_params": 273.82958984375, "l2_updates": 0.31963908672332764, "training_loss": 2.9282798767089844, "uptime": 27246.98842728499, "examples_seen": 76236800.0, "progress": 0.6678507674228764, "epoch": 60.10683128934723, "img/sec/core": 189.88309308734205, "core_hours_Tesla V100-SXM2-32GB": 111.67280804864829, "core_hours": 111.67280804864829}
{"step": 74500, "global_schedule": 0.29338109493255615, "l2_grads": 2.0305402278900146, "l2_params": 273.7459716796875, "l2_updates": 0.3239835500717163, "training_loss": 2.26851224899292, "uptime": 27263.86962134298, "examples_seen": 76288000.0, "progress": 0.6682992904365923, "epoch": 60.147198536687284, "img/sec/core": 189.56005061059435, "core_hours_Tesla V100-SXM2-32GB": 111.74783557779492, "core_hours": 111.74783557779492}
{"step": 74550, "global_schedule": 0.29267656803131104, "l2_grads": 2.0016348361968994, "l2_params": 273.6693420410156, "l2_updates": 0.31659170985221863, "training_loss": 2.0175719261169434, "uptime": 27280.743105993955, "examples_seen": 76339200.0, "progress": 0.6687478134503081, "epoch": 60.18756578402734, "img/sec/core": 189.6466596077355, "core_hours_Tesla V100-SXM2-32GB": 111.82282884291037, "core_hours": 111.82282884291037}
{"step": 74600, "global_schedule": 0.29197248816490173, "l2_grads": 1.7180430889129639, "l2_params": 273.58306884765625, "l2_updates": 0.3157350718975067, "training_loss": 3.072610855102539, "uptime": 27297.621643668972, "examples_seen": 76390400.0, "progress": 0.669196336464024, "epoch": 60.2279330313674, "img/sec/core": 189.58988400616053, "core_hours_Tesla V100-SXM2-32GB": 111.89784456591045, "core_hours": 111.89784456591045}
{"step": 74650, "global_schedule": 0.2912689447402954, "l2_grads": 1.7918033599853516, "l2_params": 273.49951171875, "l2_updates": 0.3168390095233917, "training_loss": 3.430929183959961, "uptime": 27314.519660312973, "examples_seen": 76441600.0, "progress": 0.6696448594777398, "epoch": 60.26830027870746, "img/sec/core": 189.37133673234658, "core_hours_Tesla V100-SXM2-32GB": 111.972946862106, "core_hours": 111.972946862106}
{"step": 74700, "global_schedule": 0.2905658483505249, "l2_grads": 1.8221497535705566, "l2_params": 273.41754150390625, "l2_updates": 0.3133246600627899, "training_loss": 1.9144186973571777, "uptime": 27331.401458230976, "examples_seen": 76492800.0, "progress": 0.6700933824914557, "epoch": 60.30866752604752, "img/sec/core": 189.55327006892074, "core_hours_Tesla V100-SXM2-32GB": 112.0479770750749, "core_hours": 112.0479770750749}
{"step": 74750, "global_schedule": 0.28986334800720215, "l2_grads": 2.127169132232666, "l2_params": 273.3320007324219, "l2_updates": 0.31081393361091614, "training_loss": 4.3882012367248535, "uptime": 27348.28280572797, "examples_seen": 76544000.0, "progress": 0.6705419055051715, "epoch": 60.34903477338758, "img/sec/core": 189.55832764948667, "core_hours_Tesla V100-SXM2-32GB": 112.12300528617266, "core_hours": 112.12300528617266}
{"step": 74800, "global_schedule": 0.2891612648963928, "l2_grads": 2.0130133628845215, "l2_params": 273.24658203125, "l2_updates": 0.31432488560676575, "training_loss": 2.0360944271087646, "uptime": 27365.151396200003, "examples_seen": 76595200.0, "progress": 0.6709904285188873, "epoch": 60.38940202072764, "img/sec/core": 189.70168285876287, "core_hours_Tesla V100-SXM2-32GB": 112.19797679938169, "core_hours": 112.19797679938169}
{"step": 74850, "global_schedule": 0.28845977783203125, "l2_grads": 1.8191776275634766, "l2_params": 273.161376953125, "l2_updates": 0.31014108657836914, "training_loss": 4.470353126525879, "uptime": 27382.037762858963, "examples_seen": 76646400.0, "progress": 0.6714389515326031, "epoch": 60.429769268067695, "img/sec/core": 189.50198492237365, "core_hours_Tesla V100-SXM2-32GB": 112.27302731786595, "core_hours": 112.27302731786595}
{"step": 74900, "global_schedule": 0.2877586781978607, "l2_grads": 1.762587547302246, "l2_params": 273.0797119140625, "l2_updates": 0.3107258677482605, "training_loss": 2.902925729751587, "uptime": 27398.925504138984, "examples_seen": 76697600.0, "progress": 0.6718874745463189, "epoch": 60.47013651540775, "img/sec/core": 189.48655992176552, "core_hours_Tesla V100-SXM2-32GB": 112.34808394577718, "core_hours": 112.34808394577718}
{"step": 74950, "global_schedule": 0.2870582044124603, "l2_grads": 1.804219126701355, "l2_params": 272.9902648925781, "l2_updates": 0.30982837080955505, "training_loss": 2.771660327911377, "uptime": 27415.801428278966, "examples_seen": 76748800.0, "progress": 0.6723359975600348, "epoch": 60.51050376274781, "img/sec/core": 189.6192453495703, "core_hours_Tesla V100-SXM2-32GB": 112.42308805306598, "core_hours": 112.42308805306598}
{"step": 75000, "global_schedule": 0.28635814785957336, "l2_grads": 2.0200555324554443, "l2_params": 272.90911865234375, "l2_updates": 0.31062039732933044, "training_loss": 2.0576162338256836, "uptime": 27432.664301624987, "examples_seen": 76800000.0, "progress": 0.6727845205737506, "epoch": 60.55087101008787, "img/sec/core": 189.76599861346236, "core_hours_Tesla V100-SXM2-32GB": 112.49803415682608, "core_hours": 112.49803415682608, "minival/prec@1": 0.7371214486418982, "minival/loss": 1.0585853845820812, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.9077644890057854, "real/prec@1": 0.7758182633388133, "real/loss": 1.8696504966693, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.166549679997843, "train/prec@1": 0.7686453576864536, "train/loss": 0.8874300204260178, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.606346643005963, "v2/prec@1": 0.5737, "v2/loss": 1.8545146240234376, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.370270472019911, "val/prec@1": 0.70406, "val/loss": 1.1913061901855468, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.378069087979384}
{"step": 75050, "global_schedule": 0.28565871715545654, "l2_grads": 2.053257703781128, "l2_params": 272.8334655761719, "l2_updates": 0.306780070066452, "training_loss": 1.9619455337524414, "uptime": 27486.55181050999, "examples_seen": 76851200.0, "progress": 0.6732330435874665, "epoch": 60.591238257427925, "img/sec/core": 189.17926193413524, "core_hours_Tesla V100-SXM2-32GB": 112.57321270481708, "core_hours": 112.57321270481708}
{"step": 75100, "global_schedule": 0.28495967388153076, "l2_grads": 1.9597474336624146, "l2_params": 272.7431335449219, "l2_updates": 0.3105430006980896, "training_loss": 2.035503387451172, "uptime": 27503.42420764797, "examples_seen": 76902400.0, "progress": 0.6736815666011823, "epoch": 60.63160550476799, "img/sec/core": 189.6588833128324, "core_hours_Tesla V100-SXM2-32GB": 112.64820113654146, "core_hours": 112.64820113654146}
{"step": 75150, "global_schedule": 0.28426122665405273, "l2_grads": 1.9793989658355713, "l2_params": 272.6589660644531, "l2_updates": 0.30523040890693665, "training_loss": 1.978039264678955, "uptime": 27520.282519890985, "examples_seen": 76953600.0, "progress": 0.6741300896148982, "epoch": 60.67197275210805, "img/sec/core": 189.81734077953928, "core_hours_Tesla V100-SXM2-32GB": 112.72312696873263, "core_hours": 112.72312696873263}
{"step": 75200, "global_schedule": 0.2835633456707001, "l2_grads": 1.849863052368164, "l2_params": 272.5715637207031, "l2_updates": 0.30709272623062134, "training_loss": 2.513390302658081, "uptime": 27537.144925325003, "examples_seen": 77004800.0, "progress": 0.674578612628614, "epoch": 60.712339999448105, "img/sec/core": 189.77126439768557, "core_hours_Tesla V100-SXM2-32GB": 112.79807099288381, "core_hours": 112.79807099288381}
{"step": 75251, "global_schedule": 0.28286585211753845, "l2_grads": 2.1668617725372314, "l2_params": 272.48779296875, "l2_updates": 0.3051605820655823, "training_loss": 2.017399311065674, "uptime": 27554.01626558299, "examples_seen": 77056000.0, "progress": 0.6750271356423299, "epoch": 60.75270724678816, "img/sec/core": 189.670764211205, "core_hours_Tesla V100-SXM2-32GB": 112.87305472736377, "core_hours": 112.87305472736377}
{"step": 75300, "global_schedule": 0.282168984413147, "l2_grads": 1.9485480785369873, "l2_params": 272.3995361328125, "l2_updates": 0.30823206901550293, "training_loss": 2.312485456466675, "uptime": 27570.875275437953, "examples_seen": 77107200.0, "progress": 0.6754756586560456, "epoch": 60.79307449412822, "img/sec/core": 189.80948629425706, "core_hours_Tesla V100-SXM2-32GB": 112.94798366005247, "core_hours": 112.94798366005247}
{"step": 75350, "global_schedule": 0.2814725339412689, "l2_grads": 2.1322038173675537, "l2_params": 272.3200988769531, "l2_updates": 0.3043574094772339, "training_loss": 4.346637725830078, "uptime": 27587.782020886953, "examples_seen": 77158400.0, "progress": 0.6759241816697614, "epoch": 60.83344174146828, "img/sec/core": 189.27356596531442, "core_hours_Tesla V100-SXM2-32GB": 113.02312475093692, "core_hours": 113.02312475093692}
{"step": 75400, "global_schedule": 0.2807767391204834, "l2_grads": 1.7863479852676392, "l2_params": 272.24127197265625, "l2_updates": 0.2999360263347626, "training_loss": 3.280219554901123, "uptime": 27604.649650993, "examples_seen": 77209600.0, "progress": 0.6763727046834773, "epoch": 60.873808988808335, "img/sec/core": 189.71248360803637, "core_hours_Tesla V100-SXM2-32GB": 113.09809199585268, "core_hours": 113.09809199585268}
{"step": 75450, "global_schedule": 0.2800813317298889, "l2_grads": 1.9448390007019043, "l2_params": 272.15863037109375, "l2_updates": 0.3040120005607605, "training_loss": 1.9365599155426025, "uptime": 27621.516602771997, "examples_seen": 77260800.0, "progress": 0.6768212276971931, "epoch": 60.9141762361484, "img/sec/core": 189.7201131495936, "core_hours_Tesla V100-SXM2-32GB": 113.17305622598157, "core_hours": 113.17305622598157}
{"step": 75500, "global_schedule": 0.27938657999038696, "l2_grads": 1.8798109292984009, "l2_params": 272.07489013671875, "l2_updates": 0.30443480610847473, "training_loss": 4.293741703033447, "uptime": 27638.393296710972, "examples_seen": 77312000.0, "progress": 0.677269750710909, "epoch": 60.95454348348846, "img/sec/core": 189.61059622050055, "core_hours_Tesla V100-SXM2-32GB": 113.24806375459924, "core_hours": 113.24806375459924}
{"step": 75550, "global_schedule": 0.27869221568107605, "l2_grads": 2.018052101135254, "l2_params": 271.99432373046875, "l2_updates": 0.30385860800743103, "training_loss": 2.143037796020508, "uptime": 27655.264154645964, "examples_seen": 77363200.0, "progress": 0.6777182737246248, "epoch": 60.994910730828515, "img/sec/core": 189.67618673161675, "core_hours_Tesla V100-SXM2-32GB": 113.32304534542142, "core_hours": 113.32304534542142}
{"step": 75600, "global_schedule": 0.27799850702285767, "l2_grads": 1.9115419387817383, "l2_params": 271.9171142578125, "l2_updates": 0.30562669038772583, "training_loss": 1.9070411920547485, "uptime": 27672.13420137897, "examples_seen": 77414400.0, "progress": 0.6781667967383407, "epoch": 61.03527797816857, "img/sec/core": 189.68530737614103, "core_hours_Tesla V100-SXM2-32GB": 113.39802333090144, "core_hours": 113.39802333090144}
{"step": 75650, "global_schedule": 0.2773052453994751, "l2_grads": 1.9868035316467285, "l2_params": 271.8320617675781, "l2_updates": 0.29728758335113525, "training_loss": 2.1186444759368896, "uptime": 27689.00102806097, "examples_seen": 77465600.0, "progress": 0.6786153197520565, "epoch": 61.07564522550863, "img/sec/core": 189.72152025576656, "core_hours_Tesla V100-SXM2-32GB": 113.47298700504368, "core_hours": 113.47298700504368}
{"step": 75700, "global_schedule": 0.2766125798225403, "l2_grads": 1.9064315557479858, "l2_params": 271.75225830078125, "l2_updates": 0.30509546399116516, "training_loss": 2.283034324645996, "uptime": 27705.878947213, "examples_seen": 77516800.0, "progress": 0.6790638427657724, "epoch": 61.11601247284869, "img/sec/core": 189.5968318828662, "core_hours_Tesla V100-SXM2-32GB": 113.54799997905269, "core_hours": 113.54799997905269}
{"step": 75750, "global_schedule": 0.27592039108276367, "l2_grads": 2.0951671600341797, "l2_params": 271.6715087890625, "l2_updates": 0.3011021614074707, "training_loss": 1.9401060342788696, "uptime": 27722.727304211003, "examples_seen": 77568000.0, "progress": 0.6795123657794881, "epoch": 61.156379720188745, "img/sec/core": 189.92949878611535, "core_hours_Tesla V100-SXM2-32GB": 113.62288156571047, "core_hours": 113.62288156571047}
{"step": 75800, "global_schedule": 0.2752287983894348, "l2_grads": 1.8933992385864258, "l2_params": 271.59942626953125, "l2_updates": 0.3006359040737152, "training_loss": 2.210481643676758, "uptime": 27739.62159588997, "examples_seen": 77619200.0, "progress": 0.6799608887932039, "epoch": 61.19674696752881, "img/sec/core": 189.4130905756674, "core_hours_Tesla V100-SXM2-32GB": 113.69796730650589, "core_hours": 113.69796730650589}
{"step": 75850, "global_schedule": 0.27453768253326416, "l2_grads": 1.9401811361312866, "l2_params": 271.51898193359375, "l2_updates": 0.2991439998149872, "training_loss": 2.0319390296936035, "uptime": 27756.491534514003, "examples_seen": 77670400.0, "progress": 0.6804094118069198, "epoch": 61.23711421486887, "img/sec/core": 189.68652295161397, "core_hours_Tesla V100-SXM2-32GB": 113.7729448115016, "core_hours": 113.7729448115016}
{"step": 75900, "global_schedule": 0.27384719252586365, "l2_grads": 1.881213903427124, "l2_params": 271.43914794921875, "l2_updates": 0.29706183075904846, "training_loss": 3.7057533264160156, "uptime": 27773.366474949988, "examples_seen": 77721600.0, "progress": 0.6808579348206356, "epoch": 61.277481462208925, "img/sec/core": 189.63029897138546, "core_hours_Tesla V100-SXM2-32GB": 113.84794454677264, "core_hours": 113.84794454677264}
{"step": 75950, "global_schedule": 0.27315711975097656, "l2_grads": 1.8425790071487427, "l2_params": 271.3542785644531, "l2_updates": 0.29720747470855713, "training_loss": 3.8601651191711426, "uptime": 27790.24591318, "examples_seen": 77772800.0, "progress": 0.6813064578343515, "epoch": 61.31784870954898, "img/sec/core": 189.57976897065768, "core_hours_Tesla V100-SXM2-32GB": 113.92296427223935, "core_hours": 113.92296427223935}
{"step": 76000, "global_schedule": 0.2724677324295044, "l2_grads": 1.9914265871047974, "l2_params": 271.27374267578125, "l2_updates": 0.29458582401275635, "training_loss": 1.9585572481155396, "uptime": 27807.130157077976, "examples_seen": 77824000.0, "progress": 0.6817549808480673, "epoch": 61.35821595688904, "img/sec/core": 189.52580994067236, "core_hours_Tesla V100-SXM2-32GB": 113.99800535623037, "core_hours": 113.99800535623037}
{"step": 76050, "global_schedule": 0.27177876234054565, "l2_grads": 2.0242185592651367, "l2_params": 271.1954650878906, "l2_updates": 0.2965165674686432, "training_loss": 2.0125937461853027, "uptime": 27824.55648599495, "examples_seen": 77875200.0, "progress": 0.6822035038617832, "epoch": 61.3985832042291, "img/sec/core": 189.71317283527011, "core_hours_Tesla V100-SXM2-32GB": 114.07297232879041, "core_hours": 114.07297232879041}
{"step": 76100, "global_schedule": 0.27109044790267944, "l2_grads": 2.0289881229400635, "l2_params": 271.11614990234375, "l2_updates": 0.30003663897514343, "training_loss": 2.0838534832000732, "uptime": 27841.42644509999, "examples_seen": 77926400.0, "progress": 0.682652026875499, "epoch": 61.438950451569156, "img/sec/core": 189.68629266233182, "core_hours_Tesla V100-SXM2-32GB": 114.1479499248128, "core_hours": 114.1479499248128}
{"step": 76150, "global_schedule": 0.2704026699066162, "l2_grads": 2.0984561443328857, "l2_params": 271.0354309082031, "l2_updates": 0.29077598452568054, "training_loss": 1.8639742136001587, "uptime": 27858.29425989295, "examples_seen": 77977600.0, "progress": 0.6831005498892149, "epoch": 61.47931769890922, "img/sec/core": 189.71040643246107, "core_hours_Tesla V100-SXM2-32GB": 114.22291799055931, "core_hours": 114.22291799055931}
{"step": 76200, "global_schedule": 0.2697153687477112, "l2_grads": 1.7419685125350952, "l2_params": 270.947021484375, "l2_updates": 0.2929667830467224, "training_loss": 2.693378448486328, "uptime": 27875.166560007958, "examples_seen": 78028800.0, "progress": 0.6835490729029307, "epoch": 61.51968494624928, "img/sec/core": 189.65997393288814, "core_hours_Tesla V100-SXM2-32GB": 114.29790599107044, "core_hours": 114.29790599107044}
{"step": 76250, "global_schedule": 0.2690287232398987, "l2_grads": 1.967315673828125, "l2_params": 270.87506103515625, "l2_updates": 0.29350733757019043, "training_loss": 2.520875930786133, "uptime": 27892.01579257095, "examples_seen": 78080000.0, "progress": 0.6839975959166464, "epoch": 61.560052193589335, "img/sec/core": 189.919629160351, "core_hours_Tesla V100-SXM2-32GB": 114.37279146912819, "core_hours": 114.37279146912819}
{"step": 76300, "global_schedule": 0.2683424949645996, "l2_grads": 1.8549646139144897, "l2_params": 270.7921447753906, "l2_updates": 0.2891342341899872, "training_loss": 3.6417245864868164, "uptime": 27908.885355100967, "examples_seen": 78131200.0, "progress": 0.6844461189303623, "epoch": 61.60041944092939, "img/sec/core": 189.69075186781248, "core_hours_Tesla V100-SXM2-32GB": 114.44776730259493, "core_hours": 114.44776730259493}
{"step": 76350, "global_schedule": 0.26765692234039307, "l2_grads": 2.007425546646118, "l2_params": 270.70770263671875, "l2_updates": 0.28873032331466675, "training_loss": 1.9216636419296265, "uptime": 27925.74924242898, "examples_seen": 78182400.0, "progress": 0.6848946419440781, "epoch": 61.64078668826945, "img/sec/core": 189.7545884740447, "core_hours_Tesla V100-SXM2-32GB": 114.52271791294166, "core_hours": 114.52271791294166}
{"step": 76400, "global_schedule": 0.2669718265533447, "l2_grads": 2.025761604309082, "l2_params": 270.6252136230469, "l2_updates": 0.28931504487991333, "training_loss": 2.000080108642578, "uptime": 27942.62633603398, "examples_seen": 78233600.0, "progress": 0.685343164957794, "epoch": 61.68115393560951, "img/sec/core": 189.6061060568049, "core_hours_Tesla V100-SXM2-32GB": 114.59772721785275, "core_hours": 114.59772721785275}
{"step": 76450, "global_schedule": 0.26628729701042175, "l2_grads": 1.85041344165802, "l2_params": 270.5454406738281, "l2_updates": 0.2868765890598297, "training_loss": 3.015202760696411, "uptime": 27959.50214339496, "examples_seen": 78284800.0, "progress": 0.6857916879715098, "epoch": 61.721521182949566, "img/sec/core": 189.62055749695404, "core_hours_Tesla V100-SXM2-32GB": 114.67273080612378, "core_hours": 114.67273080612378}
{"step": 76500, "global_schedule": 0.2656034231185913, "l2_grads": 2.018059253692627, "l2_params": 270.4600524902344, "l2_updates": 0.29161617159843445, "training_loss": 2.089801788330078, "uptime": 27976.364083544002, "examples_seen": 78336000.0, "progress": 0.6862402109852257, "epoch": 61.76188843028963, "img/sec/core": 189.7765009076713, "core_hours_Tesla V100-SXM2-32GB": 114.74767276234175, "core_hours": 114.74767276234175}
{"step": 76550, "global_schedule": 0.2649199962615967, "l2_grads": 2.0574374198913574, "l2_params": 270.380126953125, "l2_updates": 0.2896791696548462, "training_loss": 2.061509132385254, "uptime": 27993.258956937992, "examples_seen": 78387200.0, "progress": 0.6866887339989415, "epoch": 61.80225567762969, "img/sec/core": 189.40656880792173, "core_hours_Tesla V100-SXM2-32GB": 114.82276108853725, "core_hours": 114.82276108853725}
{"step": 76600, "global_schedule": 0.2642372250556946, "l2_grads": 1.9609806537628174, "l2_params": 270.3041076660156, "l2_updates": 0.28712567687034607, "training_loss": 4.448206424713135, "uptime": 28010.128250180976, "examples_seen": 78438400.0, "progress": 0.6871372570126573, "epoch": 61.842622924969746, "img/sec/core": 189.69377992945223, "core_hours_Tesla V100-SXM2-32GB": 114.89773572517274, "core_hours": 114.89773572517274}
{"step": 76650, "global_schedule": 0.2635549306869507, "l2_grads": 2.1204006671905518, "l2_params": 270.21185302734375, "l2_updates": 0.28145524859428406, "training_loss": 2.010535717010498, "uptime": 28027.011942959973, "examples_seen": 78489600.0, "progress": 0.6875857800263732, "epoch": 61.8829901723098, "img/sec/core": 189.53199645878973, "core_hours_Tesla V100-SXM2-32GB": 114.97277435974607, "core_hours": 114.97277435974607}
{"step": 76700, "global_schedule": 0.2628733217716217, "l2_grads": 1.8027557134628296, "l2_params": 270.1242370605469, "l2_updates": 0.28548112511634827, "training_loss": 3.813732147216797, "uptime": 28043.887683657988, "examples_seen": 78540800.0, "progress": 0.688034303040089, "epoch": 61.92335741964986, "img/sec/core": 189.6213065407213, "core_hours_Tesla V100-SXM2-32GB": 115.04777765173723, "core_hours": 115.04777765173723}
{"step": 76750, "global_schedule": 0.26219215989112854, "l2_grads": 1.937642216682434, "l2_params": 270.0492858886719, "l2_updates": 0.28321975469589233, "training_loss": 1.9458515644073486, "uptime": 28060.77733871696, "examples_seen": 78592000.0, "progress": 0.6884828260538048, "epoch": 61.96372466698992, "img/sec/core": 189.4650890635194, "core_hours_Tesla V100-SXM2-32GB": 115.12284278533267, "core_hours": 115.12284278533267}
{"step": 76800, "global_schedule": 0.2615116834640503, "l2_grads": 2.0167932510375977, "l2_params": 269.9645690917969, "l2_updates": 0.28734779357910156, "training_loss": 2.1156606674194336, "uptime": 28077.659792986, "examples_seen": 78643200.0, "progress": 0.6889313490675206, "epoch": 62.004091914329976, "img/sec/core": 189.54590067322172, "core_hours_Tesla V100-SXM2-32GB": 115.1978759154173, "core_hours": 115.1978759154173}
{"step": 76850, "global_schedule": 0.26083165407180786, "l2_grads": 1.848165512084961, "l2_params": 269.8844299316406, "l2_updates": 0.2847681939601898, "training_loss": 1.8329561948776245, "uptime": 28094.542465417006, "examples_seen": 78694400.0, "progress": 0.6893798720812365, "epoch": 62.04445916167004, "img/sec/core": 189.54345131539043, "core_hours_Tesla V100-SXM2-32GB": 115.27291001511065, "core_hours": 115.27291001511065}
{"step": 76900, "global_schedule": 0.26015233993530273, "l2_grads": 1.8309893608093262, "l2_params": 269.7996826171875, "l2_updates": 0.2840035557746887, "training_loss": 2.5017285346984863, "uptime": 28111.396426539985, "examples_seen": 78745600.0, "progress": 0.6898283950949523, "epoch": 62.0848264090101, "img/sec/core": 189.86634516660132, "core_hours_Tesla V100-SXM2-32GB": 115.34781650899055, "core_hours": 115.34781650899055}
{"step": 76950, "global_schedule": 0.25947344303131104, "l2_grads": 1.9878971576690674, "l2_params": 269.7183837890625, "l2_updates": 0.28238800168037415, "training_loss": 2.0334901809692383, "uptime": 28128.282842201006, "examples_seen": 78796800.0, "progress": 0.6902769181086682, "epoch": 62.125193656350156, "img/sec/core": 189.50143501361646, "core_hours_Tesla V100-SXM2-32GB": 115.42286724526177, "core_hours": 115.42286724526177}
{"step": 77000, "global_schedule": 0.25879526138305664, "l2_grads": 1.9668306112289429, "l2_params": 269.6396789550781, "l2_updates": 0.2810848653316498, "training_loss": 1.9354820251464844, "uptime": 28145.15668091399, "examples_seen": 78848000.0, "progress": 0.690725441122384, "epoch": 62.16556090369021, "img/sec/core": 189.6426802715294, "core_hours_Tesla V100-SXM2-32GB": 115.49786208398613, "core_hours": 115.49786208398613}
{"step": 77050, "global_schedule": 0.25811755657196045, "l2_grads": 1.8379801511764526, "l2_params": 269.55810546875, "l2_updates": 0.2825717329978943, "training_loss": 2.998727321624756, "uptime": 28162.82066244498, "examples_seen": 78899200.0, "progress": 0.6911739641360998, "epoch": 62.20592815103027, "img/sec/core": 189.70010971232693, "core_hours_Tesla V100-SXM2-32GB": 115.57283421891948, "core_hours": 115.57283421891948}
{"step": 77100, "global_schedule": 0.2574405074119568, "l2_grads": 1.9267628192901611, "l2_params": 269.47430419921875, "l2_updates": 0.279121994972229, "training_loss": 3.9444077014923096, "uptime": 28179.700181466993, "examples_seen": 78950400.0, "progress": 0.6916224871498157, "epoch": 62.24629539837033, "img/sec/core": 189.57886156750402, "core_hours_Tesla V100-SXM2-32GB": 115.64785430346176, "core_hours": 115.64785430346176}
{"step": 77150, "global_schedule": 0.2567639648914337, "l2_grads": 1.8778443336486816, "l2_params": 269.39410400390625, "l2_updates": 0.2783392071723938, "training_loss": 3.2009730339050293, "uptime": 28196.579371800006, "examples_seen": 79001600.0, "progress": 0.6920710101635315, "epoch": 62.286662645710386, "img/sec/core": 189.5825532425758, "core_hours_Tesla V100-SXM2-32GB": 115.72287292716403, "core_hours": 115.72287292716403}
{"step": 77200, "global_schedule": 0.2560880780220032, "l2_grads": 1.871472954750061, "l2_params": 269.3172912597656, "l2_updates": 0.27771151065826416, "training_loss": 4.031716346740723, "uptime": 28213.453005677962, "examples_seen": 79052800.0, "progress": 0.6925195331772473, "epoch": 62.327029893050444, "img/sec/core": 189.64498241131542, "core_hours_Tesla V100-SXM2-32GB": 115.79786685551052, "core_hours": 115.79786685551052}
{"step": 77250, "global_schedule": 0.2554126977920532, "l2_grads": 1.8828550577163696, "l2_params": 269.2325744628906, "l2_updates": 0.2747431993484497, "training_loss": 4.323941230773926, "uptime": 28230.344390693004, "examples_seen": 79104000.0, "progress": 0.6929680561909631, "epoch": 62.36739714039051, "img/sec/core": 189.44568471740783, "core_hours_Tesla V100-SXM2-32GB": 115.8729396777996, "core_hours": 115.8729396777996}
{"step": 77300, "global_schedule": 0.2547380030155182, "l2_grads": 1.983020544052124, "l2_params": 269.15716552734375, "l2_updates": 0.27753013372421265, "training_loss": 2.067209243774414, "uptime": 28247.221636503004, "examples_seen": 79155200.0, "progress": 0.693416579204679, "epoch": 62.407764387730566, "img/sec/core": 189.60439612155733, "core_hours_Tesla V100-SXM2-32GB": 115.94794965917735, "core_hours": 115.94794965917735}
{"step": 77350, "global_schedule": 0.25406378507614136, "l2_grads": 2.15232515335083, "l2_params": 269.08416748046875, "l2_updates": 0.275511771440506, "training_loss": 1.9222859144210815, "uptime": 28264.118640213972, "examples_seen": 79206400.0, "progress": 0.6938651022183948, "epoch": 62.448131635070624, "img/sec/core": 189.38268906946922, "core_hours_Tesla V100-SXM2-32GB": 116.02304745344833, "core_hours": 116.02304745344833}
{"step": 77400, "global_schedule": 0.25339025259017944, "l2_grads": 2.0047812461853027, "l2_params": 269.0036315917969, "l2_updates": 0.27978962659835815, "training_loss": 1.8897044658660889, "uptime": 28281.025861337956, "examples_seen": 79257600.0, "progress": 0.6943136252321107, "epoch": 62.48849888241068, "img/sec/core": 189.2682408619275, "core_hours_Tesla V100-SXM2-32GB": 116.09819065844381, "core_hours": 116.09819065844381}
{"step": 77450, "global_schedule": 0.2527172565460205, "l2_grads": 2.0642812252044678, "l2_params": 268.92095947265625, "l2_updates": 0.2769770622253418, "training_loss": 1.9210326671600342, "uptime": 28297.909862473956, "examples_seen": 79308800.0, "progress": 0.6947621482458265, "epoch": 62.52886612975074, "img/sec/core": 189.5285349855156, "core_hours_Tesla V100-SXM2-32GB": 116.1732306634927, "core_hours": 116.1732306634927}
{"step": 77500, "global_schedule": 0.2520449161529541, "l2_grads": 2.0530483722686768, "l2_params": 268.8394775390625, "l2_updates": 0.2758254110813141, "training_loss": 4.394577503204346, "uptime": 28314.786149286956, "examples_seen": 79360000.0, "progress": 0.6952106712595423, "epoch": 62.5692333770908, "img/sec/core": 189.61517041385252, "core_hours_Tesla V100-SXM2-32GB": 116.2482363826616, "core_hours": 116.2482363826616, "minival/prec@1": 0.7475023415547923, "minival/loss": 1.0130669876370175, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.8907473839935847, "real/prec@1": 0.7855114546192113, "real/loss": 1.8183237627970408, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.170154596038628, "train/prec@1": 0.782187878078289, "train/loss": 0.8462948678728336, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.565844577969983, "v2/prec@1": 0.5842, "v2/loss": 1.7937501220703125, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3905015629716218, "val/prec@1": 0.71198, "val/loss": 1.1558915869140625, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.26482619496528}
{"step": 77551, "global_schedule": 0.2513730525970459, "l2_grads": 2.0087625980377197, "l2_params": 268.7643737792969, "l2_updates": 0.27625367045402527, "training_loss": 2.380533218383789, "uptime": 28368.010193920985, "examples_seen": 79411200.0, "progress": 0.6956591942732582, "epoch": 62.609600624430854, "img/sec/core": 188.90465383464627, "core_hours_Tesla V100-SXM2-32GB": 116.32352421667478, "core_hours": 116.32352421667478}
{"step": 77600, "global_schedule": 0.250701904296875, "l2_grads": 2.076124668121338, "l2_params": 268.6812438964844, "l2_updates": 0.27208927273750305, "training_loss": 1.9510321617126465, "uptime": 28384.89383552695, "examples_seen": 79462400.0, "progress": 0.696107717286974, "epoch": 62.64996787177092, "img/sec/core": 189.53257091584086, "core_hours_Tesla V100-SXM2-32GB": 116.39856262381241, "core_hours": 116.39856262381241}
{"step": 77650, "global_schedule": 0.2500312626361847, "l2_grads": 2.171342134475708, "l2_params": 268.6034851074219, "l2_updates": 0.27097228169441223, "training_loss": 1.966376543045044, "uptime": 28401.768237688986, "examples_seen": 79513600.0, "progress": 0.6965562403006899, "epoch": 62.690335119110976, "img/sec/core": 189.63634795899267, "core_hours_Tesla V100-SXM2-32GB": 116.47355996675478, "core_hours": 116.47355996675478}
{"step": 77700, "global_schedule": 0.2493613064289093, "l2_grads": 1.9038105010986328, "l2_params": 268.5230407714844, "l2_updates": 0.2702329456806183, "training_loss": 3.17812442779541, "uptime": 28418.650988235953, "examples_seen": 79564800.0, "progress": 0.6970047633144056, "epoch": 62.730702366451034, "img/sec/core": 189.54257430373838, "core_hours_Tesla V100-SXM2-32GB": 116.5485944136302, "core_hours": 116.5485944136302}
{"step": 77750, "global_schedule": 0.2486918568611145, "l2_grads": 2.099414825439453, "l2_params": 268.446533203125, "l2_updates": 0.26841869950294495, "training_loss": 1.9255481958389282, "uptime": 28435.53221810097, "examples_seen": 79616000.0, "progress": 0.6974532863281215, "epoch": 62.77106961379109, "img/sec/core": 189.55964853198597, "core_hours_Tesla V100-SXM2-32GB": 116.62362210191915, "core_hours": 116.62362210191915}
{"step": 77801, "global_schedule": 0.24802309274673462, "l2_grads": 1.9866454601287842, "l2_params": 268.3659362792969, "l2_updates": 0.27064892649650574, "training_loss": 3.932605266571045, "uptime": 28452.42323669698, "examples_seen": 79667200.0, "progress": 0.6979018093418373, "epoch": 62.81143686113115, "img/sec/core": 189.44979438691152, "core_hours_Tesla V100-SXM2-32GB": 116.69869329567922, "core_hours": 116.69869329567922}
{"step": 77850, "global_schedule": 0.24735486507415771, "l2_grads": 1.9941282272338867, "l2_params": 268.2876281738281, "l2_updates": 0.2702462673187256, "training_loss": 1.8941024541854858, "uptime": 28469.30863973999, "examples_seen": 79718400.0, "progress": 0.6983503323555532, "epoch": 62.85180410847121, "img/sec/core": 189.51279941908143, "core_hours_Tesla V100-SXM2-32GB": 116.77373953142592, "core_hours": 116.77373953142592}
{"step": 77900, "global_schedule": 0.24668732285499573, "l2_grads": 2.058149576187134, "l2_params": 268.2019348144531, "l2_updates": 0.26817625761032104, "training_loss": 2.1128649711608887, "uptime": 28486.17375858198, "examples_seen": 79769600.0, "progress": 0.698798855369269, "epoch": 62.892171355811264, "img/sec/core": 189.74073233523893, "core_hours_Tesla V100-SXM2-32GB": 116.84869561516808, "core_hours": 116.84869561516808}
{"step": 77950, "global_schedule": 0.24602028727531433, "l2_grads": 2.1026487350463867, "l2_params": 268.1145935058594, "l2_updates": 0.26596948504447937, "training_loss": 2.042451858520508, "uptime": 28503.045278780977, "examples_seen": 79820800.0, "progress": 0.6992473783829848, "epoch": 62.93253860315133, "img/sec/core": 189.6687413022829, "core_hours_Tesla V100-SXM2-32GB": 116.92368014938587, "core_hours": 116.92368014938587}
{"step": 78001, "global_schedule": 0.24535396695137024, "l2_grads": 2.1635780334472656, "l2_params": 268.0423889160156, "l2_updates": 0.2802160084247589, "training_loss": 1.9703971147537231, "uptime": 28519.920490962977, "examples_seen": 79872000.0, "progress": 0.6996959013967007, "epoch": 62.97290585049139, "img/sec/core": 189.62724530440724, "core_hours_Tesla V100-SXM2-32GB": 116.99868109241697, "core_hours": 116.99868109241697}
{"step": 78050, "global_schedule": 0.24468815326690674, "l2_grads": 2.0393943786621094, "l2_params": 267.9664001464844, "l2_updates": 0.26892557740211487, "training_loss": 1.9665255546569824, "uptime": 28537.35616485396, "examples_seen": 79923200.0, "progress": 0.7001444244104165, "epoch": 63.013273097831444, "img/sec/core": 189.7084870348936, "core_hours_Tesla V100-SXM2-32GB": 117.07364991666154, "core_hours": 117.07364991666154}
{"step": 78100, "global_schedule": 0.24402302503585815, "l2_grads": 2.040266513824463, "l2_params": 267.88958740234375, "l2_updates": 0.2666763961315155, "training_loss": 1.8673725128173828, "uptime": 28554.205252288957, "examples_seen": 79974400.0, "progress": 0.7005929474241324, "epoch": 63.0536403451715, "img/sec/core": 189.92126501484105, "core_hours_Tesla V100-SXM2-32GB": 117.14853474970596, "core_hours": 117.14853474970596}
{"step": 78150, "global_schedule": 0.24335843324661255, "l2_grads": 1.9061847925186157, "l2_params": 267.80828857421875, "l2_updates": 0.26622626185417175, "training_loss": 4.127840518951416, "uptime": 28571.069837243995, "examples_seen": 80025600.0, "progress": 0.7010414704378481, "epoch": 63.09400759251156, "img/sec/core": 189.74673901145354, "core_hours_Tesla V100-SXM2-32GB": 117.22348846061725, "core_hours": 117.22348846061725}
{"step": 78200, "global_schedule": 0.24269458651542664, "l2_grads": 2.032557487487793, "l2_params": 267.72430419921875, "l2_updates": 0.26140865683555603, "training_loss": 3.320141315460205, "uptime": 28587.913273378974, "examples_seen": 80076800.0, "progress": 0.701489993451564, "epoch": 63.13437483985162, "img/sec/core": 189.98498728857888, "core_hours_Tesla V100-SXM2-32GB": 117.2983481767727, "core_hours": 117.2983481767727}
{"step": 78250, "global_schedule": 0.24203121662139893, "l2_grads": 2.0648834705352783, "l2_params": 267.6507263183594, "l2_updates": 0.26080551743507385, "training_loss": 4.123290061950684, "uptime": 28604.781708342955, "examples_seen": 80128000.0, "progress": 0.7019385164652798, "epoch": 63.174742087191674, "img/sec/core": 189.70343169552996, "core_hours_Tesla V100-SXM2-32GB": 117.37331899883483, "core_hours": 117.37331899883483}
{"step": 78300, "global_schedule": 0.24136856198310852, "l2_grads": 2.141526222229004, "l2_params": 267.570556640625, "l2_updates": 0.2599230110645294, "training_loss": 1.9592187404632568, "uptime": 28621.66664034495, "examples_seen": 80179200.0, "progress": 0.7023870394789957, "epoch": 63.21510933453174, "img/sec/core": 189.51808628083396, "core_hours_Tesla V100-SXM2-32GB": 117.44836314106594, "core_hours": 117.44836314106594}
{"step": 78350, "global_schedule": 0.2407064437866211, "l2_grads": 2.146043062210083, "l2_params": 267.4994201660156, "l2_updates": 0.26132944226264954, "training_loss": 1.9343945980072021, "uptime": 28638.52323442098, "examples_seen": 80230400.0, "progress": 0.7028355624927115, "epoch": 63.2554765818718, "img/sec/core": 189.83668857223162, "core_hours_Tesla V100-SXM2-32GB": 117.5232813369594, "core_hours": 117.5232813369594}
{"step": 78400, "global_schedule": 0.24004504084587097, "l2_grads": 1.8532463312149048, "l2_params": 267.41766357421875, "l2_updates": 0.26017001271247864, "training_loss": 2.2765440940856934, "uptime": 28655.415264257987, "examples_seen": 80281600.0, "progress": 0.7032840855064273, "epoch": 63.295843829211854, "img/sec/core": 189.43845297913856, "core_hours_Tesla V100-SXM2-32GB": 117.59835702512387, "core_hours": 117.59835702512387}
{"step": 78450, "global_schedule": 0.23938417434692383, "l2_grads": 2.0148932933807373, "l2_params": 267.3402099609375, "l2_updates": 0.25585639476776123, "training_loss": 3.853940725326538, "uptime": 28672.30481795699, "examples_seen": 80332800.0, "progress": 0.7037326085201432, "epoch": 63.33621107655191, "img/sec/core": 189.4662261080979, "core_hours_Tesla V100-SXM2-32GB": 117.67342170823055, "core_hours": 117.67342170823055}
{"step": 78500, "global_schedule": 0.238724023103714, "l2_grads": 2.0611844062805176, "l2_params": 267.2597351074219, "l2_updates": 0.2608632743358612, "training_loss": 2.012147903442383, "uptime": 28689.178182709962, "examples_seen": 80384000.0, "progress": 0.704181131533859, "epoch": 63.37657832389197, "img/sec/core": 189.64800719050982, "core_hours_Tesla V100-SXM2-32GB": 117.74841444046598, "core_hours": 117.74841444046598}
{"step": 78550, "global_schedule": 0.23806440830230713, "l2_grads": 2.020726203918457, "l2_params": 267.1904602050781, "l2_updates": 0.25445207953453064, "training_loss": 4.227062702178955, "uptime": 28706.047438087, "examples_seen": 80435200.0, "progress": 0.7046296545475749, "epoch": 63.41694557123203, "img/sec/core": 189.69420572977833, "core_hours_Tesla V100-SXM2-32GB": 117.82338890880837, "core_hours": 117.82338890880837}
{"step": 78600, "global_schedule": 0.23740550875663757, "l2_grads": 1.8435688018798828, "l2_params": 267.1073303222656, "l2_updates": 0.2595289647579193, "training_loss": 3.2869997024536133, "uptime": 28722.92480662599, "examples_seen": 80486400.0, "progress": 0.7050781775612907, "epoch": 63.457312818572085, "img/sec/core": 189.60301735471606, "core_hours_Tesla V100-SXM2-32GB": 117.89839943564833, "core_hours": 117.89839943564833}
{"step": 78650, "global_schedule": 0.2367471158504486, "l2_grads": 1.9282984733581543, "l2_params": 267.02569580078125, "l2_updates": 0.2550676167011261, "training_loss": 3.8301124572753906, "uptime": 28739.80251523899, "examples_seen": 80537600.0, "progress": 0.7055267005750065, "epoch": 63.49768006591215, "img/sec/core": 189.5991969866882, "core_hours_Tesla V100-SXM2-32GB": 117.97341147392832, "core_hours": 117.97341147392832}
{"step": 78700, "global_schedule": 0.23608937859535217, "l2_grads": 2.0224828720092773, "l2_params": 266.9471435546875, "l2_updates": 0.25763335824012756, "training_loss": 1.803786039352417, "uptime": 28756.684236234985, "examples_seen": 80588800.0, "progress": 0.7059752235887223, "epoch": 63.53804731325221, "img/sec/core": 189.55413377338405, "core_hours_Tesla V100-SXM2-32GB": 118.04844134502166, "core_hours": 118.04844134502166}
{"step": 78750, "global_schedule": 0.23543238639831543, "l2_grads": 1.8065177202224731, "l2_params": 266.8720397949219, "l2_updates": 0.25674867630004883, "training_loss": 2.3806447982788086, "uptime": 28773.56618690095, "examples_seen": 80640000.0, "progress": 0.7064237466024381, "epoch": 63.578414560592265, "img/sec/core": 189.55155499012398, "core_hours_Tesla V100-SXM2-32GB": 118.12347223687037, "core_hours": 118.12347223687037}
{"step": 78800, "global_schedule": 0.23477590084075928, "l2_grads": 2.045729637145996, "l2_params": 266.79742431640625, "l2_updates": 0.25475382804870605, "training_loss": 3.9435887336730957, "uptime": 28790.431887694984, "examples_seen": 80691200.0, "progress": 0.706872269616154, "epoch": 63.61878180793232, "img/sec/core": 189.73418531958265, "core_hours_Tesla V100-SXM2-32GB": 118.19843090706608, "core_hours": 118.19843090706608}
{"step": 78850, "global_schedule": 0.2341201901435852, "l2_grads": 1.868456244468689, "l2_params": 266.71502685546875, "l2_updates": 0.2519384026527405, "training_loss": 3.79565167427063, "uptime": 28807.301401154953, "examples_seen": 80742400.0, "progress": 0.7073207926298698, "epoch": 63.65914905527238, "img/sec/core": 189.6913036403494, "core_hours_Tesla V100-SXM2-32GB": 118.27340652244374, "core_hours": 118.27340652244374}
{"step": 78900, "global_schedule": 0.23346498608589172, "l2_grads": 2.0130600929260254, "l2_params": 266.6319274902344, "l2_updates": 0.25250476598739624, "training_loss": 4.251689434051514, "uptime": 28824.169343334972, "examples_seen": 80793600.0, "progress": 0.7077693156435857, "epoch": 63.69951630261244, "img/sec/core": 189.70897373543283, "core_hours_Tesla V100-SXM2-32GB": 118.34837515435493, "core_hours": 118.34837515435493}
{"step": 78950, "global_schedule": 0.23281052708625793, "l2_grads": 2.0383481979370117, "l2_params": 266.5567932128906, "l2_updates": 0.2535238564014435, "training_loss": 2.260162591934204, "uptime": 28841.037381346978, "examples_seen": 80844800.0, "progress": 0.7082178386573015, "epoch": 63.739883549952495, "img/sec/core": 189.7078959463095, "core_hours_Tesla V100-SXM2-32GB": 118.42334421218605, "core_hours": 118.42334421218605}
{"step": 79000, "global_schedule": 0.23215660452842712, "l2_grads": 2.0838441848754883, "l2_params": 266.4847717285156, "l2_updates": 0.24940448999404907, "training_loss": 1.957988977432251, "uptime": 28857.92520988395, "examples_seen": 80896000.0, "progress": 0.7086663616710174, "epoch": 63.78025079729256, "img/sec/core": 189.48558087230404, "core_hours_Tesla V100-SXM2-32GB": 118.49840122790594, "core_hours": 118.49840122790594}
{"step": 79050, "global_schedule": 0.231503427028656, "l2_grads": 2.1595842838287354, "l2_params": 266.4057312011719, "l2_updates": 0.24755728244781494, "training_loss": 4.163699626922607, "uptime": 28875.32679305697, "examples_seen": 80947200.0, "progress": 0.7091148846847332, "epoch": 63.82061804463262, "img/sec/core": 189.85176430487772, "core_hours_Tesla V100-SXM2-32GB": 118.57331347470172, "core_hours": 118.57331347470172}
{"step": 79100, "global_schedule": 0.23085078597068787, "l2_grads": 1.9026156663894653, "l2_params": 266.33349609375, "l2_updates": 0.2550373077392578, "training_loss": 2.6348109245300293, "uptime": 28892.186421389983, "examples_seen": 80998400.0, "progress": 0.7095634076984491, "epoch": 63.860985291972675, "img/sec/core": 189.8025233293137, "core_hours_Tesla V100-SXM2-32GB": 118.64824515618176, "core_hours": 118.64824515618176}
{"step": 79150, "global_schedule": 0.23019888997077942, "l2_grads": 1.9921140670776367, "l2_params": 266.2481689453125, "l2_updates": 0.2526717483997345, "training_loss": 1.928797960281372, "uptime": 28909.074323661975, "examples_seen": 81049600.0, "progress": 0.7100119307121648, "epoch": 63.90135253931273, "img/sec/core": 189.48475355089408, "core_hours_Tesla V100-SXM2-32GB": 118.72330249961284, "core_hours": 118.72330249961284}
{"step": 79200, "global_schedule": 0.22954753041267395, "l2_grads": 1.9756821393966675, "l2_params": 266.1717224121094, "l2_updates": 0.24627192318439484, "training_loss": 4.092148303985596, "uptime": 28925.941585046006, "examples_seen": 81100800.0, "progress": 0.7104604537258806, "epoch": 63.94171978665279, "img/sec/core": 189.71663076434243, "core_hours_Tesla V100-SXM2-32GB": 118.7982681057641, "core_hours": 118.7982681057641}
{"step": 79250, "global_schedule": 0.22889694571495056, "l2_grads": 1.9833900928497314, "l2_params": 266.091552734375, "l2_updates": 0.24896714091300964, "training_loss": 2.8025617599487305, "uptime": 28942.819955857005, "examples_seen": 81152000.0, "progress": 0.7109089767395965, "epoch": 63.98208703399285, "img/sec/core": 189.5917583416733, "core_hours_Tesla V100-SXM2-32GB": 118.87328308714632, "core_hours": 118.87328308714632}
{"step": 79300, "global_schedule": 0.22824689745903015, "l2_grads": 1.9069181680679321, "l2_params": 266.01715087890625, "l2_updates": 0.25068971514701843, "training_loss": 3.00673508644104, "uptime": 28959.687232775963, "examples_seen": 81203200.0, "progress": 0.7113574997533123, "epoch": 64.02245428133291, "img/sec/core": 189.71645603347903, "core_hours_Tesla V100-SXM2-32GB": 118.94824876234169, "core_hours": 118.94824876234169}
{"step": 79350, "global_schedule": 0.22759759426116943, "l2_grads": 1.996862530708313, "l2_params": 265.94342041015625, "l2_updates": 0.24177303910255432, "training_loss": 3.7821550369262695, "uptime": 28976.56670426397, "examples_seen": 81254400.0, "progress": 0.7118060227670282, "epoch": 64.06282152867297, "img/sec/core": 189.57939543745937, "core_hours_Tesla V100-SXM2-32GB": 119.0232686356217, "core_hours": 119.0232686356217}
{"step": 79400, "global_schedule": 0.22694885730743408, "l2_grads": 1.952805995941162, "l2_params": 265.86273193359375, "l2_updates": 0.24960534274578094, "training_loss": 2.4230639934539795, "uptime": 28993.411827398988, "examples_seen": 81305600.0, "progress": 0.712254545780744, "epoch": 64.10318877601303, "img/sec/core": 189.9659607324309, "core_hours_Tesla V100-SXM2-32GB": 119.09813584955512, "core_hours": 119.09813584955512}
{"step": 79450, "global_schedule": 0.22630086541175842, "l2_grads": 2.074598550796509, "l2_params": 265.78533935546875, "l2_updates": 0.24382472038269043, "training_loss": 1.895272970199585, "uptime": 29010.284869709983, "examples_seen": 81356800.0, "progress": 0.7127030687944599, "epoch": 64.14355602335309, "img/sec/core": 189.6516313430141, "core_hours_Tesla V100-SXM2-32GB": 119.17312714871511, "core_hours": 119.17312714871511}
{"step": 79500, "global_schedule": 0.22565343976020813, "l2_grads": 2.1767094135284424, "l2_params": 265.70330810546875, "l2_updates": 0.24698475003242493, "training_loss": 1.9408373832702637, "uptime": 29027.128368277976, "examples_seen": 81408000.0, "progress": 0.7131515918081757, "epoch": 64.18392327069314, "img/sec/core": 189.98428308005734, "core_hours_Tesla V100-SXM2-32GB": 119.24798714235062, "core_hours": 119.24798714235062}
{"step": 79550, "global_schedule": 0.22500675916671753, "l2_grads": 2.0004079341888428, "l2_params": 265.6200256347656, "l2_updates": 0.24237681925296783, "training_loss": 2.9108948707580566, "uptime": 29043.989447986998, "examples_seen": 81459200.0, "progress": 0.7136001148218916, "epoch": 64.2242905180332, "img/sec/core": 189.7861854177518, "core_hours_Tesla V100-SXM2-32GB": 119.32292527439073, "core_hours": 119.32292527439073}
{"step": 79600, "global_schedule": 0.2243606448173523, "l2_grads": 1.9333280324935913, "l2_params": 265.54351806640625, "l2_updates": 0.24094586074352264, "training_loss": 3.739358901977539, "uptime": 29060.847139019985, "examples_seen": 81510400.0, "progress": 0.7140486378356073, "epoch": 64.26465776537326, "img/sec/core": 189.82433559485318, "core_hours_Tesla V100-SXM2-32GB": 119.39784834564846, "core_hours": 119.39784834564846}
{"step": 79650, "global_schedule": 0.22371530532836914, "l2_grads": 2.0059268474578857, "l2_params": 265.4708251953125, "l2_updates": 0.24393963813781738, "training_loss": 2.2083983421325684, "uptime": 29077.709157006, "examples_seen": 81561600.0, "progress": 0.7144971608493231, "epoch": 64.30502501271332, "img/sec/core": 189.77562487799105, "core_hours_Tesla V100-SXM2-32GB": 119.47279064780852, "core_hours": 119.47279064780852}
{"step": 79700, "global_schedule": 0.22307050228118896, "l2_grads": 1.9119306802749634, "l2_params": 265.3880310058594, "l2_updates": 0.24030110239982605, "training_loss": 2.7883405685424805, "uptime": 29094.57848598197, "examples_seen": 81612800.0, "progress": 0.714945683863039, "epoch": 64.34539226005337, "img/sec/core": 189.69337811590555, "core_hours_Tesla V100-SXM2-32GB": 119.54776544325726, "core_hours": 119.54776544325726}
{"step": 79750, "global_schedule": 0.22242647409439087, "l2_grads": 2.11037015914917, "l2_params": 265.3097229003906, "l2_updates": 0.2393740862607956, "training_loss": 4.1394805908203125, "uptime": 29111.436808736005, "examples_seen": 81664000.0, "progress": 0.7153942068767548, "epoch": 64.38575950739343, "img/sec/core": 189.81722243001767, "core_hours_Tesla V100-SXM2-32GB": 119.6226913221641, "core_hours": 119.6226913221641}
{"step": 79800, "global_schedule": 0.22178301215171814, "l2_grads": 2.101048469543457, "l2_params": 265.2314453125, "l2_updates": 0.24372299015522003, "training_loss": 1.8657760620117188, "uptime": 29128.30794790096, "examples_seen": 81715200.0, "progress": 0.7158427298904707, "epoch": 64.42612675473349, "img/sec/core": 189.67302496365718, "core_hours_Tesla V100-SXM2-32GB": 119.69767416289723, "core_hours": 119.69767416289723}
{"step": 79850, "global_schedule": 0.2211402952671051, "l2_grads": 1.9089728593826294, "l2_params": 265.1524353027344, "l2_updates": 0.24143573641777039, "training_loss": 4.006800174713135, "uptime": 29145.183686054952, "examples_seen": 81766400.0, "progress": 0.7162912529041865, "epoch": 64.46649400207355, "img/sec/core": 189.6213351262063, "core_hours_Tesla V100-SXM2-32GB": 119.77267744358163, "core_hours": 119.77267744358163}
{"step": 79900, "global_schedule": 0.22049817442893982, "l2_grads": 1.9687327146530151, "l2_params": 265.0845642089844, "l2_updates": 0.24061034619808197, "training_loss": 2.5997769832611084, "uptime": 29162.04446776997, "examples_seen": 81817600.0, "progress": 0.7167397759179024, "epoch": 64.50686124941362, "img/sec/core": 189.78953965993242, "core_hours_Tesla V100-SXM2-32GB": 119.84761425120395, "core_hours": 119.84761425120395}
{"step": 79950, "global_schedule": 0.21985682845115662, "l2_grads": 2.0430872440338135, "l2_params": 265.004638671875, "l2_updates": 0.23946601152420044, "training_loss": 3.964831829071045, "uptime": 29178.925086489005, "examples_seen": 81868800.0, "progress": 0.7171882989316182, "epoch": 64.54722849675368, "img/sec/core": 189.56651135018137, "core_hours_Tesla V100-SXM2-32GB": 119.92263922328854, "core_hours": 119.92263922328854}
{"step": 80000, "global_schedule": 0.2192160189151764, "l2_grads": 1.9968572854995728, "l2_params": 264.9302978515625, "l2_updates": 0.2396298348903656, "training_loss": 2.3141367435455322, "uptime": 29195.81494148099, "examples_seen": 81920000.0, "progress": 0.7176368219453341, "epoch": 64.58759574409373, "img/sec/core": 189.46284627777408, "core_hours_Tesla V100-SXM2-32GB": 119.99770524547513, "core_hours": 119.99770524547513, "minival/prec@1": 0.7483609116453325, "minival/loss": 1.0093901911416054, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.8894820749992505, "real/prec@1": 0.7885005444413604, "real/loss": 1.8082493275590412, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.202873935981188, "train/prec@1": 0.7865589509425126, "train/loss": 0.8296793828369541, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.588300755014643, "v2/prec@1": 0.5865, "v2/loss": 1.7917408935546875, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3391981570166536, "val/prec@1": 0.71606, "val/loss": 1.1517830932617188, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.264697236998472}
{"step": 80050, "global_schedule": 0.21857601404190063, "l2_grads": 2.131901264190674, "l2_params": 264.8567199707031, "l2_updates": 0.23466752469539642, "training_loss": 4.100987434387207, "uptime": 29249.56247525895, "examples_seen": 81971200.0, "progress": 0.7180853449590499, "epoch": 64.62796299143379, "img/sec/core": 188.93349257190948, "core_hours_Tesla V100-SXM2-32GB": 120.07298158758164, "core_hours": 120.07298158758164}
{"step": 80100, "global_schedule": 0.21793657541275024, "l2_grads": 1.920664668083191, "l2_params": 264.78363037109375, "l2_updates": 0.23738236725330353, "training_loss": 2.863881826400757, "uptime": 29266.44087880099, "examples_seen": 82022400.0, "progress": 0.7185338679727656, "epoch": 64.66833023877385, "img/sec/core": 189.59139068038527, "core_hours_Tesla V100-SXM2-32GB": 120.14799671443515, "core_hours": 120.14799671443515}
{"step": 80150, "global_schedule": 0.21729791164398193, "l2_grads": 2.1600112915039062, "l2_params": 264.703125, "l2_updates": 0.23443029820919037, "training_loss": 2.051316738128662, "uptime": 29283.325057192997, "examples_seen": 82073600.0, "progress": 0.7189823909864815, "epoch": 64.7086974861139, "img/sec/core": 189.52654524870945, "core_hours_Tesla V100-SXM2-32GB": 120.22303750728852, "core_hours": 120.22303750728852}
{"step": 80200, "global_schedule": 0.216659814119339, "l2_grads": 2.1038222312927246, "l2_params": 264.6298522949219, "l2_updates": 0.23390308022499084, "training_loss": 2.298389196395874, "uptime": 29300.202084383985, "examples_seen": 82124800.0, "progress": 0.7194309140001973, "epoch": 64.74906473345396, "img/sec/core": 189.6068521894999, "core_hours_Tesla V100-SXM2-32GB": 120.29804651702625, "core_hours": 120.29804651702625}
{"step": 80250, "global_schedule": 0.21602249145507812, "l2_grads": 2.0751726627349854, "l2_params": 264.5547180175781, "l2_updates": 0.23771905899047852, "training_loss": 2.116380214691162, "uptime": 29317.081733324972, "examples_seen": 82176000.0, "progress": 0.7198794370139132, "epoch": 64.78943198079402, "img/sec/core": 189.5774024203667, "core_hours_Tesla V100-SXM2-32GB": 120.37306717898619, "core_hours": 120.37306717898619}
{"step": 80300, "global_schedule": 0.21538576483726501, "l2_grads": 1.9979416131973267, "l2_params": 264.4831237792969, "l2_updates": 0.23150311410427094, "training_loss": 2.9966158866882324, "uptime": 29333.970656636986, "examples_seen": 82227200.0, "progress": 0.720327960027629, "epoch": 64.82979922813408, "img/sec/core": 189.47329802390433, "core_hours_Tesla V100-SXM2-32GB": 120.4481290603729, "core_hours": 120.4481290603729}
{"step": 80350, "global_schedule": 0.21474981307983398, "l2_grads": 2.1478283405303955, "l2_params": 264.4124755859375, "l2_updates": 0.23520790040493011, "training_loss": 1.7892088890075684, "uptime": 29350.860691537964, "examples_seen": 82278400.0, "progress": 0.7207764830413449, "epoch": 64.87016647547414, "img/sec/core": 189.46082816055448, "core_hours_Tesla V100-SXM2-32GB": 120.52319588215504, "core_hours": 120.52319588215504}
{"step": 80400, "global_schedule": 0.2141144573688507, "l2_grads": 2.0451416969299316, "l2_params": 264.3348388671875, "l2_updates": 0.23595628142356873, "training_loss": 4.169811248779297, "uptime": 29367.72921684495, "examples_seen": 82329600.0, "progress": 0.7212250060550607, "epoch": 64.9105337228142, "img/sec/core": 189.70241569812163, "core_hours_Tesla V100-SXM2-32GB": 120.59816710574164, "core_hours": 120.59816710574164}
{"step": 80450, "global_schedule": 0.2134798765182495, "l2_grads": 2.1626603603363037, "l2_params": 264.26275634765625, "l2_updates": 0.23022665083408356, "training_loss": 2.009641408920288, "uptime": 29384.615051034954, "examples_seen": 82380800.0, "progress": 0.7216735290687765, "epoch": 64.95090097015425, "img/sec/core": 189.50796057763836, "core_hours_Tesla V100-SXM2-32GB": 120.67321525769722, "core_hours": 120.67321525769722}
{"step": 80500, "global_schedule": 0.21284589171409607, "l2_grads": 2.10438871383667, "l2_params": 264.1884765625, "l2_updates": 0.23213428258895874, "training_loss": 1.9549795389175415, "uptime": 29401.513590657967, "examples_seen": 82432000.0, "progress": 0.7221220520824924, "epoch": 64.99126821749431, "img/sec/core": 189.36547603451936, "core_hours_Tesla V100-SXM2-32GB": 120.74831987824395, "core_hours": 120.74831987824395}
{"step": 80550, "global_schedule": 0.2122126817703247, "l2_grads": 2.193498373031616, "l2_params": 264.10003662109375, "l2_updates": 0.23025688529014587, "training_loss": 1.807438611984253, "uptime": 29418.403373093985, "examples_seen": 82483200.0, "progress": 0.7225705750962081, "epoch": 65.03163546483437, "img/sec/core": 189.46366018167345, "core_hours_Tesla V100-SXM2-32GB": 120.82338557795957, "core_hours": 120.82338557795957}
{"step": 80600, "global_schedule": 0.2115800678730011, "l2_grads": 1.9890201091766357, "l2_params": 264.03021240234375, "l2_updates": 0.22826479375362396, "training_loss": 2.89555025100708, "uptime": 29435.27987998299, "examples_seen": 82534400.0, "progress": 0.723019098109924, "epoch": 65.07200271217442, "img/sec/core": 189.61269776061175, "core_hours_Tesla V100-SXM2-32GB": 120.89839227524405, "core_hours": 120.89839227524405}
{"step": 80650, "global_schedule": 0.21094822883605957, "l2_grads": 1.9959343671798706, "l2_params": 263.9532470703125, "l2_updates": 0.22534556686878204, "training_loss": 3.313981056213379, "uptime": 29452.16113635496, "examples_seen": 82585600.0, "progress": 0.7234676211236398, "epoch": 65.1123699595145, "img/sec/core": 189.55935088536836, "core_hours_Tesla V100-SXM2-32GB": 120.97342008134169, "core_hours": 120.97342008134169}
{"step": 80700, "global_schedule": 0.21031701564788818, "l2_grads": 2.083009958267212, "l2_params": 263.8838195800781, "l2_updates": 0.23105259239673615, "training_loss": 1.8937426805496216, "uptime": 29469.046517702984, "examples_seen": 82636800.0, "progress": 0.7239161441373557, "epoch": 65.15273720685455, "img/sec/core": 189.51304291238543, "core_hours_Tesla V100-SXM2-32GB": 121.04846622066624, "core_hours": 121.04846622066624}
{"step": 80750, "global_schedule": 0.20968657732009888, "l2_grads": 2.0369675159454346, "l2_params": 263.8132629394531, "l2_updates": 0.22822560369968414, "training_loss": 2.017991304397583, "uptime": 29485.949808445002, "examples_seen": 82688000.0, "progress": 0.7243646671510715, "epoch": 65.19310445419461, "img/sec/core": 189.31224983578733, "core_hours_Tesla V100-SXM2-32GB": 121.12359195729742, "core_hours": 121.12359195729742}
{"step": 80800, "global_schedule": 0.20905673503875732, "l2_grads": 1.9439613819122314, "l2_params": 263.74005126953125, "l2_updates": 0.23003222048282623, "training_loss": 3.6416640281677246, "uptime": 29502.84489764797, "examples_seen": 82739200.0, "progress": 0.7248131901647874, "epoch": 65.23347170153467, "img/sec/core": 189.40414942809892, "core_hours_Tesla V100-SXM2-32GB": 121.19868124264396, "core_hours": 121.19868124264396}
{"step": 80850, "global_schedule": 0.2084275782108307, "l2_grads": 2.081542730331421, "l2_params": 263.6655578613281, "l2_updates": 0.2235558032989502, "training_loss": 3.0293593406677246, "uptime": 29519.716665457992, "examples_seen": 82790400.0, "progress": 0.7252617131785032, "epoch": 65.27383894887473, "img/sec/core": 189.66595771304824, "core_hours_Tesla V100-SXM2-32GB": 121.27366687735517, "core_hours": 121.27366687735517}
{"step": 80900, "global_schedule": 0.20779922604560852, "l2_grads": 1.9972178936004639, "l2_params": 263.5970153808594, "l2_updates": 0.22546623647212982, "training_loss": 2.752094268798828, "uptime": 29536.624530410976, "examples_seen": 82841600.0, "progress": 0.725710236192219, "epoch": 65.31420619621478, "img/sec/core": 189.26103377915157, "core_hours_Tesla V100-SXM2-32GB": 121.34881294381287, "core_hours": 121.34881294381287}
{"step": 80950, "global_schedule": 0.20717158913612366, "l2_grads": 2.123910427093506, "l2_params": 263.52410888671875, "l2_updates": 0.22728340327739716, "training_loss": 2.022796392440796, "uptime": 29553.503734252998, "examples_seen": 82892800.0, "progress": 0.7261587592059349, "epoch": 65.35457344355484, "img/sec/core": 189.58240151312458, "core_hours_Tesla V100-SXM2-32GB": 121.4238316275552, "core_hours": 121.4238316275552}
{"step": 81000, "global_schedule": 0.20654454827308655, "l2_grads": 2.0327863693237305, "l2_params": 263.4521484375, "l2_updates": 0.22522808611392975, "training_loss": 4.05271577835083, "uptime": 29570.385656227998, "examples_seen": 82944000.0, "progress": 0.7266072822196507, "epoch": 65.3949406908949, "img/sec/core": 189.5518771345313, "core_hours_Tesla V100-SXM2-32GB": 121.49886239188852, "core_hours": 121.49886239188852}
{"step": 81050, "global_schedule": 0.2059183120727539, "l2_grads": 2.027597188949585, "l2_params": 263.3789978027344, "l2_updates": 0.22156769037246704, "training_loss": 2.8646786212921143, "uptime": 29588.006123266998, "examples_seen": 82995200.0, "progress": 0.7270558052333665, "epoch": 65.43530793823496, "img/sec/core": 189.48853303175818, "core_hours_Tesla V100-SXM2-32GB": 121.57391823824857, "core_hours": 121.57391823824857}
{"step": 81101, "global_schedule": 0.20529267191886902, "l2_grads": 2.044546365737915, "l2_params": 263.3046569824219, "l2_updates": 0.2231454849243164, "training_loss": 2.2272980213165283, "uptime": 29604.88881380699, "examples_seen": 83046400.0, "progress": 0.7275043282470823, "epoch": 65.47567518557501, "img/sec/core": 189.54324800421904, "core_hours_Tesla V100-SXM2-32GB": 121.6489524184263, "core_hours": 121.6489524184263}
{"step": 81150, "global_schedule": 0.2046678364276886, "l2_grads": 1.9424355030059814, "l2_params": 263.2286376953125, "l2_updates": 0.2239682823419571, "training_loss": 3.4717304706573486, "uptime": 29621.784116974974, "examples_seen": 83097600.0, "progress": 0.7279528512607982, "epoch": 65.51604243291507, "img/sec/core": 189.40175078146754, "core_hours_Tesla V100-SXM2-32GB": 121.72404265472846, "core_hours": 121.72404265472846}
{"step": 81200, "global_schedule": 0.20404362678527832, "l2_grads": 1.9446393251419067, "l2_params": 263.15185546875, "l2_updates": 0.22086310386657715, "training_loss": 2.4162118434906006, "uptime": 29638.667915018974, "examples_seen": 83148800.0, "progress": 0.728401374274514, "epoch": 65.55640968025513, "img/sec/core": 189.53081478827156, "core_hours_Tesla V100-SXM2-32GB": 121.79908175714624, "core_hours": 121.79908175714624}
{"step": 81250, "global_schedule": 0.20342019200325012, "l2_grads": 1.915505290031433, "l2_params": 263.0824890136719, "l2_updates": 0.22047656774520874, "training_loss": 3.349862813949585, "uptime": 29655.563154592004, "examples_seen": 83200000.0, "progress": 0.7288498972882299, "epoch": 65.59677692759519, "img/sec/core": 189.40246370392603, "core_hours_Tesla V100-SXM2-32GB": 121.87417171080416, "core_hours": 121.87417171080416}
{"step": 81300, "global_schedule": 0.20279741287231445, "l2_grads": 2.1615288257598877, "l2_params": 263.01129150390625, "l2_updates": 0.22255365550518036, "training_loss": 1.893795132637024, "uptime": 29672.442498879973, "examples_seen": 83251200.0, "progress": 0.7292984203019457, "epoch": 65.63714417493524, "img/sec/core": 189.58082407744374, "core_hours_Tesla V100-SXM2-32GB": 121.94919101875068, "core_hours": 121.94919101875068}
{"step": 81350, "global_schedule": 0.20217540860176086, "l2_grads": 2.141104221343994, "l2_params": 262.94842529296875, "l2_updates": 0.21608439087867737, "training_loss": 3.595792531967163, "uptime": 29689.343169990985, "examples_seen": 83302400.0, "progress": 0.7297469433156615, "epoch": 65.67751142227532, "img/sec/core": 189.34159353677413, "core_hours_Tesla V100-SXM2-32GB": 122.02430511257741, "core_hours": 122.02430511257741}
{"step": 81400, "global_schedule": 0.20155403017997742, "l2_grads": 2.0921199321746826, "l2_params": 262.87579345703125, "l2_updates": 0.21946842968463898, "training_loss": 1.8498302698135376, "uptime": 29706.224966235983, "examples_seen": 83353600.0, "progress": 0.7301954663293774, "epoch": 65.71787866961537, "img/sec/core": 189.55328885385845, "core_hours_Tesla V100-SXM2-32GB": 122.09933531811072, "core_hours": 122.09933531811072}
{"step": 81450, "global_schedule": 0.20093345642089844, "l2_grads": 2.058976173400879, "l2_params": 262.8047790527344, "l2_updates": 0.21975767612457275, "training_loss": 2.3756885528564453, "uptime": 29723.10817211197, "examples_seen": 83404800.0, "progress": 0.7306439893430932, "epoch": 65.75824591695543, "img/sec/core": 189.53746246447943, "core_hours_Tesla V100-SXM2-32GB": 122.17437178867067, "core_hours": 122.17437178867067}
{"step": 81500, "global_schedule": 0.200313538312912, "l2_grads": 1.9989612102508545, "l2_params": 262.72747802734375, "l2_updates": 0.21887513995170593, "training_loss": 3.1519060134887695, "uptime": 29740.007950843952, "examples_seen": 83456000.0, "progress": 0.731092512356809, "epoch": 65.79861316429549, "img/sec/core": 189.35159156516735, "core_hours_Tesla V100-SXM2-32GB": 122.24948191636837, "core_hours": 122.24948191636837}
{"step": 81550, "global_schedule": 0.19969439506530762, "l2_grads": 1.986797571182251, "l2_params": 262.66009521484375, "l2_updates": 0.21611662209033966, "training_loss": 2.876783609390259, "uptime": 29756.89741032099, "examples_seen": 83507200.0, "progress": 0.7315410353705248, "epoch": 65.83898041163555, "img/sec/core": 189.4672830915843, "core_hours_Tesla V100-SXM2-32GB": 122.32454618071077, "core_hours": 122.32454618071077}
{"step": 81600, "global_schedule": 0.1990758776664734, "l2_grads": 2.2472305297851562, "l2_params": 262.59228515625, "l2_updates": 0.2123044729232788, "training_loss": 4.141525745391846, "uptime": 29773.78583909897, "examples_seen": 83558400.0, "progress": 0.7319895583842407, "epoch": 65.8793476589756, "img/sec/core": 189.4788462602451, "core_hours_Tesla V100-SXM2-32GB": 122.39960586416846, "core_hours": 122.39960586416846}
{"step": 81650, "global_schedule": 0.19845819473266602, "l2_grads": 1.930092453956604, "l2_params": 262.5213928222656, "l2_updates": 0.2158607840538025, "training_loss": 2.9240899085998535, "uptime": 29790.675668326963, "examples_seen": 83609600.0, "progress": 0.7324380813979565, "epoch": 65.91971490631566, "img/sec/core": 189.4631352871569, "core_hours_Tesla V100-SXM2-32GB": 122.4746717718484, "core_hours": 122.4746717718484}
{"step": 81700, "global_schedule": 0.19784113764762878, "l2_grads": 2.1649527549743652, "l2_params": 262.44512939453125, "l2_updates": 0.21582084894180298, "training_loss": 1.849177360534668, "uptime": 29807.556538612, "examples_seen": 83660800.0, "progress": 0.7328866044116724, "epoch": 65.96008215365572, "img/sec/core": 189.56368634835934, "core_hours_Tesla V100-SXM2-32GB": 122.54969786200414, "core_hours": 122.54969786200414}
{"step": 81750, "global_schedule": 0.19722488522529602, "l2_grads": 2.1519947052001953, "l2_params": 262.3735046386719, "l2_updates": 0.21724973618984222, "training_loss": 1.7772027254104614, "uptime": 29824.425573128974, "examples_seen": 83712000.0, "progress": 0.7333351274253882, "epoch": 66.00044940099578, "img/sec/core": 189.69668932623392, "core_hours_Tesla V100-SXM2-32GB": 122.62467134874625, "core_hours": 122.62467134874625}
{"step": 81800, "global_schedule": 0.1966092884540558, "l2_grads": 1.956915259361267, "l2_params": 262.30450439453125, "l2_updates": 0.2148936241865158, "training_loss": 2.1386022567749023, "uptime": 29841.327363524004, "examples_seen": 83763200.0, "progress": 0.733783650439104, "epoch": 66.04081664833583, "img/sec/core": 189.3290548048093, "core_hours_Tesla V100-SXM2-32GB": 122.6997904171686, "core_hours": 122.6997904171686}
{"step": 81851, "global_schedule": 0.19599449634552002, "l2_grads": 2.0191490650177, "l2_params": 262.2339172363281, "l2_updates": 0.2139841616153717, "training_loss": 3.6005477905273438, "uptime": 29858.204082056996, "examples_seen": 83814400.0, "progress": 0.7342321734528199, "epoch": 66.08118389567589, "img/sec/core": 189.61031990574924, "core_hours_Tesla V100-SXM2-32GB": 122.77479805509302, "core_hours": 122.77479805509302}
{"step": 81900, "global_schedule": 0.19538041949272156, "l2_grads": 2.1467483043670654, "l2_params": 262.1570739746094, "l2_updates": 0.2115640938282013, "training_loss": 4.109167575836182, "uptime": 29875.096986235003, "examples_seen": 83865600.0, "progress": 0.7346806964665357, "epoch": 66.12155114301595, "img/sec/core": 189.42864804538374, "core_hours_Tesla V100-SXM2-32GB": 122.84987762921747, "core_hours": 122.84987762921747}
{"step": 81950, "global_schedule": 0.19476699829101562, "l2_grads": 2.2126107215881348, "l2_params": 262.0917663574219, "l2_updates": 0.21007078886032104, "training_loss": 3.8129775524139404, "uptime": 29891.96509852796, "examples_seen": 83916800.0, "progress": 0.7351292194802516, "epoch": 66.161918390356, "img/sec/core": 189.70706054265284, "core_hours_Tesla V100-SXM2-32GB": 122.92484701718618, "core_hours": 122.92484701718618}
{"step": 82000, "global_schedule": 0.19415441155433655, "l2_grads": 2.152956485748291, "l2_params": 262.0169372558594, "l2_updates": 0.21419140696525574, "training_loss": 1.8190070390701294, "uptime": 29908.845351643977, "examples_seen": 83968000.0, "progress": 0.7355777424939673, "epoch": 66.20228563769606, "img/sec/core": 189.5706170995405, "core_hours_Tesla V100-SXM2-32GB": 122.99987036436848, "core_hours": 122.99987036436848}
{"step": 82050, "global_schedule": 0.1935424506664276, "l2_grads": 2.041088342666626, "l2_params": 261.9437255859375, "l2_updates": 0.2097725123167038, "training_loss": 3.3761000633239746, "uptime": 29926.20683175599, "examples_seen": 84019200.0, "progress": 0.7360262655076832, "epoch": 66.24265288503614, "img/sec/core": 189.8505057470114, "core_hours_Tesla V100-SXM2-32GB": 123.07478310777289, "core_hours": 123.07478310777289}
{"step": 82100, "global_schedule": 0.19293129444122314, "l2_grads": 2.2417690753936768, "l2_params": 261.87713623046875, "l2_updates": 0.20788542926311493, "training_loss": 3.990518093109131, "uptime": 29943.085352436, "examples_seen": 84070400.0, "progress": 0.736474788521399, "epoch": 66.2830201323762, "img/sec/core": 189.59007490449218, "core_hours_Tesla V100-SXM2-32GB": 123.14979875523959, "core_hours": 123.14979875523959}
{"step": 82150, "global_schedule": 0.1923208236694336, "l2_grads": 1.9652467966079712, "l2_params": 261.8084411621094, "l2_updates": 0.20813529193401337, "training_loss": 3.17387056350708, "uptime": 29959.95092317398, "examples_seen": 84121600.0, "progress": 0.7369233115351149, "epoch": 66.32338737971625, "img/sec/core": 189.73564842331615, "core_hours_Tesla V100-SXM2-32GB": 123.22475684740839, "core_hours": 123.22475684740839}
{"step": 82200, "global_schedule": 0.1917111575603485, "l2_grads": 2.2504794597625732, "l2_params": 261.7351989746094, "l2_updates": 0.20993518829345703, "training_loss": 1.7458397150039673, "uptime": 29976.800860029995, "examples_seen": 84172800.0, "progress": 0.7373718345488307, "epoch": 66.36375462705631, "img/sec/core": 189.91169090688066, "core_hours_Tesla V100-SXM2-32GB": 123.29964545565736, "core_hours": 123.29964545565736}
{"step": 82250, "global_schedule": 0.19110214710235596, "l2_grads": 2.081930637359619, "l2_params": 261.6678466796875, "l2_updates": 0.20725645124912262, "training_loss": 4.156556129455566, "uptime": 29993.66997309297, "examples_seen": 84224000.0, "progress": 0.7378203575625465, "epoch": 66.40412187439637, "img/sec/core": 189.69580606011021, "core_hours_Tesla V100-SXM2-32GB": 123.37461929149279, "core_hours": 123.37461929149279}
{"step": 82300, "global_schedule": 0.19049394130706787, "l2_grads": 2.2135283946990967, "l2_params": 261.593994140625, "l2_updates": 0.20673778653144836, "training_loss": 4.315860748291016, "uptime": 30010.528718156973, "examples_seen": 84275200.0, "progress": 0.7382688805762624, "epoch": 66.44448912173642, "img/sec/core": 189.81246752656745, "core_hours_Tesla V100-SXM2-32GB": 123.4495470473328, "core_hours": 123.4495470473328}
{"step": 82350, "global_schedule": 0.1898864209651947, "l2_grads": 2.1297147274017334, "l2_params": 261.526611328125, "l2_updates": 0.20817972719669342, "training_loss": 1.940123438835144, "uptime": 30027.395896219998, "examples_seen": 84326400.0, "progress": 0.7387174035899782, "epoch": 66.48485636907648, "img/sec/core": 189.71756793241255, "core_hours_Tesla V100-SXM2-32GB": 123.52451228316848, "core_hours": 123.52451228316848}
{"step": 82400, "global_schedule": 0.1892797350883484, "l2_grads": 2.047419548034668, "l2_params": 261.4537353515625, "l2_updates": 0.20446521043777466, "training_loss": 3.3318727016448975, "uptime": 30044.277232325985, "examples_seen": 84377600.0, "progress": 0.7391659266036941, "epoch": 66.52522361641654, "img/sec/core": 189.5584555576162, "core_hours_Tesla V100-SXM2-32GB": 123.59954044363954, "core_hours": 123.59954044363954}
{"step": 82450, "global_schedule": 0.18867367506027222, "l2_grads": 2.2965481281280518, "l2_params": 261.383056640625, "l2_updates": 0.2059302181005478, "training_loss": 4.346323013305664, "uptime": 30061.11723659298, "examples_seen": 84428800.0, "progress": 0.7396144496174099, "epoch": 66.5655908637566, "img/sec/core": 190.02370482004366, "core_hours_Tesla V100-SXM2-32GB": 123.67438490704839, "core_hours": 123.67438490704839}
{"step": 82500, "global_schedule": 0.1880684792995453, "l2_grads": 2.149866819381714, "l2_params": 261.310791015625, "l2_updates": 0.2070063054561615, "training_loss": 2.165726661682129, "uptime": 30077.983759869006, "examples_seen": 84480000.0, "progress": 0.7400629726311257, "epoch": 66.60595811109665, "img/sec/core": 189.72493308971755, "core_hours_Tesla V100-SXM2-32GB": 123.74934723271963, "core_hours": 123.74934723271963, "minival/prec@1": 0.7553855760224789, "minival/loss": 0.9934856022963701, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.8982084799790755, "real/prec@1": 0.7961867754126012, "real/loss": 1.7815952538441162, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.216730246029329, "train/prec@1": 0.7978378800296608, "train/loss": 0.7990623568732971, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.578937534010038, "v2/prec@1": 0.5946, "v2/loss": 1.763522900390625, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.389425238012336, "val/prec@1": 0.72332, "val/loss": 1.1303260998535156, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.362473218003288}
{"step": 82550, "global_schedule": 0.1874639093875885, "l2_grads": 2.091683864593506, "l2_params": 261.2422180175781, "l2_updates": 0.2031136155128479, "training_loss": 3.581921100616455, "uptime": 30131.36423690495, "examples_seen": 84531200.0, "progress": 0.7405114956448415, "epoch": 66.64632535843671, "img/sec/core": 188.98339753689507, "core_hours_Tesla V100-SXM2-32GB": 123.824603696555, "core_hours": 123.824603696555}
{"step": 82600, "global_schedule": 0.18686020374298096, "l2_grads": 2.083648204803467, "l2_params": 261.16552734375, "l2_updates": 0.20167602598667145, "training_loss": 2.3729248046875, "uptime": 30148.228806403, "examples_seen": 84582400.0, "progress": 0.7409600186585573, "epoch": 66.68669260577677, "img/sec/core": 189.74691292118285, "core_hours_Tesla V100-SXM2-32GB": 123.89955733876856, "core_hours": 123.89955733876856}
{"step": 82650, "global_schedule": 0.18625715374946594, "l2_grads": 2.1157870292663574, "l2_params": 261.10357666015625, "l2_updates": 0.20316189527511597, "training_loss": 2.455068588256836, "uptime": 30165.126746394963, "examples_seen": 84633600.0, "progress": 0.7414085416722732, "epoch": 66.72705985311683, "img/sec/core": 189.37219575416023, "core_hours_Tesla V100-SXM2-32GB": 123.9746592942884, "core_hours": 123.9746592942884}
{"step": 82700, "global_schedule": 0.18565493822097778, "l2_grads": 2.286813497543335, "l2_params": 261.03167724609375, "l2_updates": 0.20118536055088043, "training_loss": 4.149686336517334, "uptime": 30182.013643878978, "examples_seen": 84684800.0, "progress": 0.741857064685989, "epoch": 66.76742710045689, "img/sec/core": 189.49602809095364, "core_hours_Tesla V100-SXM2-32GB": 124.04971217199514, "core_hours": 124.04971217199514}
{"step": 82750, "global_schedule": 0.18505337834358215, "l2_grads": 2.1335361003875732, "l2_params": 260.9612121582031, "l2_updates": 0.19959446787834167, "training_loss": 4.072211265563965, "uptime": 30198.914361895004, "examples_seen": 84736000.0, "progress": 0.7423055876997049, "epoch": 66.80779434779694, "img/sec/core": 189.3410680519967, "core_hours_Tesla V100-SXM2-32GB": 124.12482647428858, "core_hours": 124.12482647428858}
{"step": 82801, "global_schedule": 0.18445268273353577, "l2_grads": 1.9843621253967285, "l2_params": 260.89593505859375, "l2_updates": 0.19911827147006989, "training_loss": 2.304997205734253, "uptime": 30215.828225742967, "examples_seen": 84787200.0, "progress": 0.7427541107134207, "epoch": 66.84816159513701, "img/sec/core": 189.19390795411252, "core_hours_Tesla V100-SXM2-32GB": 124.19999920250174, "core_hours": 124.19999920250174}
{"step": 82850, "global_schedule": 0.1838526427745819, "l2_grads": 2.2342562675476074, "l2_params": 260.8210144042969, "l2_updates": 0.19851364195346832, "training_loss": 1.8600877523422241, "uptime": 30232.71805263695, "examples_seen": 84838400.0, "progress": 0.7432026337271366, "epoch": 66.88852884247707, "img/sec/core": 189.46316146913048, "core_hours_Tesla V100-SXM2-32GB": 124.27506509980834, "core_hours": 124.27506509980834}
{"step": 82900, "global_schedule": 0.1832534670829773, "l2_grads": 2.0331239700317383, "l2_params": 260.75262451171875, "l2_updates": 0.19739274680614471, "training_loss": 2.8138175010681152, "uptime": 30249.620973376965, "examples_seen": 84889600.0, "progress": 0.7436511567408524, "epoch": 66.92889608981713, "img/sec/core": 189.31639384809182, "core_hours_Tesla V100-SXM2-32GB": 124.35018919198619, "core_hours": 124.35018919198619}
{"step": 82950, "global_schedule": 0.1826549470424652, "l2_grads": 2.1701886653900146, "l2_params": 260.68280029296875, "l2_updates": 0.19547230005264282, "training_loss": 4.16622257232666, "uptime": 30266.512788200984, "examples_seen": 84940800.0, "progress": 0.7440996797545683, "epoch": 66.96926333715719, "img/sec/core": 189.44086430842245, "core_hours_Tesla V100-SXM2-32GB": 124.42526392453738, "core_hours": 124.42526392453738}
{"step": 83001, "global_schedule": 0.18205717206001282, "l2_grads": 2.15049147605896, "l2_params": 260.6171569824219, "l2_updates": 0.19917269051074982, "training_loss": 1.8653597831726074, "uptime": 30283.415356654965, "examples_seen": 84992000.0, "progress": 0.744548202768284, "epoch": 67.00963058449724, "img/sec/core": 189.32033961065258, "core_hours_Tesla V100-SXM2-32GB": 124.50038645099951, "core_hours": 124.50038645099951}
{"step": 83050, "global_schedule": 0.18146026134490967, "l2_grads": 2.0772647857666016, "l2_params": 260.5479431152344, "l2_updates": 0.194996640086174, "training_loss": 3.4935483932495117, "uptime": 30300.89546267799, "examples_seen": 85043200.0, "progress": 0.7449967257819998, "epoch": 67.0499978318373, "img/sec/core": 189.3847098367453, "core_hours_Tesla V100-SXM2-32GB": 124.57548344396417, "core_hours": 124.57548344396417}
{"step": 83100, "global_schedule": 0.18086403608322144, "l2_grads": 2.2823402881622314, "l2_params": 260.47369384765625, "l2_updates": 0.19716760516166687, "training_loss": 2.0228331089019775, "uptime": 30317.78643380996, "examples_seen": 85094400.0, "progress": 0.7454452487957157, "epoch": 67.09036507917736, "img/sec/core": 189.4503267454461, "core_hours_Tesla V100-SXM2-32GB": 124.65055442677293, "core_hours": 124.65055442677293}
{"step": 83150, "global_schedule": 0.18026864528656006, "l2_grads": 2.1454925537109375, "l2_params": 260.4111022949219, "l2_updates": 0.19417345523834229, "training_loss": 2.601496934890747, "uptime": 30334.639251175977, "examples_seen": 85145600.0, "progress": 0.7458937718094315, "epoch": 67.13073232651742, "img/sec/core": 189.8792309025337, "core_hours_Tesla V100-SXM2-32GB": 124.72545583728856, "core_hours": 124.72545583728856}
{"step": 83200, "global_schedule": 0.1796739399433136, "l2_grads": 2.069598436355591, "l2_params": 260.3471374511719, "l2_updates": 0.19448226690292358, "training_loss": 3.8301777839660645, "uptime": 30351.53167084197, "examples_seen": 85196800.0, "progress": 0.7463422948231474, "epoch": 67.17109957385748, "img/sec/core": 189.43408127859624, "core_hours_Tesla V100-SXM2-32GB": 124.8005332580263, "core_hours": 124.8005332580263}
{"step": 83250, "global_schedule": 0.17908009886741638, "l2_grads": 2.1101725101470947, "l2_params": 260.2800598144531, "l2_updates": 0.19360318779945374, "training_loss": 3.5419504642486572, "uptime": 30368.416835485958, "examples_seen": 85248000.0, "progress": 0.7467908178368632, "epoch": 67.21146682119753, "img/sec/core": 189.51547512090983, "core_hours_Tesla V100-SXM2-32GB": 124.87557843422181, "core_hours": 124.87557843422181}
{"step": 83300, "global_schedule": 0.17848694324493408, "l2_grads": 2.0513646602630615, "l2_params": 260.21087646484375, "l2_updates": 0.19446568191051483, "training_loss": 2.2248921394348145, "uptime": 30385.289017489995, "examples_seen": 85299200.0, "progress": 0.7472393408505791, "epoch": 67.25183406853759, "img/sec/core": 189.66130161672496, "core_hours_Tesla V100-SXM2-32GB": 124.95056590979532, "core_hours": 124.95056590979532}
{"step": 83350, "global_schedule": 0.17789462208747864, "l2_grads": 2.2473561763763428, "l2_params": 260.1408386230469, "l2_updates": 0.19119291007518768, "training_loss": 1.7953792810440063, "uptime": 30402.162096897955, "examples_seen": 85350400.0, "progress": 0.7476878638642949, "epoch": 67.29220131587765, "img/sec/core": 189.65121437704744, "core_hours_Tesla V100-SXM2-32GB": 125.02555737383068, "core_hours": 125.02555737383068}
{"step": 83400, "global_schedule": 0.1773030161857605, "l2_grads": 2.0839059352874756, "l2_params": 260.0718078613281, "l2_updates": 0.19434398412704468, "training_loss": 1.8553874492645264, "uptime": 30419.05368488998, "examples_seen": 85401600.0, "progress": 0.7481363868780108, "epoch": 67.3325685632177, "img/sec/core": 189.44340825214147, "core_hours_Tesla V100-SXM2-32GB": 125.10063109823969, "core_hours": 125.10063109823969}
{"step": 83450, "global_schedule": 0.1767122447490692, "l2_grads": 2.1638917922973633, "l2_params": 260.0001220703125, "l2_updates": 0.1941087543964386, "training_loss": 1.82326078414917, "uptime": 30435.927962420974, "examples_seen": 85452800.0, "progress": 0.7485849098917265, "epoch": 67.37293581055776, "img/sec/core": 189.63774858640488, "core_hours_Tesla V100-SXM2-32GB": 125.17562788726632, "core_hours": 125.17562788726632}
{"step": 83500, "global_schedule": 0.17612215876579285, "l2_grads": 2.0946617126464844, "l2_params": 259.9339294433594, "l2_updates": 0.19472160935401917, "training_loss": 2.3595128059387207, "uptime": 30452.78422785597, "examples_seen": 85504000.0, "progress": 0.7490334329054423, "epoch": 67.41330305789783, "img/sec/core": 189.84038975540096, "core_hours_Tesla V100-SXM2-32GB": 125.25054462253297, "core_hours": 125.25054462253297}
{"step": 83550, "global_schedule": 0.1755329668521881, "l2_grads": 2.2461133003234863, "l2_params": 259.8665466308594, "l2_updates": 0.19067180156707764, "training_loss": 4.011175155639648, "uptime": 30469.662981131987, "examples_seen": 85555200.0, "progress": 0.7494819559191582, "epoch": 67.45367030523789, "img/sec/core": 189.58746227700917, "core_hours_Tesla V100-SXM2-32GB": 125.32556130375971, "core_hours": 125.32556130375971}
{"step": 83601, "global_schedule": 0.1749444305896759, "l2_grads": 2.224635124206543, "l2_params": 259.80145263671875, "l2_updates": 0.19209983944892883, "training_loss": 1.7905899286270142, "uptime": 30486.548277102003, "examples_seen": 85606400.0, "progress": 0.749930478932874, "epoch": 67.49403755257795, "img/sec/core": 189.5140011571226, "core_hours_Tesla V100-SXM2-32GB": 125.40060706362645, "core_hours": 125.40060706362645}
{"step": 83650, "global_schedule": 0.17435678839683533, "l2_grads": 2.1630334854125977, "l2_params": 259.7352294921875, "l2_updates": 0.1919548064470291, "training_loss": 1.9100258350372314, "uptime": 30503.414968306955, "examples_seen": 85657600.0, "progress": 0.7503790019465899, "epoch": 67.53440479991801, "img/sec/core": 189.72304414160834, "core_hours_Tesla V100-SXM2-32GB": 125.47557013564847, "core_hours": 125.47557013564847}
{"step": 83700, "global_schedule": 0.17376980185508728, "l2_grads": 2.141014575958252, "l2_params": 259.66961669921875, "l2_updates": 0.19177456200122833, "training_loss": 1.786928415298462, "uptime": 30520.289399474976, "examples_seen": 85708800.0, "progress": 0.7508275249603057, "epoch": 67.57477204725807, "img/sec/core": 189.63602198718942, "core_hours_Tesla V100-SXM2-32GB": 125.55056760750634, "core_hours": 125.55056760750634}
{"step": 83750, "global_schedule": 0.17318370938301086, "l2_grads": 2.0628304481506348, "l2_params": 259.6034240722656, "l2_updates": 0.18704411387443542, "training_loss": 3.632692337036133, "uptime": 30537.14973833895, "examples_seen": 85760000.0, "progress": 0.7512760479740216, "epoch": 67.61513929459812, "img/sec/core": 189.7945246425246, "core_hours_Tesla V100-SXM2-32GB": 125.62550244690178, "core_hours": 125.62550244690178}
{"step": 83800, "global_schedule": 0.17259830236434937, "l2_grads": 2.0707528591156006, "l2_params": 259.53399658203125, "l2_updates": 0.18879148364067078, "training_loss": 3.214016914367676, "uptime": 30554.016738200968, "examples_seen": 85811200.0, "progress": 0.7517245709877374, "epoch": 67.65550654193818, "img/sec/core": 189.71957231149906, "core_hours_Tesla V100-SXM2-32GB": 125.70046689073297, "core_hours": 125.70046689073297}
{"step": 83850, "global_schedule": 0.1720137894153595, "l2_grads": 2.115450620651245, "l2_params": 259.4643249511719, "l2_updates": 0.1900438368320465, "training_loss": 2.2445950508117676, "uptime": 30570.900409794005, "examples_seen": 85862400.0, "progress": 0.7521730940014533, "epoch": 67.69587378927824, "img/sec/core": 189.53223428721694, "core_hours_Tesla V100-SXM2-32GB": 125.77550543114647, "core_hours": 125.77550543114647}
{"step": 83900, "global_schedule": 0.17142996191978455, "l2_grads": 2.1569833755493164, "l2_params": 259.3973083496094, "l2_updates": 0.18699127435684204, "training_loss": 1.9240721464157104, "uptime": 30587.763428037986, "examples_seen": 85913600.0, "progress": 0.752621617015169, "epoch": 67.7362410366183, "img/sec/core": 189.76436802125744, "core_hours_Tesla V100-SXM2-32GB": 125.8504521788975, "core_hours": 125.8504521788975}
{"step": 83950, "global_schedule": 0.17084699869155884, "l2_grads": 2.1379597187042236, "l2_params": 259.3348388671875, "l2_updates": 0.185929074883461, "training_loss": 3.7458248138427734, "uptime": 30604.642112586997, "examples_seen": 85964800.0, "progress": 0.7530701400288848, "epoch": 67.77660828395835, "img/sec/core": 189.58823424350473, "core_hours_Tesla V100-SXM2-32GB": 125.92546855467087, "core_hours": 125.92546855467087}
{"step": 84000, "global_schedule": 0.17026475071907043, "l2_grads": 2.2196309566497803, "l2_params": 259.2668762207031, "l2_updates": 0.18338926136493683, "training_loss": 4.0781755447387695, "uptime": 30621.513595215976, "examples_seen": 86016000.0, "progress": 0.7535186630426007, "epoch": 67.81697553129841, "img/sec/core": 189.66916366339024, "core_hours_Tesla V100-SXM2-32GB": 126.00045292191079, "core_hours": 126.00045292191079}
{"step": 84050, "global_schedule": 0.16968336701393127, "l2_grads": 2.248105764389038, "l2_params": 259.1963195800781, "l2_updates": 0.18281406164169312, "training_loss": 1.7862613201141357, "uptime": 30638.88198099297, "examples_seen": 86067200.0, "progress": 0.7539671860563165, "epoch": 67.85734277863847, "img/sec/core": 189.96391215987956, "core_hours_Tesla V100-SXM2-32GB": 126.07532094321292, "core_hours": 126.07532094321292}
{"step": 84100, "global_schedule": 0.16910269856452942, "l2_grads": 2.200861930847168, "l2_params": 259.12689208984375, "l2_updates": 0.18495328724384308, "training_loss": 1.841001272201538, "uptime": 30655.751462770975, "examples_seen": 86118400.0, "progress": 0.7544157090700324, "epoch": 67.89771002597853, "img/sec/core": 189.69165989273256, "core_hours_Tesla V100-SXM2-32GB": 126.15029641778183, "core_hours": 126.15029641778183}
{"step": 84150, "global_schedule": 0.1685229241847992, "l2_grads": 2.19439697265625, "l2_params": 259.0619812011719, "l2_updates": 0.1837422400712967, "training_loss": 2.0886311531066895, "uptime": 30672.619614983967, "examples_seen": 86169600.0, "progress": 0.7548642320837482, "epoch": 67.93807727331858, "img/sec/core": 189.70661158341701, "core_hours_Tesla V100-SXM2-32GB": 126.2252659831729, "core_hours": 126.2252659831729}
{"step": 84200, "global_schedule": 0.1679438352584839, "l2_grads": 2.0326132774353027, "l2_params": 258.9942626953125, "l2_updates": 0.18135400116443634, "training_loss": 2.6520466804504395, "uptime": 30689.488454787002, "examples_seen": 86220800.0, "progress": 0.7553127550974641, "epoch": 67.97844452065866, "img/sec/core": 189.69887896049576, "core_hours_Tesla V100-SXM2-32GB": 126.30023860451973, "core_hours": 126.30023860451973}
{"step": 84250, "global_schedule": 0.1673656404018402, "l2_grads": 2.2043068408966064, "l2_params": 258.93157958984375, "l2_updates": 0.18211184442043304, "training_loss": 3.950939655303955, "uptime": 30706.358413323993, "examples_seen": 86272000.0, "progress": 0.7557612781111799, "epoch": 68.01881176799871, "img/sec/core": 189.68629904948597, "core_hours_Tesla V100-SXM2-32GB": 126.37521619801745, "core_hours": 126.37521619801745}
{"step": 84301, "global_schedule": 0.16678813099861145, "l2_grads": 2.070305824279785, "l2_params": 258.8641052246094, "l2_updates": 0.18193234503269196, "training_loss": 1.879703402519226, "uptime": 30723.21084769396, "examples_seen": 86323200.0, "progress": 0.7562098011248957, "epoch": 68.05917901533877, "img/sec/core": 189.88354618384008, "core_hours_Tesla V100-SXM2-32GB": 126.45011590632842, "core_hours": 126.45011590632842}
{"step": 84350, "global_schedule": 0.1662115454673767, "l2_grads": 2.100846529006958, "l2_params": 258.8018798828125, "l2_updates": 0.1809198409318924, "training_loss": 2.1428475379943848, "uptime": 30740.075189035968, "examples_seen": 86374400.0, "progress": 0.7566583241386116, "epoch": 68.09954626267883, "img/sec/core": 189.74947998883476, "core_hours_Tesla V100-SXM2-32GB": 126.52506853451513, "core_hours": 126.52506853451513}
{"step": 84400, "global_schedule": 0.16563564538955688, "l2_grads": 2.163740873336792, "l2_params": 258.7392578125, "l2_updates": 0.18468093872070312, "training_loss": 1.7408463954925537, "uptime": 30756.93078418699, "examples_seen": 86425600.0, "progress": 0.7571068471523273, "epoch": 68.13991351001889, "img/sec/core": 189.84793899764648, "core_hours_Tesla V100-SXM2-32GB": 126.59998229074189, "core_hours": 126.59998229074189}
{"step": 84450, "global_schedule": 0.1650606393814087, "l2_grads": 2.1511566638946533, "l2_params": 258.671875, "l2_updates": 0.17840710282325745, "training_loss": 3.7769668102264404, "uptime": 30773.774252127972, "examples_seen": 86476800.0, "progress": 0.7575553701660432, "epoch": 68.18028075735894, "img/sec/core": 189.98462853446603, "core_hours_Tesla V100-SXM2-32GB": 126.67484214825737, "core_hours": 126.67484214825737}
{"step": 84500, "global_schedule": 0.1644863486289978, "l2_grads": 2.1245460510253906, "l2_params": 258.60589599609375, "l2_updates": 0.18131469190120697, "training_loss": 1.7863037586212158, "uptime": 30790.639975562983, "examples_seen": 86528000.0, "progress": 0.758003893179759, "epoch": 68.220648004699, "img/sec/core": 189.73393061559156, "core_hours_Tesla V100-SXM2-32GB": 126.74980091907963, "core_hours": 126.74980091907963}
{"step": 84550, "global_schedule": 0.16391295194625854, "l2_grads": 2.1962592601776123, "l2_params": 258.5356750488281, "l2_updates": 0.17904959619045258, "training_loss": 1.741672158241272, "uptime": 30807.499779045, "examples_seen": 86579200.0, "progress": 0.7584524161934749, "epoch": 68.26101525203906, "img/sec/core": 189.80055155525275, "core_hours_Tesla V100-SXM2-32GB": 126.82473337899971, "core_hours": 126.82473337899971}
{"step": 84600, "global_schedule": 0.1633402705192566, "l2_grads": 2.189966917037964, "l2_params": 258.4726257324219, "l2_updates": 0.17678093910217285, "training_loss": 2.4878077507019043, "uptime": 30824.379758901952, "examples_seen": 86630400.0, "progress": 0.7589009392071907, "epoch": 68.30138249937912, "img/sec/core": 189.57368593553016, "core_hours_Tesla V100-SXM2-32GB": 126.89975551169728, "core_hours": 126.89975551169728}
{"step": 84650, "global_schedule": 0.16276848316192627, "l2_grads": 2.4063191413879395, "l2_params": 258.41131591796875, "l2_updates": 0.17438548803329468, "training_loss": 4.120826721191406, "uptime": 30841.242538277, "examples_seen": 86681600.0, "progress": 0.7593494622209066, "epoch": 68.34174974671917, "img/sec/core": 189.76705611975353, "core_hours_Tesla V100-SXM2-32GB": 126.97470119780861, "core_hours": 126.97470119780861}
{"step": 84700, "global_schedule": 0.16219741106033325, "l2_grads": 2.200625419616699, "l2_params": 258.34649658203125, "l2_updates": 0.17429423332214355, "training_loss": 3.6855649948120117, "uptime": 30858.09955187398, "examples_seen": 86732800.0, "progress": 0.7597979852346224, "epoch": 68.38211699405923, "img/sec/core": 189.83196410149284, "core_hours_Tesla V100-SXM2-32GB": 127.04962125823963, "core_hours": 127.04962125823963}
{"step": 84750, "global_schedule": 0.16162726283073425, "l2_grads": 2.1932103633880615, "l2_params": 258.285888671875, "l2_updates": 0.17569832503795624, "training_loss": 2.564390182495117, "uptime": 30874.972412107978, "examples_seen": 86784000.0, "progress": 0.7602465082483382, "epoch": 68.42248424139929, "img/sec/core": 189.6536778958299, "core_hours_Tesla V100-SXM2-32GB": 127.1246117481685, "core_hours": 127.1246117481685}
{"step": 84800, "global_schedule": 0.16105780005455017, "l2_grads": 2.364532947540283, "l2_params": 258.21875, "l2_updates": 0.173425555229187, "training_loss": 3.9240365028381348, "uptime": 30891.837747717975, "examples_seen": 86835200.0, "progress": 0.7606950312620541, "epoch": 68.46285148873935, "img/sec/core": 189.73829362181473, "core_hours_Tesla V100-SXM2-32GB": 127.19956879532404, "core_hours": 127.19956879532404}
{"step": 84850, "global_schedule": 0.1604892611503601, "l2_grads": 2.1623897552490234, "l2_params": 258.159423828125, "l2_updates": 0.17310819029808044, "training_loss": 2.3827035427093506, "uptime": 30908.71864282695, "examples_seen": 86886400.0, "progress": 0.7611435542757699, "epoch": 68.5032187360794, "img/sec/core": 189.56340758843078, "core_hours_Tesla V100-SXM2-32GB": 127.27459499580839, "core_hours": 127.27459499580839}
{"step": 84900, "global_schedule": 0.15992143750190735, "l2_grads": 2.32439923286438, "l2_params": 258.09173583984375, "l2_updates": 0.17266063392162323, "training_loss": 4.228658676147461, "uptime": 30925.58102230297, "examples_seen": 86937600.0, "progress": 0.7615920772894857, "epoch": 68.54358598341946, "img/sec/core": 189.77155653213785, "core_hours_Tesla V100-SXM2-32GB": 127.34953890459069, "core_hours": 127.34953890459069}
{"step": 84950, "global_schedule": 0.1593545377254486, "l2_grads": 2.11696720123291, "l2_params": 258.0299987792969, "l2_updates": 0.17427249252796173, "training_loss": 2.262699842453003, "uptime": 30942.44618326897, "examples_seen": 86988800.0, "progress": 0.7620406003032015, "epoch": 68.58395323075953, "img/sec/core": 189.7402584209532, "core_hours_Tesla V100-SXM2-32GB": 127.42449517555069, "core_hours": 127.42449517555069}
{"step": 85000, "global_schedule": 0.15878832340240479, "l2_grads": 2.068984270095825, "l2_params": 257.96240234375, "l2_updates": 0.17208395898342133, "training_loss": 2.3589730262756348, "uptime": 30959.307189844956, "examples_seen": 87040000.0, "progress": 0.7624891233169174, "epoch": 68.62432047809959, "img/sec/core": 189.787008597552, "core_hours_Tesla V100-SXM2-32GB": 127.49943298255508, "core_hours": 127.49943298255508, "minival/prec@1": 0.7631907586637527, "minival/loss": 0.9534277271338638, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.894516050000675, "real/prec@1": 0.8017379422251638, "real/loss": 1.7585398709053472, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.203800817020237, "train/prec@1": 0.8058385044686415, "train/loss": 0.7557080616526873, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.599631066957954, "v2/prec@1": 0.6023, "v2/loss": 1.7262072143554688, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.373574081051629, "val/prec@1": 0.73076, "val/loss": 1.087759864501953, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.260280234972015}
{"step": 85050, "global_schedule": 0.15822306275367737, "l2_grads": 2.2826528549194336, "l2_params": 257.8963623046875, "l2_updates": 0.17165477573871613, "training_loss": 1.870082139968872, "uptime": 31013.284741104, "examples_seen": 87091200.0, "progress": 0.7629376463306332, "epoch": 68.66468772543965, "img/sec/core": 189.33526595679913, "core_hours_Tesla V100-SXM2-32GB": 127.57454958669298, "core_hours": 127.57454958669298}
{"step": 85100, "global_schedule": 0.15765848755836487, "l2_grads": 2.3231849670410156, "l2_params": 257.8306884765625, "l2_updates": 0.1721975952386856, "training_loss": 4.102266311645508, "uptime": 31030.157734101987, "examples_seen": 87142400.0, "progress": 0.7633861693443491, "epoch": 68.7050549727797, "img/sec/core": 189.6521856188395, "core_hours_Tesla V100-SXM2-32GB": 127.64954066668405, "core_hours": 127.64954066668405}
{"step": 85150, "global_schedule": 0.1570947766304016, "l2_grads": 2.215796709060669, "l2_params": 257.7697448730469, "l2_updates": 0.1697525531053543, "training_loss": 3.970076084136963, "uptime": 31047.043210694974, "examples_seen": 87193600.0, "progress": 0.7638346923580649, "epoch": 68.74542222011976, "img/sec/core": 189.5119739367715, "core_hours_Tesla V100-SXM2-32GB": 127.72458722931954, "core_hours": 127.72458722931954}
{"step": 85200, "global_schedule": 0.15653195977210999, "l2_grads": 2.3239715099334717, "l2_params": 257.7014465332031, "l2_updates": 0.16902856528759003, "training_loss": 4.123147964477539, "uptime": 31063.907093568996, "examples_seen": 87244800.0, "progress": 0.7642832153717807, "epoch": 68.78578946745982, "img/sec/core": 189.75463859093807, "core_hours_Tesla V100-SXM2-32GB": 127.79953781987075, "core_hours": 127.79953781987075}
{"step": 85250, "global_schedule": 0.15596985816955566, "l2_grads": 2.210488796234131, "l2_params": 257.6362609863281, "l2_updates": 0.17275241017341614, "training_loss": 1.7328999042510986, "uptime": 31080.78376639099, "examples_seen": 87296000.0, "progress": 0.7647317383854966, "epoch": 68.82615671479988, "img/sec/core": 189.61083347127376, "core_hours_Tesla V100-SXM2-32GB": 127.87454525463517, "core_hours": 127.87454525463517}
{"step": 85300, "global_schedule": 0.15540868043899536, "l2_grads": 2.0689167976379395, "l2_params": 257.57452392578125, "l2_updates": 0.1686241179704666, "training_loss": 2.9312491416931152, "uptime": 31097.68113875395, "examples_seen": 87347200.0, "progress": 0.7651802613992124, "epoch": 68.86652396213994, "img/sec/core": 189.37855728470947, "core_hours_Tesla V100-SXM2-32GB": 127.94964468735944, "core_hours": 127.94964468735944}
{"step": 85350, "global_schedule": 0.15484824776649475, "l2_grads": 2.2013437747955322, "l2_params": 257.51263427734375, "l2_updates": 0.16575324535369873, "training_loss": 2.1255719661712646, "uptime": 31114.538936184952, "examples_seen": 87398400.0, "progress": 0.7656287844129283, "epoch": 68.90689120948, "img/sec/core": 189.82313751824685, "core_hours_Tesla V100-SXM2-32GB": 128.02456823149723, "core_hours": 128.02456823149723}
{"step": 85401, "global_schedule": 0.15428870916366577, "l2_grads": 2.1404519081115723, "l2_params": 257.4508056640625, "l2_updates": 0.16776245832443237, "training_loss": 1.890913963317871, "uptime": 31131.412232044968, "examples_seen": 87449600.0, "progress": 0.766077307426644, "epoch": 68.94725845682005, "img/sec/core": 189.64878151535038, "core_hours_Tesla V100-SXM2-32GB": 128.09956065754173, "core_hours": 128.09956065754173}
{"step": 85450, "global_schedule": 0.15372994542121887, "l2_grads": 2.082313299179077, "l2_params": 257.38568115234375, "l2_updates": 0.1676090508699417, "training_loss": 2.7841851711273193, "uptime": 31148.275832199957, "examples_seen": 87500800.0, "progress": 0.7665258304403599, "epoch": 68.98762570416011, "img/sec/core": 189.75781983618856, "core_hours_Tesla V100-SXM2-32GB": 128.17450999156392, "core_hours": 128.17450999156392}
{"step": 85500, "global_schedule": 0.1531720757484436, "l2_grads": 2.194864511489868, "l2_params": 257.3187255859375, "l2_updates": 0.16714490950107574, "training_loss": 2.0613274574279785, "uptime": 31165.12695005798, "examples_seen": 87552000.0, "progress": 0.7669743534540757, "epoch": 69.02799295150017, "img/sec/core": 189.89838104280193, "core_hours_Tesla V100-SXM2-32GB": 128.24940384871067, "core_hours": 128.24940384871067}
{"step": 85550, "global_schedule": 0.15261495113372803, "l2_grads": 2.253465175628662, "l2_params": 257.2550964355469, "l2_updates": 0.16537968814373016, "training_loss": 3.794285535812378, "uptime": 31181.97626052797, "examples_seen": 87603200.0, "progress": 0.7674228764677916, "epoch": 69.06836019884022, "img/sec/core": 189.9187510195026, "core_hours_Tesla V100-SXM2-32GB": 128.32428967302175, "core_hours": 128.32428967302175}
{"step": 85601, "global_schedule": 0.15205875039100647, "l2_grads": 2.1726107597351074, "l2_params": 257.18695068359375, "l2_updates": 0.16625414788722992, "training_loss": 2.281313419342041, "uptime": 31198.844096685003, "examples_seen": 87654400.0, "progress": 0.7678713994815074, "epoch": 69.10872744618028, "img/sec/core": 189.71016615343763, "core_hours_Tesla V100-SXM2-32GB": 128.39925783371967, "core_hours": 128.39925783371967}
{"step": 85650, "global_schedule": 0.1515032947063446, "l2_grads": 2.333651065826416, "l2_params": 257.12451171875, "l2_updates": 0.1644572764635086, "training_loss": 1.9218968152999878, "uptime": 31215.691482528986, "examples_seen": 87705600.0, "progress": 0.7683199224952232, "epoch": 69.14909469352035, "img/sec/core": 189.94044711944952, "core_hours_Tesla V100-SXM2-32GB": 128.47413510413736, "core_hours": 128.47413510413736}
{"step": 85700, "global_schedule": 0.15094876289367676, "l2_grads": 2.2477612495422363, "l2_params": 257.0635070800781, "l2_updates": 0.16337695717811584, "training_loss": 2.129377603530884, "uptime": 31232.590261003992, "examples_seen": 87756800.0, "progress": 0.7687684455089391, "epoch": 69.18946194086041, "img/sec/core": 189.36279949067992, "core_hours_Tesla V100-SXM2-32GB": 128.5492407862485, "core_hours": 128.5492407862485}
{"step": 85751, "global_schedule": 0.1503949761390686, "l2_grads": 2.259390115737915, "l2_params": 257.0039978027344, "l2_updates": 0.16462361812591553, "training_loss": 1.6518170833587646, "uptime": 31249.453908200958, "examples_seen": 87808000.0, "progress": 0.7692169685226549, "epoch": 69.22982918820047, "img/sec/core": 189.75729049738243, "core_hours_Tesla V100-SXM2-32GB": 128.62419032934613, "core_hours": 128.62419032934613}
{"step": 85800, "global_schedule": 0.14984211325645447, "l2_grads": 2.372978687286377, "l2_params": 256.9452209472656, "l2_updates": 0.1654149293899536, "training_loss": 1.803563117980957, "uptime": 31266.32078834396, "examples_seen": 87859200.0, "progress": 0.7696654915363708, "epoch": 69.27019643554053, "img/sec/core": 189.72091891738873, "core_hours_Tesla V100-SXM2-32GB": 128.6991542410928, "core_hours": 128.6991542410928}
{"step": 85850, "global_schedule": 0.1492900252342224, "l2_grads": 2.2139577865600586, "l2_params": 256.88555908203125, "l2_updates": 0.16232462227344513, "training_loss": 1.5545132160186768, "uptime": 31283.168149951962, "examples_seen": 87910400.0, "progress": 0.7701140145500865, "epoch": 69.31056368288058, "img/sec/core": 189.94072036064662, "core_hours_Tesla V100-SXM2-32GB": 128.77403140379505, "core_hours": 128.77403140379505}
{"step": 85900, "global_schedule": 0.148738831281662, "l2_grads": 2.421548366546631, "l2_params": 256.8202209472656, "l2_updates": 0.1592375785112381, "training_loss": 4.077338218688965, "uptime": 31300.03105503798, "examples_seen": 87961600.0, "progress": 0.7705625375638024, "epoch": 69.35093093022064, "img/sec/core": 189.7656414287284, "core_hours_Tesla V100-SXM2-32GB": 128.8489776486218, "core_hours": 128.8489776486218}
{"step": 85950, "global_schedule": 0.14818841218948364, "l2_grads": 2.208660125732422, "l2_params": 256.7570495605469, "l2_updates": 0.16138337552547455, "training_loss": 2.636693000793457, "uptime": 31316.904690267984, "examples_seen": 88012800.0, "progress": 0.7710110605775182, "epoch": 69.3912981775607, "img/sec/core": 189.64496721547707, "core_hours_Tesla V100-SXM2-32GB": 128.92397158297734, "core_hours": 128.92397158297734}
{"step": 86000, "global_schedule": 0.14763891696929932, "l2_grads": 2.1911439895629883, "l2_params": 256.6936340332031, "l2_updates": 0.1595136672258377, "training_loss": 3.9535346031188965, "uptime": 31333.75842486997, "examples_seen": 88064000.0, "progress": 0.7714595835912341, "epoch": 69.43166542490076, "img/sec/core": 189.86889704686763, "core_hours_Tesla V100-SXM2-32GB": 128.9988770700973, "core_hours": 128.9988770700973}
{"step": 86050, "global_schedule": 0.14709019660949707, "l2_grads": 2.161992073059082, "l2_params": 256.6324768066406, "l2_updates": 0.15854758024215698, "training_loss": 3.6345858573913574, "uptime": 31351.136460579, "examples_seen": 88115200.0, "progress": 0.7719081066049499, "epoch": 69.47203267224081, "img/sec/core": 189.5876777124603, "core_hours_Tesla V100-SXM2-32GB": 129.07389366607984, "core_hours": 129.07389366607984}
{"step": 86100, "global_schedule": 0.14654237031936646, "l2_grads": 2.2856647968292236, "l2_params": 256.5730895996094, "l2_updates": 0.16029208898544312, "training_loss": 2.0132508277893066, "uptime": 31368.026620116958, "examples_seen": 88166400.0, "progress": 0.7723566296186657, "epoch": 69.51239991958087, "img/sec/core": 189.4594300787148, "core_hours_Tesla V100-SXM2-32GB": 129.14896104180409, "core_hours": 129.14896104180409}
{"step": 86150, "global_schedule": 0.1459953486919403, "l2_grads": 2.2101399898529053, "l2_params": 256.5104675292969, "l2_updates": 0.15948674082756042, "training_loss": 1.8102335929870605, "uptime": 31384.903519747953, "examples_seen": 88217600.0, "progress": 0.7728051526323816, "epoch": 69.55276716692093, "img/sec/core": 189.6082852873642, "core_hours_Tesla V100-SXM2-32GB": 129.22396948460852, "core_hours": 129.22396948460852}
{"step": 86200, "global_schedule": 0.1454492211341858, "l2_grads": 2.174105167388916, "l2_params": 256.4490661621094, "l2_updates": 0.15814606845378876, "training_loss": 2.7458605766296387, "uptime": 31401.79691782198, "examples_seen": 88268800.0, "progress": 0.7732536756460974, "epoch": 69.59313441426099, "img/sec/core": 189.42310990233057, "core_hours_Tesla V100-SXM2-32GB": 129.2990512538264, "core_hours": 129.2990512538264}
{"step": 86250, "global_schedule": 0.14490386843681335, "l2_grads": 2.308290481567383, "l2_params": 256.3916931152344, "l2_updates": 0.16046929359436035, "training_loss": 1.8740853071212769, "uptime": 31418.67897763598, "examples_seen": 88320000.0, "progress": 0.7737021986598133, "epoch": 69.63350166160104, "img/sec/core": 189.55032947733736, "core_hours_Tesla V100-SXM2-32GB": 129.3740826307775, "core_hours": 129.3740826307775}
{"step": 86300, "global_schedule": 0.14435946941375732, "l2_grads": 2.3037831783294678, "l2_params": 256.3298034667969, "l2_updates": 0.15802310407161713, "training_loss": 1.8513081073760986, "uptime": 31435.574163043988, "examples_seen": 88371200.0, "progress": 0.774150721673529, "epoch": 69.6738689089411, "img/sec/core": 189.40307091766476, "core_hours_Tesla V100-SXM2-32GB": 129.449172343702, "core_hours": 129.449172343702}
{"step": 86350, "global_schedule": 0.143815815448761, "l2_grads": 2.101059913635254, "l2_params": 256.2654113769531, "l2_updates": 0.1569383591413498, "training_loss": 2.2638931274414062, "uptime": 31452.459371004952, "examples_seen": 88422400.0, "progress": 0.774599244687245, "epoch": 69.71423615628117, "img/sec/core": 189.51498894167446, "core_hours_Tesla V100-SXM2-32GB": 129.5242177124174, "core_hours": 129.5242177124174}
{"step": 86400, "global_schedule": 0.14327311515808105, "l2_grads": 2.311901330947876, "l2_params": 256.2052001953125, "l2_updates": 0.15547117590904236, "training_loss": 4.116214752197266, "uptime": 31469.335488187964, "examples_seen": 88473600.0, "progress": 0.7750477677009607, "epoch": 69.75460340362123, "img/sec/core": 189.61707632732148, "core_hours_Tesla V100-SXM2-32GB": 129.59922267767521, "core_hours": 129.59922267767521}
{"step": 86450, "global_schedule": 0.1427311897277832, "l2_grads": 2.1049773693084717, "l2_params": 256.14691162109375, "l2_updates": 0.15410228073596954, "training_loss": 2.5987472534179688, "uptime": 31486.213528972003, "examples_seen": 88524800.0, "progress": 0.7754962907146765, "epoch": 69.79497065096129, "img/sec/core": 189.59546554871514, "core_hours_Tesla V100-SXM2-32GB": 129.67423619227097, "core_hours": 129.67423619227097}
{"step": 86500, "global_schedule": 0.14219018816947937, "l2_grads": 2.100674629211426, "l2_params": 256.0839538574219, "l2_updates": 0.15327075123786926, "training_loss": 2.657835006713867, "uptime": 31503.09621398797, "examples_seen": 88576000.0, "progress": 0.7759448137283924, "epoch": 69.83533789830135, "img/sec/core": 189.5433100228697, "core_hours_Tesla V100-SXM2-32GB": 129.7492703478975, "core_hours": 129.7492703478975}
{"step": 86550, "global_schedule": 0.14164996147155762, "l2_grads": 2.289902448654175, "l2_params": 256.0274353027344, "l2_updates": 0.15497280657291412, "training_loss": 1.7714622020721436, "uptime": 31519.983459662995, "examples_seen": 88627200.0, "progress": 0.7763933367421082, "epoch": 69.8757051456414, "img/sec/core": 189.49212095211936, "core_hours_Tesla V100-SXM2-32GB": 129.82432477311983, "core_hours": 129.82432477311983}
{"step": 86600, "global_schedule": 0.14111068844795227, "l2_grads": 2.433804988861084, "l2_params": 255.96817016601562, "l2_updates": 0.15277673304080963, "training_loss": 4.124147891998291, "uptime": 31536.87976946798, "examples_seen": 88678400.0, "progress": 0.7768418597558241, "epoch": 69.91607239298146, "img/sec/core": 189.39046673112347, "core_hours_Tesla V100-SXM2-32GB": 129.8994194833642, "core_hours": 129.8994194833642}
{"step": 86650, "global_schedule": 0.140572190284729, "l2_grads": 2.3030178546905518, "l2_params": 255.90614318847656, "l2_updates": 0.1536465883255005, "training_loss": 1.8289079666137695, "uptime": 31553.763434021967, "examples_seen": 88729600.0, "progress": 0.7772903827695399, "epoch": 69.95643964032152, "img/sec/core": 189.53231330604194, "core_hours_Tesla V100-SXM2-32GB": 129.97445799249303, "core_hours": 129.97445799249303}
{"step": 86700, "global_schedule": 0.14003464579582214, "l2_grads": 2.244706153869629, "l2_params": 255.84666442871094, "l2_updates": 0.15353679656982422, "training_loss": 3.6137399673461914, "uptime": 31570.647853197006, "examples_seen": 88780800.0, "progress": 0.7777389057832558, "epoch": 69.99680688766158, "img/sec/core": 189.52384247428586, "core_hours_Tesla V100-SXM2-32GB": 130.0494998554932, "core_hours": 130.0494998554932}
{"step": 86750, "global_schedule": 0.13949784636497498, "l2_grads": 2.2583346366882324, "l2_params": 255.78831481933594, "l2_updates": 0.15095119178295135, "training_loss": 3.800990343093872, "uptime": 31587.53464343195, "examples_seen": 88832000.0, "progress": 0.7781874287969716, "epoch": 70.03717413500164, "img/sec/core": 189.4972315921862, "core_hours_Tesla V100-SXM2-32GB": 130.12455225653738, "core_hours": 130.12455225653738}
{"step": 86800, "global_schedule": 0.1389620304107666, "l2_grads": 2.323329210281372, "l2_params": 255.72836303710938, "l2_updates": 0.15077023208141327, "training_loss": 4.130403518676758, "uptime": 31604.427045382967, "examples_seen": 88883200.0, "progress": 0.7786359518106875, "epoch": 70.07754138234169, "img/sec/core": 189.4342799371731, "core_hours_Tesla V100-SXM2-32GB": 130.19962959854192, "core_hours": 130.19962959854192}
{"step": 86850, "global_schedule": 0.13842695951461792, "l2_grads": 2.2182250022888184, "l2_params": 255.67132568359375, "l2_updates": 0.15180236101150513, "training_loss": 1.6981314420700073, "uptime": 31621.294270881976, "examples_seen": 88934400.0, "progress": 0.7790844748244032, "epoch": 70.11790862968175, "img/sec/core": 189.71703438648228, "core_hours_Tesla V100-SXM2-32GB": 130.27459504520417, "core_hours": 130.27459504520417}
{"step": 86900, "global_schedule": 0.13789287209510803, "l2_grads": 2.278846502304077, "l2_params": 255.6102294921875, "l2_updates": 0.15133242309093475, "training_loss": 3.8306875228881836, "uptime": 31638.181108106975, "examples_seen": 88985600.0, "progress": 0.779532997838119, "epoch": 70.15827587702181, "img/sec/core": 189.4967042888647, "core_hours_Tesla V100-SXM2-32GB": 130.34964765509307, "core_hours": 130.34964765509307}
{"step": 86950, "global_schedule": 0.13735955953598022, "l2_grads": 2.1737825870513916, "l2_params": 255.55043029785156, "l2_updates": 0.1508677899837494, "training_loss": 1.633394718170166, "uptime": 31655.060136216984, "examples_seen": 89036800.0, "progress": 0.7799815208518349, "epoch": 70.19864312436187, "img/sec/core": 189.58437530550694, "core_hours_Tesla V100-SXM2-32GB": 130.4246655578042, "core_hours": 130.4246655578042}
{"step": 87000, "global_schedule": 0.13682720065116882, "l2_grads": 2.250314712524414, "l2_params": 255.4916534423828, "l2_updates": 0.14943036437034607, "training_loss": 1.790130853652954, "uptime": 31671.95178092399, "examples_seen": 89088000.0, "progress": 0.7804300438655507, "epoch": 70.23901037170192, "img/sec/core": 189.44277218146928, "core_hours_Tesla V100-SXM2-32GB": 130.4997395342798, "core_hours": 130.4997395342798}
{"step": 87050, "global_schedule": 0.1362956166267395, "l2_grads": 2.3878908157348633, "l2_params": 255.4355926513672, "l2_updates": 0.14876002073287964, "training_loss": 2.1339035034179688, "uptime": 31689.34193071595, "examples_seen": 89139200.0, "progress": 0.7808785668792666, "epoch": 70.27937761904198, "img/sec/core": 189.6014469003159, "core_hours_Tesla V100-SXM2-32GB": 130.57475068242624, "core_hours": 130.57475068242624}
{"step": 87100, "global_schedule": 0.1357649862766266, "l2_grads": 2.266378402709961, "l2_params": 255.37098693847656, "l2_updates": 0.14760343730449677, "training_loss": 2.0421557426452637, "uptime": 31706.211258038995, "examples_seen": 89190400.0, "progress": 0.7813270898929824, "epoch": 70.31974486638205, "img/sec/core": 189.69339670280777, "core_hours_Tesla V100-SXM2-32GB": 130.6497254705287, "core_hours": 130.6497254705287}
{"step": 87150, "global_schedule": 0.13523516058921814, "l2_grads": 2.3228232860565186, "l2_params": 255.3169403076172, "l2_updates": 0.14843030273914337, "training_loss": 1.8151227235794067, "uptime": 31723.087532314996, "examples_seen": 89241600.0, "progress": 0.7817756129066983, "epoch": 70.36011211372211, "img/sec/core": 189.6153112746333, "core_hours_Tesla V100-SXM2-32GB": 130.72473113397757, "core_hours": 130.72473113397757}
{"step": 87200, "global_schedule": 0.1347062885761261, "l2_grads": 2.2983570098876953, "l2_params": 255.25648498535156, "l2_updates": 0.14809274673461914, "training_loss": 2.0601518154144287, "uptime": 31739.958354871953, "examples_seen": 89292800.0, "progress": 0.7822241359204141, "epoch": 70.40047936106217, "img/sec/core": 189.6765844816733, "core_hours_Tesla V100-SXM2-32GB": 130.79971256756406, "core_hours": 130.79971256756406}
{"step": 87250, "global_schedule": 0.13417822122573853, "l2_grads": 2.322716236114502, "l2_params": 255.20249938964844, "l2_updates": 0.14568071067333221, "training_loss": 1.8501307964324951, "uptime": 31756.824838511006, "examples_seen": 89344000.0, "progress": 0.78267265893413, "epoch": 70.44084660840223, "img/sec/core": 189.72537895158715, "core_hours_Tesla V100-SXM2-32GB": 130.87467471707095, "core_hours": 130.87467471707095}
{"step": 87300, "global_schedule": 0.13365107774734497, "l2_grads": 2.204148530960083, "l2_params": 255.1397705078125, "l2_updates": 0.14571256935596466, "training_loss": 2.753903388977051, "uptime": 31773.69984183897, "examples_seen": 89395200.0, "progress": 0.7831211819478457, "epoch": 70.48121385574228, "img/sec/core": 189.62959223226022, "core_hours_Tesla V100-SXM2-32GB": 130.9496747318619, "core_hours": 130.9496747318619}
{"step": 87350, "global_schedule": 0.13312476873397827, "l2_grads": 2.2128565311431885, "l2_params": 255.08148193359375, "l2_updates": 0.14547127485275269, "training_loss": 2.5432353019714355, "uptime": 31790.58696848998, "examples_seen": 89446400.0, "progress": 0.7835697049615615, "epoch": 70.52158110308234, "img/sec/core": 189.49345653237708, "core_hours_Tesla V100-SXM2-32GB": 131.0247286280886, "core_hours": 131.0247286280886}
{"step": 87400, "global_schedule": 0.1325993835926056, "l2_grads": 2.094423770904541, "l2_params": 255.0222930908203, "l2_updates": 0.1437540203332901, "training_loss": 1.9339752197265625, "uptime": 31807.44447943999, "examples_seen": 89497600.0, "progress": 0.7840182279752774, "epoch": 70.5619483504224, "img/sec/core": 189.82636342278727, "core_hours_Tesla V100-SXM2-32GB": 131.09965089897756, "core_hours": 131.09965089897756}
{"step": 87450, "global_schedule": 0.13207483291625977, "l2_grads": 2.2202858924865723, "l2_params": 254.9661102294922, "l2_updates": 0.14349932968616486, "training_loss": 3.1753249168395996, "uptime": 31824.32422190695, "examples_seen": 89548800.0, "progress": 0.7844667509889932, "epoch": 70.60231559776246, "img/sec/core": 189.5763520245292, "core_hours_Tesla V100-SXM2-32GB": 131.1746719766085, "core_hours": 131.1746719766085}
{"step": 87500, "global_schedule": 0.13155120611190796, "l2_grads": 2.3728549480438232, "l2_params": 254.91110229492188, "l2_updates": 0.14200296998023987, "training_loss": 2.270785331726074, "uptime": 31841.21909723198, "examples_seen": 89600000.0, "progress": 0.7849152740027091, "epoch": 70.64268284510251, "img/sec/core": 189.40654715925652, "core_hours_Tesla V100-SXM2-32GB": 131.2497603113864, "core_hours": 131.2497603113864, "minival/prec@1": 0.7670152981579769, "minival/loss": 0.917291853824631, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.9282446439610794, "real/prec@1": 0.80918931613895, "real/loss": 1.7155049891695535, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.189529928960837, "train/prec@1": 0.8138781563439098, "train/loss": 0.7122995831557637, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.598889716959093, "v2/prec@1": 0.6152, "v2/loss": 1.6800692016601562, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.375340700033121, "val/prec@1": 0.7375, "val/loss": 1.0529245263671876, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.251723370980471}
{"step": 87550, "global_schedule": 0.131028413772583, "l2_grads": 2.1842586994171143, "l2_params": 254.8575897216797, "l2_updates": 0.14369702339172363, "training_loss": 2.3859686851501465, "uptime": 31894.488324164005, "examples_seen": 89651200.0, "progress": 0.7853637970164249, "epoch": 70.68305009244257, "img/sec/core": 189.0866822532706, "core_hours_Tesla V100-SXM2-32GB": 131.32497566792415, "core_hours": 131.32497566792415}
{"step": 87600, "global_schedule": 0.13050657510757446, "l2_grads": 2.421647310256958, "l2_params": 254.7975616455078, "l2_updates": 0.14285559952259064, "training_loss": 1.842294692993164, "uptime": 31911.349766651983, "examples_seen": 89702400.0, "progress": 0.7858123200301408, "epoch": 70.72341733978263, "img/sec/core": 189.7821021114639, "core_hours_Tesla V100-SXM2-32GB": 131.39991541231518, "core_hours": 131.39991541231518}
{"step": 87650, "global_schedule": 0.12998563051223755, "l2_grads": 2.3397867679595947, "l2_params": 254.74215698242188, "l2_updates": 0.14064641296863556, "training_loss": 2.0298900604248047, "uptime": 31928.228639598994, "examples_seen": 89753600.0, "progress": 0.7862608430438566, "epoch": 70.76378458712269, "img/sec/core": 189.58611810433314, "core_hours_Tesla V100-SXM2-32GB": 131.474932625413, "core_hours": 131.474932625413}
{"step": 87700, "global_schedule": 0.12946546077728271, "l2_grads": 2.363576889038086, "l2_params": 254.68124389648438, "l2_updates": 0.1402086317539215, "training_loss": 3.9612157344818115, "uptime": 31945.09215212695, "examples_seen": 89804800.0, "progress": 0.7867093660575725, "epoch": 70.80415183446274, "img/sec/core": 189.75880586535135, "core_hours_Tesla V100-SXM2-32GB": 131.5498815699817, "core_hours": 131.5498815699817}
{"step": 87750, "global_schedule": 0.12894630432128906, "l2_grads": 2.4551305770874023, "l2_params": 254.62828063964844, "l2_updates": 0.14000679552555084, "training_loss": 1.786198616027832, "uptime": 31961.94009849796, "examples_seen": 89856000.0, "progress": 0.7871578890712883, "epoch": 70.8445190818028, "img/sec/core": 189.93412784754486, "core_hours_Tesla V100-SXM2-32GB": 131.62476133163062, "core_hours": 131.62476133163062}
{"step": 87800, "global_schedule": 0.1284279227256775, "l2_grads": 2.377316951751709, "l2_params": 254.5727081298828, "l2_updates": 0.13958171010017395, "training_loss": 1.9519058465957642, "uptime": 31978.815439825994, "examples_seen": 89907200.0, "progress": 0.787606412085004, "epoch": 70.88488632914287, "img/sec/core": 189.62579409779002, "core_hours_Tesla V100-SXM2-32GB": 131.6997628486441, "core_hours": 131.6997628486441}
{"step": 87850, "global_schedule": 0.1279105246067047, "l2_grads": 2.4179723262786865, "l2_params": 254.51121520996094, "l2_updates": 0.13808239996433258, "training_loss": 1.7925326824188232, "uptime": 31995.703174378956, "examples_seen": 89958400.0, "progress": 0.7880549350987199, "epoch": 70.92525357648293, "img/sec/core": 189.4866354018327, "core_hours_Tesla V100-SXM2-32GB": 131.77481944665726, "core_hours": 131.77481944665726}
{"step": 87900, "global_schedule": 0.1273939311504364, "l2_grads": 2.3394064903259277, "l2_params": 254.45310974121094, "l2_updates": 0.13944733142852783, "training_loss": 1.9214482307434082, "uptime": 32012.579109683982, "examples_seen": 90009600.0, "progress": 0.7885034581124357, "epoch": 70.96562082382299, "img/sec/core": 189.61911989831498, "core_hours_Tesla V100-SXM2-32GB": 131.8498236035685, "core_hours": 131.8498236035685}
{"step": 87950, "global_schedule": 0.12687832117080688, "l2_grads": 2.188302755355835, "l2_params": 254.39891052246094, "l2_updates": 0.1374085396528244, "training_loss": 3.0827879905700684, "uptime": 32029.455930000986, "examples_seen": 90060800.0, "progress": 0.7889519811261516, "epoch": 71.00598807116305, "img/sec/core": 189.6091763669433, "core_hours_Tesla V100-SXM2-32GB": 131.9248316938663, "core_hours": 131.9248316938663}
{"step": 88000, "global_schedule": 0.12636351585388184, "l2_grads": 2.418412923812866, "l2_params": 254.34983825683594, "l2_updates": 0.13788315653800964, "training_loss": 4.110525608062744, "uptime": 32046.308130572957, "examples_seen": 90112000.0, "progress": 0.7894005041398674, "epoch": 71.0463553185031, "img/sec/core": 189.88618052186186, "core_hours_Tesla V100-SXM2-32GB": 131.99973036307506, "core_hours": 131.99973036307506}
{"step": 88050, "global_schedule": 0.12584969401359558, "l2_grads": 2.2820723056793213, "l2_params": 254.29244995117188, "l2_updates": 0.13643422722816467, "training_loss": 1.7502671480178833, "uptime": 32064.039936416957, "examples_seen": 90163200.0, "progress": 0.7898490271535833, "epoch": 71.08672256584316, "img/sec/core": 189.64170726136766, "core_hours_Tesla V100-SXM2-32GB": 132.07472558658156, "core_hours": 132.07472558658156}
{"step": 88100, "global_schedule": 0.1253366768360138, "l2_grads": 2.1258418560028076, "l2_params": 254.23280334472656, "l2_updates": 0.13655324280261993, "training_loss": 2.4278926849365234, "uptime": 32080.907495388004, "examples_seen": 90214400.0, "progress": 0.7902975501672991, "epoch": 71.12708981318322, "img/sec/core": 189.71328367623866, "core_hours_Tesla V100-SXM2-32GB": 132.14969251534177, "core_hours": 132.14969251534177}
{"step": 88150, "global_schedule": 0.1248246431350708, "l2_grads": 2.2554099559783936, "l2_params": 254.17747497558594, "l2_updates": 0.13759343326091766, "training_loss": 1.9085900783538818, "uptime": 32097.79796713096, "examples_seen": 90265600.0, "progress": 0.7907460731810149, "epoch": 71.16745706052328, "img/sec/core": 189.45592809359434, "core_hours_Tesla V100-SXM2-32GB": 132.2247612786438, "core_hours": 132.2247612786438}
{"step": 88200, "global_schedule": 0.12431344389915466, "l2_grads": 2.3168370723724365, "l2_params": 254.12252807617188, "l2_updates": 0.13613103330135345, "training_loss": 3.8571650981903076, "uptime": 32114.656553105975, "examples_seen": 90316800.0, "progress": 0.7911945961947308, "epoch": 71.20782430786333, "img/sec/core": 189.81425872503368, "core_hours_Tesla V100-SXM2-32GB": 132.29968832742165, "core_hours": 132.29968832742165}
{"step": 88250, "global_schedule": 0.12380319833755493, "l2_grads": 2.195138454437256, "l2_params": 254.06346130371094, "l2_updates": 0.13660211861133575, "training_loss": 2.2260894775390625, "uptime": 32131.53370450996, "examples_seen": 90368000.0, "progress": 0.7916431192084465, "epoch": 71.24819155520339, "img/sec/core": 189.60545671496968, "core_hours_Tesla V100-SXM2-32GB": 132.37469788921712, "core_hours": 132.37469788921712}
{"step": 88300, "global_schedule": 0.12329378724098206, "l2_grads": 2.3648407459259033, "l2_params": 254.0098876953125, "l2_updates": 0.13401417434215546, "training_loss": 3.9657485485076904, "uptime": 32148.381395956967, "examples_seen": 90419200.0, "progress": 0.7920916422221624, "epoch": 71.28855880254345, "img/sec/core": 189.93700175867212, "core_hours_Tesla V100-SXM2-32GB": 132.4495765178705, "core_hours": 132.4495765178705}
{"step": 88350, "global_schedule": 0.12278535962104797, "l2_grads": 2.407586097717285, "l2_params": 253.95639038085938, "l2_updates": 0.1328546553850174, "training_loss": 1.6607381105422974, "uptime": 32165.254790305975, "examples_seen": 90470400.0, "progress": 0.7925401652358782, "epoch": 71.3289260498835, "img/sec/core": 189.64767454677283, "core_hours_Tesla V100-SXM2-32GB": 132.52456938164386, "core_hours": 132.52456938164386}
{"step": 88400, "global_schedule": 0.12227776646614075, "l2_grads": 2.3336021900177, "l2_params": 253.90342712402344, "l2_updates": 0.1328182965517044, "training_loss": 1.9527678489685059, "uptime": 32182.117384159006, "examples_seen": 90521600.0, "progress": 0.7929886882495941, "epoch": 71.36929329722356, "img/sec/core": 189.7691439342089, "core_hours_Tesla V100-SXM2-32GB": 132.5995142432129, "core_hours": 132.5995142432129}
{"step": 88450, "global_schedule": 0.12177112698554993, "l2_grads": 2.5157546997070312, "l2_params": 253.85052490234375, "l2_updates": 0.131440207362175, "training_loss": 3.978908061981201, "uptime": 32198.98679524497, "examples_seen": 90572800.0, "progress": 0.7934372112633099, "epoch": 71.40966054456362, "img/sec/core": 189.69245480432406, "core_hours_Tesla V100-SXM2-32GB": 132.67448940359495, "core_hours": 132.67448940359495}
{"step": 88500, "global_schedule": 0.12126535177230835, "l2_grads": 2.2841153144836426, "l2_params": 253.7986602783203, "l2_updates": 0.13120943307876587, "training_loss": 1.5422898530960083, "uptime": 32215.867650622968, "examples_seen": 90624000.0, "progress": 0.7938857342770258, "epoch": 71.4500277919037, "img/sec/core": 189.56385374707367, "core_hours_Tesla V100-SXM2-32GB": 132.74951542749716, "core_hours": 132.74951542749716}
{"step": 88550, "global_schedule": 0.12076053023338318, "l2_grads": 2.3963520526885986, "l2_params": 253.74395751953125, "l2_updates": 0.12935154139995575, "training_loss": 3.7128186225891113, "uptime": 32232.751199672, "examples_seen": 90675200.0, "progress": 0.7943342572907416, "epoch": 71.49039503924375, "img/sec/core": 189.5336099481797, "core_hours_Tesla V100-SXM2-32GB": 132.82455342327063, "core_hours": 132.82455342327063}
{"step": 88600, "global_schedule": 0.12025657296180725, "l2_grads": 2.350057363510132, "l2_params": 253.69224548339844, "l2_updates": 0.12931188941001892, "training_loss": 1.9711532592773438, "uptime": 32249.606840216962, "examples_seen": 90726400.0, "progress": 0.7947827803044574, "epoch": 71.53076228658381, "img/sec/core": 189.8474277179671, "core_hours_Tesla V100-SXM2-32GB": 132.89946738124826, "core_hours": 132.89946738124826}
{"step": 88650, "global_schedule": 0.11975356936454773, "l2_grads": 2.3805973529815674, "l2_params": 253.6325225830078, "l2_updates": 0.13060547411441803, "training_loss": 1.8668577671051025, "uptime": 32266.49329400796, "examples_seen": 90777600.0, "progress": 0.7952313033181733, "epoch": 71.57112953392387, "img/sec/core": 189.50100711529853, "core_hours_Tesla V100-SXM2-32GB": 132.974518286986, "core_hours": 132.974518286986}
{"step": 88700, "global_schedule": 0.11925143003463745, "l2_grads": 2.444758653640747, "l2_params": 253.5758514404297, "l2_updates": 0.13014622032642365, "training_loss": 1.947654128074646, "uptime": 32283.34896110196, "examples_seen": 90828800.0, "progress": 0.795679826331889, "epoch": 71.61149678126392, "img/sec/core": 189.84712869292423, "core_hours_Tesla V100-SXM2-32GB": 133.04943236295935, "core_hours": 133.04943236295935}
{"step": 88750, "global_schedule": 0.11875024437904358, "l2_grads": 2.4752941131591797, "l2_params": 253.51939392089844, "l2_updates": 0.12958480417728424, "training_loss": 4.271164417266846, "uptime": 32300.21551986097, "examples_seen": 90880000.0, "progress": 0.796128349345605, "epoch": 71.65186402860398, "img/sec/core": 189.72453395634344, "core_hours_Tesla V100-SXM2-32GB": 133.1243948463327, "core_hours": 133.1243948463327}
{"step": 88800, "global_schedule": 0.11824992299079895, "l2_grads": 2.4925429821014404, "l2_params": 253.47080993652344, "l2_updates": 0.1278703659772873, "training_loss": 4.037594795227051, "uptime": 32317.091238253983, "examples_seen": 90931200.0, "progress": 0.7965768723593207, "epoch": 71.69223127594404, "img/sec/core": 189.6215571672926, "core_hours_Tesla V100-SXM2-32GB": 133.19939803919058, "core_hours": 133.19939803919058}
{"step": 88850, "global_schedule": 0.11775058507919312, "l2_grads": 2.3581697940826416, "l2_params": 253.4142608642578, "l2_updates": 0.12761394679546356, "training_loss": 1.6868377923965454, "uptime": 32333.94528082898, "examples_seen": 90982400.0, "progress": 0.7970253953730366, "epoch": 71.7325985232841, "img/sec/core": 189.86542758277892, "core_hours_Tesla V100-SXM2-32GB": 133.27430489507944, "core_hours": 133.27430489507944}
{"step": 88900, "global_schedule": 0.11725208163261414, "l2_grads": 2.2427847385406494, "l2_params": 253.36065673828125, "l2_updates": 0.12763379514217377, "training_loss": 2.413499116897583, "uptime": 32350.81903381599, "examples_seen": 91033600.0, "progress": 0.7974739183867524, "epoch": 71.77296577062415, "img/sec/core": 189.64364373847602, "core_hours_Tesla V100-SXM2-32GB": 133.34929935279948, "core_hours": 133.34929935279948}
{"step": 88950, "global_schedule": 0.11675459146499634, "l2_grads": 2.371507406234741, "l2_params": 253.30807495117188, "l2_updates": 0.1277766227722168, "training_loss": 1.908259630203247, "uptime": 32367.695079325, "examples_seen": 91084800.0, "progress": 0.7979224414004683, "epoch": 71.81333301796421, "img/sec/core": 189.61788164720173, "core_hours_Tesla V100-SXM2-32GB": 133.42430399950618, "core_hours": 133.42430399950618}
{"step": 89000, "global_schedule": 0.1162579357624054, "l2_grads": 2.4961233139038086, "l2_params": 253.25448608398438, "l2_updates": 0.12695355713367462, "training_loss": 4.1549906730651855, "uptime": 32384.534765917982, "examples_seen": 91136000.0, "progress": 0.7983709644141841, "epoch": 71.85370026530427, "img/sec/core": 190.02728954192617, "core_hours_Tesla V100-SXM2-32GB": 133.49914705103055, "core_hours": 133.49914705103055}
{"step": 89050, "global_schedule": 0.11576226353645325, "l2_grads": 2.1428029537200928, "l2_params": 253.20425415039062, "l2_updates": 0.1267012059688568, "training_loss": 3.2127561569213867, "uptime": 32401.958820361004, "examples_seen": 91187200.0, "progress": 0.7988194874278999, "epoch": 71.89406751264433, "img/sec/core": 189.91896892158854, "core_hours_Tesla V100-SXM2-32GB": 133.57403278942195, "core_hours": 133.57403278942195}
{"step": 89100, "global_schedule": 0.11526742577552795, "l2_grads": 2.2335214614868164, "l2_params": 253.15061950683594, "l2_updates": 0.12679985165596008, "training_loss": 1.6627068519592285, "uptime": 32418.848841001978, "examples_seen": 91238400.0, "progress": 0.7992680104416158, "epoch": 71.93443475998438, "img/sec/core": 189.46098811963262, "core_hours_Tesla V100-SXM2-32GB": 133.64909954782627, "core_hours": 133.64909954782627}
{"step": 89150, "global_schedule": 0.11477360129356384, "l2_grads": 2.423771381378174, "l2_params": 253.101318359375, "l2_updates": 0.12453058362007141, "training_loss": 1.695190191268921, "uptime": 32435.711707615992, "examples_seen": 91289600.0, "progress": 0.7997165334553316, "epoch": 71.97480200732444, "img/sec/core": 189.76607437199527, "core_hours_Tesla V100-SXM2-32GB": 133.72404562166633, "core_hours": 133.72404562166633}
{"step": 89200, "global_schedule": 0.11428064107894897, "l2_grads": 2.3562326431274414, "l2_params": 253.04965209960938, "l2_updates": 0.12269353866577148, "training_loss": 3.047081470489502, "uptime": 32452.564935781003, "examples_seen": 91340800.0, "progress": 0.8001650564690475, "epoch": 72.0151692546645, "img/sec/core": 189.87460257871837, "core_hours_Tesla V100-SXM2-32GB": 133.79894885795528, "core_hours": 133.79894885795528}
{"step": 89250, "global_schedule": 0.1137886643409729, "l2_grads": 2.3407840728759766, "l2_params": 252.99774169921875, "l2_updates": 0.1240956038236618, "training_loss": 1.7788336277008057, "uptime": 32469.46444766398, "examples_seen": 91392000.0, "progress": 0.8006135794827632, "epoch": 72.05553650200457, "img/sec/core": 189.35458149080418, "core_hours_Tesla V100-SXM2-32GB": 133.8740577996574, "core_hours": 133.8740577996574}
{"step": 89300, "global_schedule": 0.11329752206802368, "l2_grads": 2.4762721061706543, "l2_params": 252.94454956054688, "l2_updates": 0.12458343803882599, "training_loss": 1.5543283224105835, "uptime": 32486.32360337698, "examples_seen": 91443200.0, "progress": 0.8010621024964791, "epoch": 72.09590374934463, "img/sec/core": 189.8078441456465, "core_hours_Tesla V100-SXM2-32GB": 133.94898738060405, "core_hours": 133.94898738060405}
{"step": 89350, "global_schedule": 0.11280739307403564, "l2_grads": 2.2693827152252197, "l2_params": 252.89207458496094, "l2_updates": 0.12343841791152954, "training_loss": 2.5625827312469482, "uptime": 32503.198048827995, "examples_seen": 91494400.0, "progress": 0.8015106255101949, "epoch": 72.13627099668469, "img/sec/core": 189.6358614740324, "core_hours_Tesla V100-SXM2-32GB": 134.0239849159419, "core_hours": 134.0239849159419}
{"step": 89401, "global_schedule": 0.11231812834739685, "l2_grads": 2.4240527153015137, "l2_params": 252.84014892578125, "l2_updates": 0.12210298329591751, "training_loss": 1.7861392498016357, "uptime": 32520.070533945982, "examples_seen": 91545600.0, "progress": 0.8019591485239108, "epoch": 72.17663824402474, "img/sec/core": 189.65789435420285, "core_hours_Tesla V100-SXM2-32GB": 134.0989737386885, "core_hours": 134.0989737386885}
{"step": 89450, "global_schedule": 0.11182984709739685, "l2_grads": 2.417452812194824, "l2_params": 252.7892608642578, "l2_updates": 0.12079780548810959, "training_loss": 1.7014381885528564, "uptime": 32536.936571992992, "examples_seen": 91596800.0, "progress": 0.8024076715376266, "epoch": 72.2170054913648, "img/sec/core": 189.73039139842797, "core_hours_Tesla V100-SXM2-32GB": 134.17393390778633, "core_hours": 134.17393390778633}
{"step": 89500, "global_schedule": 0.1113424301147461, "l2_grads": 2.360957145690918, "l2_params": 252.73800659179688, "l2_updates": 0.11993923038244247, "training_loss": 1.6871135234832764, "uptime": 32553.80529660295, "examples_seen": 91648000.0, "progress": 0.8028561945513424, "epoch": 72.25737273870486, "img/sec/core": 189.7001743754216, "core_hours_Tesla V100-SXM2-32GB": 134.24890601716393, "core_hours": 134.24890601716393}
{"step": 89550, "global_schedule": 0.11085596680641174, "l2_grads": 2.371428966522217, "l2_params": 252.68788146972656, "l2_updates": 0.12044127285480499, "training_loss": 3.7701399326324463, "uptime": 32570.699451975, "examples_seen": 91699200.0, "progress": 0.8033047175650583, "epoch": 72.29773998604492, "img/sec/core": 189.41461881509784, "core_hours_Tesla V100-SXM2-32GB": 134.32399115215082, "core_hours": 134.32399115215082}
{"step": 89600, "global_schedule": 0.11037048697471619, "l2_grads": 2.314051628112793, "l2_params": 252.6377410888672, "l2_updates": 0.1209426149725914, "training_loss": 1.7058416604995728, "uptime": 32587.575525288004, "examples_seen": 91750400.0, "progress": 0.8037532405787741, "epoch": 72.33810723338497, "img/sec/core": 189.6175692442766, "core_hours_Tesla V100-SXM2-32GB": 134.39899592243083, "core_hours": 134.39899592243083}
{"step": 89650, "global_schedule": 0.10988587141036987, "l2_grads": 2.226813316345215, "l2_params": 252.58880615234375, "l2_updates": 0.12012320011854172, "training_loss": 2.9422459602355957, "uptime": 32604.43613179197, "examples_seen": 91801600.0, "progress": 0.80420176359249, "epoch": 72.37847448072503, "img/sec/core": 189.79151190366008, "core_hours_Tesla V100-SXM2-32GB": 134.47393195133733, "core_hours": 134.47393195133733}
{"step": 89700, "global_schedule": 0.10940226912498474, "l2_grads": 2.2951173782348633, "l2_params": 252.5357666015625, "l2_updates": 0.11837910115718842, "training_loss": 1.7316186428070068, "uptime": 32621.327736996987, "examples_seen": 91852800.0, "progress": 0.8046502866062057, "epoch": 72.41884172806509, "img/sec/core": 189.44321520427104, "core_hours_Tesla V100-SXM2-32GB": 134.54900575224852, "core_hours": 134.54900575224852}
{"step": 89750, "global_schedule": 0.10891953110694885, "l2_grads": 2.3569858074188232, "l2_params": 252.4819793701172, "l2_updates": 0.1201651394367218, "training_loss": 1.7253170013427734, "uptime": 32638.198862331978, "examples_seen": 91904000.0, "progress": 0.8050988096199216, "epoch": 72.45920897540515, "img/sec/core": 189.6731804465524, "core_hours_Tesla V100-SXM2-32GB": 134.62398853151515, "core_hours": 134.62398853151515}
{"step": 89800, "global_schedule": 0.10843777656555176, "l2_grads": 2.246547222137451, "l2_params": 252.43234252929688, "l2_updates": 0.11743436753749847, "training_loss": 3.216184616088867, "uptime": 32655.077701737988, "examples_seen": 91955200.0, "progress": 0.8055473326336374, "epoch": 72.4995762227452, "img/sec/core": 189.58649484279954, "core_hours_Tesla V100-SXM2-32GB": 134.69900559554188, "core_hours": 134.69900559554188}
{"step": 89850, "global_schedule": 0.1079569160938263, "l2_grads": 2.425128698348999, "l2_params": 252.3837127685547, "l2_updates": 0.11650211364030838, "training_loss": 2.0973706245422363, "uptime": 32671.952398200985, "examples_seen": 92006400.0, "progress": 0.8059958556473533, "epoch": 72.53994347008526, "img/sec/core": 189.63304063080167, "core_hours_Tesla V100-SXM2-32GB": 134.77400424648852, "core_hours": 134.77400424648852}
{"step": 89900, "global_schedule": 0.10747706890106201, "l2_grads": 2.40543532371521, "l2_params": 252.3308563232422, "l2_updates": 0.11828334629535675, "training_loss": 1.8679077625274658, "uptime": 32688.820333754993, "examples_seen": 92057600.0, "progress": 0.8064443786610691, "epoch": 72.58031071742532, "img/sec/core": 189.7090482563319, "core_hours_Tesla V100-SXM2-32GB": 134.84897284895078, "core_hours": 134.84897284895078}
{"step": 89950, "global_schedule": 0.10699805617332458, "l2_grads": 2.4928038120269775, "l2_params": 252.28314208984375, "l2_updates": 0.11663956195116043, "training_loss": 4.026297092437744, "uptime": 32705.68256865599, "examples_seen": 92108800.0, "progress": 0.8068929016747849, "epoch": 72.62067796476539, "img/sec/core": 189.7731836134533, "core_hours_Tesla V100-SXM2-32GB": 134.92391611517743, "core_hours": 134.92391611517743}
{"step": 90000, "global_schedule": 0.10652008652687073, "l2_grads": 2.4329638481140137, "l2_params": 252.2324676513672, "l2_updates": 0.11629345268011093, "training_loss": 1.7526769638061523, "uptime": 32722.560527646972, "examples_seen": 92160000.0, "progress": 0.8073414246885008, "epoch": 72.66104521210545, "img/sec/core": 189.59638435604927, "core_hours_Tesla V100-SXM2-32GB": 134.99892926624847, "core_hours": 134.99892926624847, "minival/prec@1": 0.779191383078364, "minival/loss": 0.9054026893999217, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.9135266430093907, "real/prec@1": 0.8119648995452313, "real/loss": 1.6994908950981262, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.27361730398843, "train/prec@1": 0.8222690551457674, "train/loss": 0.6895774111360473, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.575248526991345, "v2/prec@1": 0.6174, "v2/loss": 1.6597005493164063, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3829921719734557, "val/prec@1": 0.74162, "val/loss": 1.0381363464355469, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.322045462962706}
{"step": 90050, "global_schedule": 0.10604298114776611, "l2_grads": 2.138397216796875, "l2_params": 252.18141174316406, "l2_updates": 0.11464336514472961, "training_loss": 2.8778035640716553, "uptime": 32776.482682648, "examples_seen": 92211200.0, "progress": 0.8077899477022166, "epoch": 72.7014124594455, "img/sec/core": 189.08529324000227, "core_hours_Tesla V100-SXM2-32GB": 135.07414517531532, "core_hours": 135.07414517531532}
{"step": 90100, "global_schedule": 0.10556688904762268, "l2_grads": 2.481065034866333, "l2_params": 252.132080078125, "l2_updates": 0.11457070708274841, "training_loss": 4.0541839599609375, "uptime": 32793.38284631999, "examples_seen": 92262400.0, "progress": 0.8082384707159325, "epoch": 72.74177970678556, "img/sec/core": 189.34727864815693, "core_hours_Tesla V100-SXM2-32GB": 135.14925701385752, "core_hours": 135.14925701385752}
{"step": 90150, "global_schedule": 0.10509169101715088, "l2_grads": 2.32816743850708, "l2_params": 252.0871124267578, "l2_updates": 0.11557811498641968, "training_loss": 1.6598454713821411, "uptime": 32810.272003109974, "examples_seen": 92313600.0, "progress": 0.8086869937296483, "epoch": 72.78214695412562, "img/sec/core": 189.47067871959322, "core_hours_Tesla V100-SXM2-32GB": 135.22431993292412, "core_hours": 135.22431993292412}
{"step": 90200, "global_schedule": 0.10461747646331787, "l2_grads": 2.4675261974334717, "l2_params": 252.03456115722656, "l2_updates": 0.11393914371728897, "training_loss": 1.6189634799957275, "uptime": 32827.16174795898, "examples_seen": 92364800.0, "progress": 0.8091355167433641, "epoch": 72.82251420146568, "img/sec/core": 189.46408182057286, "core_hours_Tesla V100-SXM2-32GB": 135.29938546558634, "core_hours": 135.29938546558634}
{"step": 90250, "global_schedule": 0.1041441559791565, "l2_grads": 2.3666365146636963, "l2_params": 251.98435974121094, "l2_updates": 0.11479693651199341, "training_loss": 1.834824562072754, "uptime": 32844.05615692597, "examples_seen": 92416000.0, "progress": 0.8095840397570799, "epoch": 72.86288144880574, "img/sec/core": 189.41177559103798, "core_hours_Tesla V100-SXM2-32GB": 135.3744717276619, "core_hours": 135.3744717276619}
{"step": 90300, "global_schedule": 0.1036718487739563, "l2_grads": 2.4083056449890137, "l2_params": 251.93695068359375, "l2_updates": 0.11309187859296799, "training_loss": 1.7661750316619873, "uptime": 32860.94066914398, "examples_seen": 92467200.0, "progress": 0.8100325627707957, "epoch": 72.9032486961458, "img/sec/core": 189.5227980934725, "core_hours_Tesla V100-SXM2-32GB": 135.44951400418637, "core_hours": 135.44951400418637}
{"step": 90350, "global_schedule": 0.10320043563842773, "l2_grads": 2.3945693969726562, "l2_params": 251.8882598876953, "l2_updates": 0.11278962343931198, "training_loss": 3.9129409790039062, "uptime": 32877.826457457966, "examples_seen": 92518400.0, "progress": 0.8104810857845116, "epoch": 72.94361594348585, "img/sec/core": 189.50847544082285, "core_hours_Tesla V100-SXM2-32GB": 135.52456195224852, "core_hours": 135.52456195224852}
{"step": 90400, "global_schedule": 0.10273003578186035, "l2_grads": 2.427565574645996, "l2_params": 251.84144592285156, "l2_updates": 0.11218011379241943, "training_loss": 1.7151261568069458, "uptime": 32894.74013590097, "examples_seen": 92569600.0, "progress": 0.8109296087982274, "epoch": 72.98398319082591, "img/sec/core": 189.19598186662702, "core_hours_Tesla V100-SXM2-32GB": 135.59973385643966, "core_hours": 135.59973385643966}
{"step": 90450, "global_schedule": 0.10226050019264221, "l2_grads": 2.215984344482422, "l2_params": 251.7920684814453, "l2_updates": 0.11221379041671753, "training_loss": 2.7445180416107178, "uptime": 32911.62606030295, "examples_seen": 92620800.0, "progress": 0.8113781318119433, "epoch": 73.02435043816597, "img/sec/core": 189.5069481433899, "core_hours_Tesla V100-SXM2-32GB": 135.67478240933735, "core_hours": 135.67478240933735}
{"step": 90500, "global_schedule": 0.10179200768470764, "l2_grads": 2.393735647201538, "l2_params": 251.74526977539062, "l2_updates": 0.11082420498132706, "training_loss": 1.7345423698425293, "uptime": 32928.513878753, "examples_seen": 92672000.0, "progress": 0.8118266548256591, "epoch": 73.06471768550603, "img/sec/core": 189.48569405011176, "core_hours_Tesla V100-SXM2-32GB": 135.74983938022646, "core_hours": 135.74983938022646}
{"step": 90550, "global_schedule": 0.1013244092464447, "l2_grads": 2.333906650543213, "l2_params": 251.69866943359375, "l2_updates": 0.11076217144727707, "training_loss": 1.7980519533157349, "uptime": 32945.39508821996, "examples_seen": 92723200.0, "progress": 0.812275177839375, "epoch": 73.10508493284608, "img/sec/core": 189.5598775824616, "core_hours_Tesla V100-SXM2-32GB": 135.82486697785737, "core_hours": 135.82486697785737}
{"step": 90600, "global_schedule": 0.10085782408714294, "l2_grads": 2.2851691246032715, "l2_params": 251.65048217773438, "l2_updates": 0.10945450514554977, "training_loss": 2.5791449546813965, "uptime": 32962.303555321996, "examples_seen": 92774400.0, "progress": 0.8127237008530908, "epoch": 73.14545218018614, "img/sec/core": 189.25429376232952, "core_hours_Tesla V100-SXM2-32GB": 135.9000157205331, "core_hours": 135.9000157205331}
{"step": 90650, "global_schedule": 0.10039210319519043, "l2_grads": 2.5513880252838135, "l2_params": 251.59996032714844, "l2_updates": 0.1097547858953476, "training_loss": 3.9825804233551025, "uptime": 32979.19479235995, "examples_seen": 92825600.0, "progress": 0.8131722238668067, "epoch": 73.18581942752621, "img/sec/core": 189.44734437208797, "core_hours_Tesla V100-SXM2-32GB": 135.97508788514625, "core_hours": 135.97508788514625}
{"step": 90700, "global_schedule": 0.09992742538452148, "l2_grads": 2.3032796382904053, "l2_params": 251.55357360839844, "l2_updates": 0.10963082313537598, "training_loss": 1.6794559955596924, "uptime": 32996.09801840398, "examples_seen": 92876800.0, "progress": 0.8136207468805224, "epoch": 73.22618667486627, "img/sec/core": 189.31297443841427, "core_hours_Tesla V100-SXM2-32GB": 136.05021333423082, "core_hours": 136.05021333423082}
{"step": 90750, "global_schedule": 0.09946364164352417, "l2_grads": 2.359215021133423, "l2_params": 251.50462341308594, "l2_updates": 0.10859378427267075, "training_loss": 1.584791660308838, "uptime": 33012.990920247976, "examples_seen": 92928000.0, "progress": 0.8140692698942382, "epoch": 73.26655392220633, "img/sec/core": 189.4286742178266, "core_hours_Tesla V100-SXM2-32GB": 136.1252928979819, "core_hours": 136.1252928979819}
{"step": 90801, "global_schedule": 0.09900090098381042, "l2_grads": 2.3708701133728027, "l2_params": 251.4576416015625, "l2_updates": 0.10721851140260696, "training_loss": 2.0665011405944824, "uptime": 33029.874167423, "examples_seen": 92979200.0, "progress": 0.8145177929079541, "epoch": 73.30692116954638, "img/sec/core": 189.5369988265306, "core_hours_Tesla V100-SXM2-32GB": 136.2003295520931, "core_hours": 136.2003295520931}
{"step": 90850, "global_schedule": 0.09853902459144592, "l2_grads": 2.349514961242676, "l2_params": 251.41006469726562, "l2_updates": 0.1078684851527214, "training_loss": 2.121150016784668, "uptime": 33046.746819722, "examples_seen": 93030400.0, "progress": 0.8149663159216699, "epoch": 73.34728841688644, "img/sec/core": 189.65601514759828, "core_hours_Tesla V100-SXM2-32GB": 136.27531911786645, "core_hours": 136.27531911786645}
{"step": 90900, "global_schedule": 0.09807819128036499, "l2_grads": 2.378342390060425, "l2_params": 251.36245727539062, "l2_updates": 0.10573671013116837, "training_loss": 2.9605743885040283, "uptime": 33063.66128176998, "examples_seen": 93081600.0, "progress": 0.8154148389353858, "epoch": 73.3876556642265, "img/sec/core": 189.18721688712998, "core_hours_Tesla V100-SXM2-32GB": 136.35049450474637, "core_hours": 136.35049450474637}
{"step": 90950, "global_schedule": 0.09761825203895569, "l2_grads": 2.39904522895813, "l2_params": 251.31646728515625, "l2_updates": 0.10726012289524078, "training_loss": 1.6924617290496826, "uptime": 33080.55303973495, "examples_seen": 93132800.0, "progress": 0.8158633619491016, "epoch": 73.42802291156656, "img/sec/core": 189.441501981964, "core_hours_Tesla V100-SXM2-32GB": 136.42556898459068, "core_hours": 136.42556898459068}
{"step": 91000, "global_schedule": 0.09715935587882996, "l2_grads": 2.4778048992156982, "l2_params": 251.2664031982422, "l2_updates": 0.10727736353874207, "training_loss": 1.6120905876159668, "uptime": 33097.43521236599, "examples_seen": 93184000.0, "progress": 0.8163118849628175, "epoch": 73.46839015890662, "img/sec/core": 189.5490627856803, "core_hours_Tesla V100-SXM2-32GB": 136.50060086295085, "core_hours": 136.50060086295085}
{"step": 91050, "global_schedule": 0.09670135378837585, "l2_grads": 2.4287540912628174, "l2_params": 251.21897888183594, "l2_updates": 0.10523531585931778, "training_loss": 1.634244441986084, "uptime": 33114.89761200099, "examples_seen": 93235200.0, "progress": 0.8167604079765333, "epoch": 73.50875740624667, "img/sec/core": 189.6428368959566, "core_hours_Tesla V100-SXM2-32GB": 136.57559563973763, "core_hours": 136.57559563973763}
{"step": 91100, "global_schedule": 0.09624436497688293, "l2_grads": 2.5382513999938965, "l2_params": 251.17379760742188, "l2_updates": 0.10478073358535767, "training_loss": 1.948869228363037, "uptime": 33131.76809151395, "examples_seen": 93286400.0, "progress": 0.8172089309902492, "epoch": 73.54912465358673, "img/sec/core": 189.6804413615982, "core_hours_Tesla V100-SXM2-32GB": 136.65057554868412, "core_hours": 136.65057554868412}
{"step": 91150, "global_schedule": 0.09578830003738403, "l2_grads": 2.570197820663452, "l2_params": 251.12376403808594, "l2_updates": 0.10253148525953293, "training_loss": 1.6396665573120117, "uptime": 33148.641764339, "examples_seen": 93337600.0, "progress": 0.817657454003965, "epoch": 73.58949190092679, "img/sec/core": 189.64454468081928, "core_hours_Tesla V100-SXM2-32GB": 136.7255696501288, "core_hours": 136.7255696501288}
{"step": 91200, "global_schedule": 0.09533324837684631, "l2_grads": 2.347243309020996, "l2_params": 251.07675170898438, "l2_updates": 0.10337719321250916, "training_loss": 1.8667702674865723, "uptime": 33165.519705806975, "examples_seen": 93388800.0, "progress": 0.8181059770176807, "epoch": 73.62985914826685, "img/sec/core": 189.5965811987229, "core_hours_Tesla V100-SXM2-32GB": 136.8005827233198, "core_hours": 136.8005827233198}
{"step": 91250, "global_schedule": 0.09487912058830261, "l2_grads": 2.277677297592163, "l2_params": 251.02984619140625, "l2_updates": 0.10433516651391983, "training_loss": 1.7515690326690674, "uptime": 33182.40112839296, "examples_seen": 93440000.0, "progress": 0.8185545000313966, "epoch": 73.6702263956069, "img/sec/core": 189.5574844893195, "core_hours_Tesla V100-SXM2-32GB": 136.87561126814637, "core_hours": 136.87561126814637}
{"step": 91300, "global_schedule": 0.09442600607872009, "l2_grads": 2.277751922607422, "l2_params": 250.98414611816406, "l2_updates": 0.10236401110887527, "training_loss": 2.419369697570801, "uptime": 33199.26535803196, "examples_seen": 93491200.0, "progress": 0.8190030230451124, "epoch": 73.71059364294696, "img/sec/core": 189.750736825786, "core_hours_Tesla V100-SXM2-32GB": 136.95056339987528, "core_hours": 136.95056339987528}
{"step": 91350, "global_schedule": 0.09397381544113159, "l2_grads": 2.4690890312194824, "l2_params": 250.9414520263672, "l2_updates": 0.10105518996715546, "training_loss": 2.1820321083068848, "uptime": 33216.13815365598, "examples_seen": 93542400.0, "progress": 0.8194515460588283, "epoch": 73.75096089028702, "img/sec/core": 189.6544041252326, "core_hours_Tesla V100-SXM2-32GB": 137.0255536026487, "core_hours": 137.0255536026487}
{"step": 91400, "global_schedule": 0.09352266788482666, "l2_grads": 2.2310428619384766, "l2_params": 250.89405822753906, "l2_updates": 0.10086571425199509, "training_loss": 2.750335216522217, "uptime": 33233.00711623597, "examples_seen": 93593600.0, "progress": 0.8199000690725441, "epoch": 73.79132813762709, "img/sec/core": 189.6974982798326, "core_hours_Tesla V100-SXM2-32GB": 137.10052676967086, "core_hours": 137.10052676967086}
{"step": 91450, "global_schedule": 0.09307241439819336, "l2_grads": 2.194995641708374, "l2_params": 250.8477783203125, "l2_updates": 0.1030615046620369, "training_loss": 2.7789528369903564, "uptime": 33249.910435531, "examples_seen": 93644800.0, "progress": 0.82034859208626, "epoch": 73.83169538496715, "img/sec/core": 189.3119300503815, "core_hours_Tesla V100-SXM2-32GB": 137.17565263320432, "core_hours": 137.17565263320432}
{"step": 91500, "global_schedule": 0.09262320399284363, "l2_grads": 2.3590917587280273, "l2_params": 250.8023681640625, "l2_updates": 0.09957829117774963, "training_loss": 2.799345016479492, "uptime": 33266.75040606398, "examples_seen": 93696000.0, "progress": 0.8207971150999758, "epoch": 73.8720626323072, "img/sec/core": 190.02408547765145, "core_hours_Tesla V100-SXM2-32GB": 137.25049694668422, "core_hours": 137.25049694668422}
{"step": 91550, "global_schedule": 0.09217491745948792, "l2_grads": 2.3641178607940674, "l2_params": 250.75604248046875, "l2_updates": 0.10110893100500107, "training_loss": 3.3288004398345947, "uptime": 33283.648870909994, "examples_seen": 93747200.0, "progress": 0.8212456381136917, "epoch": 73.91242987964726, "img/sec/core": 189.36631399119005, "core_hours_Tesla V100-SXM2-32GB": 137.32560123488878, "core_hours": 137.32560123488878}
{"step": 91600, "global_schedule": 0.09172767400741577, "l2_grads": 2.6124892234802246, "l2_params": 250.7095184326172, "l2_updates": 0.09999450296163559, "training_loss": 3.8065030574798584, "uptime": 33300.529721284984, "examples_seen": 93798400.0, "progress": 0.8216941611274075, "epoch": 73.95279712698732, "img/sec/core": 189.56390992843907, "core_hours_Tesla V100-SXM2-32GB": 137.40062723655538, "core_hours": 137.40062723655538}
{"step": 91650, "global_schedule": 0.09128132462501526, "l2_grads": 2.391206979751587, "l2_params": 250.66307067871094, "l2_updates": 0.09997761994600296, "training_loss": 1.6205418109893799, "uptime": 33317.406537687, "examples_seen": 93849600.0, "progress": 0.8221426841411232, "epoch": 73.99316437432738, "img/sec/core": 189.60922035141493, "core_hours_Tesla V100-SXM2-32GB": 137.47563530945322, "core_hours": 137.47563530945322}
{"step": 91700, "global_schedule": 0.09083595871925354, "l2_grads": 2.5476250648498535, "l2_params": 250.61892700195312, "l2_updates": 0.09906082600355148, "training_loss": 1.7166388034820557, "uptime": 33334.29139352596, "examples_seen": 93900800.0, "progress": 0.8225912071548391, "epoch": 74.03353162166744, "img/sec/core": 189.5189411458692, "core_hours_Tesla V100-SXM2-32GB": 137.55067911318193, "core_hours": 137.55067911318193}
{"step": 91750, "global_schedule": 0.09039163589477539, "l2_grads": 2.4652390480041504, "l2_params": 250.572021484375, "l2_updates": 0.09930690377950668, "training_loss": 1.8361566066741943, "uptime": 33351.17403010395, "examples_seen": 93952000.0, "progress": 0.8230397301685549, "epoch": 74.0738988690075, "img/sec/core": 189.54385384155898, "core_hours_Tesla V100-SXM2-32GB": 137.62571305352859, "core_hours": 137.62571305352859}
{"step": 91800, "global_schedule": 0.08994823694229126, "l2_grads": 2.4925732612609863, "l2_params": 250.5281524658203, "l2_updates": 0.09762316197156906, "training_loss": 3.009887933731079, "uptime": 33368.075644317956, "examples_seen": 94003200.0, "progress": 0.8234882531822708, "epoch": 74.11426611634755, "img/sec/core": 189.33102835520108, "core_hours_Tesla V100-SXM2-32GB": 137.70083133892416, "core_hours": 137.70083133892416}
{"step": 91850, "global_schedule": 0.08950591087341309, "l2_grads": 2.2532105445861816, "l2_params": 250.48265075683594, "l2_updates": 0.09677117317914963, "training_loss": 2.797609806060791, "uptime": 33384.95697791496, "examples_seen": 94054400.0, "progress": 0.8239367761959866, "epoch": 74.15463336368761, "img/sec/core": 189.55848373068338, "core_hours_Tesla V100-SXM2-32GB": 137.77585948824418, "core_hours": 137.77585948824418}
{"step": 91900, "global_schedule": 0.08906444907188416, "l2_grads": 2.5359046459198, "l2_params": 250.4377899169922, "l2_updates": 0.0975487232208252, "training_loss": 1.648591160774231, "uptime": 33401.846223175, "examples_seen": 94105600.0, "progress": 0.8243852992097025, "epoch": 74.19500061102767, "img/sec/core": 189.46968622517312, "core_hours_Tesla V100-SXM2-32GB": 137.850922800511, "core_hours": 137.850922800511}
{"step": 91950, "global_schedule": 0.08862408995628357, "l2_grads": 2.3367977142333984, "l2_params": 250.3935089111328, "l2_updates": 0.09547465294599533, "training_loss": 2.653132915496826, "uptime": 33418.714982189005, "examples_seen": 94156800.0, "progress": 0.8248338222234183, "epoch": 74.23536785836772, "img/sec/core": 189.69978747953834, "core_hours_Tesla V100-SXM2-32GB": 137.9258950627955, "core_hours": 137.9258950627955}
{"step": 92000, "global_schedule": 0.08818462491035461, "l2_grads": 2.280684471130371, "l2_params": 250.3506622314453, "l2_updates": 0.0965656191110611, "training_loss": 3.0382533073425293, "uptime": 33435.605210598966, "examples_seen": 94208000.0, "progress": 0.8252823452371341, "epoch": 74.27573510570778, "img/sec/core": 189.45865753437153, "core_hours_Tesla V100-SXM2-32GB": 138.0009627446175, "core_hours": 138.0009627446175}
{"step": 92050, "global_schedule": 0.08774620294570923, "l2_grads": 2.4459428787231445, "l2_params": 250.3074188232422, "l2_updates": 0.09526306390762329, "training_loss": 1.6001641750335693, "uptime": 33453.27270466497, "examples_seen": 94259200.0, "progress": 0.82573086825085, "epoch": 74.31610235304784, "img/sec/core": 189.73573719593375, "core_hours_Tesla V100-SXM2-32GB": 138.0759208017153, "core_hours": 138.0759208017153}
{"step": 92100, "global_schedule": 0.08730870485305786, "l2_grads": 2.4472804069519043, "l2_params": 250.26394653320312, "l2_updates": 0.09335143119096756, "training_loss": 3.525561571121216, "uptime": 33470.144244375, "examples_seen": 94310400.0, "progress": 0.8261793912645657, "epoch": 74.35646960038791, "img/sec/core": 189.66852196052784, "core_hours_Tesla V100-SXM2-32GB": 138.15090542264878, "core_hours": 138.15090542264878}
{"step": 92151, "global_schedule": 0.08687227964401245, "l2_grads": 2.285187005996704, "l2_params": 250.2236328125, "l2_updates": 0.09358679503202438, "training_loss": 3.073187828063965, "uptime": 33487.022522214975, "examples_seen": 94361600.0, "progress": 0.8266279142782816, "epoch": 74.39683684772797, "img/sec/core": 189.59280267449853, "core_hours_Tesla V100-SXM2-32GB": 138.22591999082644, "core_hours": 138.22591999082644}
{"step": 92200, "global_schedule": 0.08643677830696106, "l2_grads": 2.611999273300171, "l2_params": 250.17796325683594, "l2_updates": 0.09389372169971466, "training_loss": 1.9089679718017578, "uptime": 33503.91309182299, "examples_seen": 94412800.0, "progress": 0.8270764372919974, "epoch": 74.43720409506803, "img/sec/core": 189.45483037356541, "core_hours_Tesla V100-SXM2-32GB": 138.3009891890843, "core_hours": 138.3009891890843}
{"step": 92250, "global_schedule": 0.08600232005119324, "l2_grads": 2.4447402954101562, "l2_params": 250.133056640625, "l2_updates": 0.09449895471334457, "training_loss": 2.067028284072876, "uptime": 33520.77237599698, "examples_seen": 94464000.0, "progress": 0.8275249603057133, "epoch": 74.47757134240808, "img/sec/core": 189.80639788593115, "core_hours_Tesla V100-SXM2-32GB": 138.3759193409687, "core_hours": 138.3759193409687}
{"step": 92300, "global_schedule": 0.08556878566741943, "l2_grads": 2.5305583477020264, "l2_params": 250.08734130859375, "l2_updates": 0.09340418875217438, "training_loss": 1.7608619928359985, "uptime": 33537.66327487596, "examples_seen": 94515200.0, "progress": 0.8279734833194291, "epoch": 74.51793858974814, "img/sec/core": 189.45113714361284, "core_hours_Tesla V100-SXM2-32GB": 138.45099000265307, "core_hours": 138.45099000265307}
{"step": 92350, "global_schedule": 0.08513632416725159, "l2_grads": 2.3223133087158203, "l2_params": 250.04861450195312, "l2_updates": 0.0926603153347969, "training_loss": 2.557469367980957, "uptime": 33554.533927896, "examples_seen": 94566400.0, "progress": 0.828422006333145, "epoch": 74.5583058370882, "img/sec/core": 189.6784905835121, "core_hours_Tesla V100-SXM2-32GB": 138.5259706827421, "core_hours": 138.5259706827421}
{"step": 92400, "global_schedule": 0.08470478653907776, "l2_grads": 2.3895249366760254, "l2_params": 250.004150390625, "l2_updates": 0.09359168261289597, "training_loss": 1.8530864715576172, "uptime": 33571.421204285, "examples_seen": 94617600.0, "progress": 0.8288705293468608, "epoch": 74.59867308442826, "img/sec/core": 189.4917763106668, "core_hours_Tesla V100-SXM2-32GB": 138.601025244471, "core_hours": 138.601025244471}
{"step": 92450, "global_schedule": 0.08427432179450989, "l2_grads": 2.318162441253662, "l2_params": 249.9619903564453, "l2_updates": 0.09207246452569962, "training_loss": 3.437821388244629, "uptime": 33588.313552154985, "examples_seen": 94668800.0, "progress": 0.8293190523605766, "epoch": 74.63904033176831, "img/sec/core": 189.4348864130062, "core_hours_Tesla V100-SXM2-32GB": 138.67610234611539, "core_hours": 138.67610234611539}
{"step": 92500, "global_schedule": 0.08384475111961365, "l2_grads": 2.3441290855407715, "l2_params": 249.91941833496094, "l2_updates": 0.09231039881706238, "training_loss": 1.6279842853546143, "uptime": 33605.19248175796, "examples_seen": 94720000.0, "progress": 0.8297675753742925, "epoch": 74.67940757910837, "img/sec/core": 189.58548173792943, "core_hours_Tesla V100-SXM2-32GB": 138.75111981101747, "core_hours": 138.75111981101747, "minival/prec@1": 0.7813768342179207, "minival/loss": 0.8700039042110485, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.907552807999309, "real/prec@1": 0.8170890535260584, "real/loss": 1.673114616895263, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.143883528013248, "train/prec@1": 0.8294110759864185, "train/loss": 0.6484378084935243, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.558820712030865, "v2/prec@1": 0.6203, "v2/loss": 1.6288108764648437, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3580686139757745, "val/prec@1": 0.7476, "val/loss": 0.999786630859375, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.292302482994273}
{"step": 92550, "global_schedule": 0.08341628313064575, "l2_grads": 2.595083475112915, "l2_params": 249.8780975341797, "l2_updates": 0.09107176959514618, "training_loss": 1.6501965522766113, "uptime": 33658.34534400399, "examples_seen": 94771200.0, "progress": 0.8302160983880083, "epoch": 74.71977482644843, "img/sec/core": 189.45801626791004, "core_hours_Tesla V100-SXM2-32GB": 138.82618774692426, "core_hours": 138.82618774692426}
{"step": 92601, "global_schedule": 0.08298870921134949, "l2_grads": 2.480518341064453, "l2_params": 249.83621215820312, "l2_updates": 0.09071382880210876, "training_loss": 1.7617855072021484, "uptime": 33675.222414847, "examples_seen": 94822400.0, "progress": 0.8306646214017241, "epoch": 74.76014207378849, "img/sec/core": 189.60636177725624, "core_hours_Tesla V100-SXM2-32GB": 138.90119695067096, "core_hours": 138.90119695067096}
{"step": 92650, "global_schedule": 0.08256223797798157, "l2_grads": 2.519310235977173, "l2_params": 249.79396057128906, "l2_updates": 0.08945957571268082, "training_loss": 1.5335891246795654, "uptime": 33692.08168241795, "examples_seen": 94873600.0, "progress": 0.8311131444154399, "epoch": 74.80050932112854, "img/sec/core": 189.80658480761045, "core_hours_Tesla V100-SXM2-32GB": 138.97612702876407, "core_hours": 138.97612702876407}
{"step": 92700, "global_schedule": 0.08213669061660767, "l2_grads": 2.404944658279419, "l2_params": 249.75294494628906, "l2_updates": 0.08969872444868088, "training_loss": 1.682145118713379, "uptime": 33708.982141871005, "examples_seen": 94924800.0, "progress": 0.8315616674291558, "epoch": 74.8408765684686, "img/sec/core": 189.34396481282323, "core_hours_Tesla V100-SXM2-32GB": 139.05124018188877, "core_hours": 139.05124018188877}
{"step": 92750, "global_schedule": 0.08171218633651733, "l2_grads": 2.4735090732574463, "l2_params": 249.70982360839844, "l2_updates": 0.0896586999297142, "training_loss": 1.7637343406677246, "uptime": 33725.878955892986, "examples_seen": 94976000.0, "progress": 0.8320101904428716, "epoch": 74.88124381580866, "img/sec/core": 189.38481513954335, "core_hours_Tesla V100-SXM2-32GB": 139.12633713309756, "core_hours": 139.12633713309756}
{"step": 92800, "global_schedule": 0.08128863573074341, "l2_grads": 2.3857581615448, "l2_params": 249.6683807373047, "l2_updates": 0.0884813442826271, "training_loss": 1.6731051206588745, "uptime": 33742.76673831395, "examples_seen": 95027200.0, "progress": 0.8324587134565875, "epoch": 74.92161106314873, "img/sec/core": 189.48609830665472, "core_hours_Tesla V100-SXM2-32GB": 139.2013939438574, "core_hours": 139.2013939438574}
{"step": 92850, "global_schedule": 0.08086615800857544, "l2_grads": 2.4098875522613525, "l2_params": 249.62843322753906, "l2_updates": 0.08875823020935059, "training_loss": 1.6645071506500244, "uptime": 33759.652512526955, "examples_seen": 95078400.0, "progress": 0.8329072364703033, "epoch": 74.96197831048879, "img/sec/core": 189.50863369565198, "core_hours_Tesla V100-SXM2-32GB": 139.27644182924854, "core_hours": 139.27644182924854}
{"step": 92900, "global_schedule": 0.08044463396072388, "l2_grads": 2.306281328201294, "l2_params": 249.5867156982422, "l2_updates": 0.08658457547426224, "training_loss": 2.8704638481140137, "uptime": 33776.54404379096, "examples_seen": 95129600.0, "progress": 0.8333557594840191, "epoch": 75.00234555782885, "img/sec/core": 189.44404447331618, "core_hours_Tesla V100-SXM2-32GB": 139.35151530153297, "core_hours": 139.35151530153297}
{"step": 92950, "global_schedule": 0.08002415299415588, "l2_grads": 2.5808277130126953, "l2_params": 249.5445098876953, "l2_updates": 0.08678293973207474, "training_loss": 1.6932594776153564, "uptime": 33793.411562238995, "examples_seen": 95180800.0, "progress": 0.833804282497735, "epoch": 75.0427128051689, "img/sec/core": 189.7137394488644, "core_hours_Tesla V100-SXM2-32GB": 139.42648205019094, "core_hours": 139.42648205019094}
{"step": 93000, "global_schedule": 0.0796046257019043, "l2_grads": 2.548347234725952, "l2_params": 249.5026092529297, "l2_updates": 0.08616412431001663, "training_loss": 1.4769221544265747, "uptime": 33810.29794323997, "examples_seen": 95232000.0, "progress": 0.8342528055114508, "epoch": 75.08308005250896, "img/sec/core": 189.50182397368044, "core_hours_Tesla V100-SXM2-32GB": 139.5015326324175, "core_hours": 139.5015326324175}
{"step": 93050, "global_schedule": 0.07918617129325867, "l2_grads": 2.501685380935669, "l2_params": 249.4626007080078, "l2_updates": 0.08554992824792862, "training_loss": 1.9298985004425049, "uptime": 33827.711463390966, "examples_seen": 95283200.0, "progress": 0.8347013285251667, "epoch": 75.12344729984902, "img/sec/core": 189.4855830373446, "core_hours_Tesla V100-SXM2-32GB": 139.5765896472798, "core_hours": 139.5765896472798}
{"step": 93100, "global_schedule": 0.07876864075660706, "l2_grads": 2.443498134613037, "l2_params": 249.42103576660156, "l2_updates": 0.08671297132968903, "training_loss": 1.5313020944595337, "uptime": 33844.584680136, "examples_seen": 95334400.0, "progress": 0.8351498515388824, "epoch": 75.16381454718908, "img/sec/core": 189.6496707387692, "core_hours_Tesla V100-SXM2-32GB": 139.65158172170217, "core_hours": 139.65158172170217}
{"step": 93150, "global_schedule": 0.07835221290588379, "l2_grads": 2.3882150650024414, "l2_params": 249.38124084472656, "l2_updates": 0.08569886535406113, "training_loss": 2.157846450805664, "uptime": 33861.46384905698, "examples_seen": 95385600.0, "progress": 0.8355983745525983, "epoch": 75.20418179452913, "img/sec/core": 189.5827937371596, "core_hours_Tesla V100-SXM2-32GB": 139.72660025023984, "core_hours": 139.72660025023984}
{"step": 93200, "global_schedule": 0.07793670892715454, "l2_grads": 2.554460287094116, "l2_params": 249.34085083007812, "l2_updates": 0.08426747471094131, "training_loss": 1.7019118070602417, "uptime": 33878.35375988798, "examples_seen": 95436800.0, "progress": 0.8360468975663141, "epoch": 75.24454904186919, "img/sec/core": 189.46221990270803, "core_hours_Tesla V100-SXM2-32GB": 139.80166652059987, "core_hours": 139.80166652059987}
{"step": 93250, "global_schedule": 0.07752227783203125, "l2_grads": 2.3596749305725098, "l2_params": 249.30313110351562, "l2_updates": 0.08464705944061279, "training_loss": 2.3082237243652344, "uptime": 33895.23806068697, "examples_seen": 95488000.0, "progress": 0.83649542058003, "epoch": 75.28491628920925, "img/sec/core": 189.52517122834738, "core_hours_Tesla V100-SXM2-32GB": 139.87670785748426, "core_hours": 139.87670785748426}
{"step": 93300, "global_schedule": 0.07710888981819153, "l2_grads": 2.5277154445648193, "l2_params": 249.2616729736328, "l2_updates": 0.08417186141014099, "training_loss": 1.7991198301315308, "uptime": 33912.12821537, "examples_seen": 95539200.0, "progress": 0.8369439435937458, "epoch": 75.3252835365493, "img/sec/core": 189.45948453716125, "core_hours_Tesla V100-SXM2-32GB": 139.95177521163106, "core_hours": 139.95177521163106}
{"step": 93350, "global_schedule": 0.07669642567634583, "l2_grads": 2.50946307182312, "l2_params": 249.21963500976562, "l2_updates": 0.08372538536787033, "training_loss": 1.657062292098999, "uptime": 33929.01314191497, "examples_seen": 95590400.0, "progress": 0.8373924666074616, "epoch": 75.36565078388936, "img/sec/core": 189.51814753103844, "core_hours_Tesla V100-SXM2-32GB": 140.0268193296087, "core_hours": 140.0268193296087}
{"step": 93400, "global_schedule": 0.07628503441810608, "l2_grads": 2.612048864364624, "l2_params": 249.18075561523438, "l2_updates": 0.08337780088186264, "training_loss": 1.6465466022491455, "uptime": 33945.889352631, "examples_seen": 95641600.0, "progress": 0.8378409896211775, "epoch": 75.40601803122942, "img/sec/core": 189.61602541266055, "core_hours_Tesla V100-SXM2-32GB": 140.10182471056885, "core_hours": 140.10182471056885}
{"step": 93450, "global_schedule": 0.07587462663650513, "l2_grads": 2.308494806289673, "l2_params": 249.1406707763672, "l2_updates": 0.0833783820271492, "training_loss": 2.3561887741088867, "uptime": 33962.77228304697, "examples_seen": 95692800.0, "progress": 0.8382895126348933, "epoch": 75.44638527856948, "img/sec/core": 189.54055493662213, "core_hours_Tesla V100-SXM2-32GB": 140.17685995686205, "core_hours": 140.17685995686205}
{"step": 93500, "global_schedule": 0.07546526193618774, "l2_grads": 2.4456074237823486, "l2_params": 249.10092163085938, "l2_updates": 0.08160378783941269, "training_loss": 1.7678736448287964, "uptime": 33979.651292910974, "examples_seen": 95744000.0, "progress": 0.8387380356486092, "epoch": 75.48675252590954, "img/sec/core": 189.58458024393158, "core_hours_Tesla V100-SXM2-32GB": 140.25187777847984, "core_hours": 140.25187777847984}
{"step": 93550, "global_schedule": 0.07505688071250916, "l2_grads": 2.5283281803131104, "l2_params": 249.06199645996094, "l2_updates": 0.08169563859701157, "training_loss": 1.6431372165679932, "uptime": 33996.531062845956, "examples_seen": 95795200.0, "progress": 0.8391865586623249, "epoch": 75.52711977324961, "img/sec/core": 189.57604353175026, "core_hours_Tesla V100-SXM2-32GB": 140.32689897819085, "core_hours": 140.32689897819085}
{"step": 93600, "global_schedule": 0.07464957237243652, "l2_grads": 2.4986860752105713, "l2_params": 249.02212524414062, "l2_updates": 0.08201925456523895, "training_loss": 1.6394505500793457, "uptime": 34013.41556573997, "examples_seen": 95846400.0, "progress": 0.8396350816760408, "epoch": 75.56748702058967, "img/sec/core": 189.5229027521334, "core_hours_Tesla V100-SXM2-32GB": 140.40194121327534, "core_hours": 140.40194121327534}
{"step": 93650, "global_schedule": 0.07424318790435791, "l2_grads": 2.5701332092285156, "l2_params": 248.984130859375, "l2_updates": 0.08136641979217529, "training_loss": 1.834309458732605, "uptime": 34030.305683971965, "examples_seen": 95897600.0, "progress": 0.8400836046897566, "epoch": 75.60785426792972, "img/sec/core": 189.4598934149479, "core_hours_Tesla V100-SXM2-32GB": 140.47700840541756, "core_hours": 140.47700840541756}
{"step": 93700, "global_schedule": 0.07383793592453003, "l2_grads": 2.5351459980010986, "l2_params": 248.94549560546875, "l2_updates": 0.08093517273664474, "training_loss": 1.6761173009872437, "uptime": 34047.17087484896, "examples_seen": 95948800.0, "progress": 0.8405321277034725, "epoch": 75.64822151526978, "img/sec/core": 189.7399219100789, "core_hours_Tesla V100-SXM2-32GB": 140.55196480931534, "core_hours": 140.55196480931534}
{"step": 93750, "global_schedule": 0.07343360781669617, "l2_grads": 2.508556842803955, "l2_params": 248.90687561035156, "l2_updates": 0.0799991711974144, "training_loss": 2.438260316848755, "uptime": 34064.050677057996, "examples_seen": 96000000.0, "progress": 0.8409806507171883, "epoch": 75.68858876260984, "img/sec/core": 189.57568106380742, "core_hours_Tesla V100-SXM2-32GB": 140.6269861524666, "core_hours": 140.6269861524666}
{"step": 93800, "global_schedule": 0.07303038239479065, "l2_grads": 2.397991180419922, "l2_params": 248.86932373046875, "l2_updates": 0.07898718118667603, "training_loss": 3.0434396266937256, "uptime": 34080.96404222096, "examples_seen": 96051200.0, "progress": 0.8414291737309041, "epoch": 75.7289560099499, "img/sec/core": 189.19948627412003, "core_hours_Tesla V100-SXM2-32GB": 140.702156664302, "core_hours": 140.702156664302}
{"step": 93850, "global_schedule": 0.07262811064720154, "l2_grads": 2.4566702842712402, "l2_params": 248.83030700683594, "l2_updates": 0.07953717559576035, "training_loss": 1.5874686241149902, "uptime": 34097.85243713, "examples_seen": 96102400.0, "progress": 0.84187769674462, "epoch": 75.76932325728995, "img/sec/core": 189.47922625184088, "core_hours_Tesla V100-SXM2-32GB": 140.77721619723107, "core_hours": 140.77721619723107}
{"step": 93900, "global_schedule": 0.07222694158554077, "l2_grads": 2.5312371253967285, "l2_params": 248.79539489746094, "l2_updates": 0.07836984097957611, "training_loss": 1.9126287698745728, "uptime": 34114.73228079395, "examples_seen": 96153600.0, "progress": 0.8423262197583358, "epoch": 75.80969050463001, "img/sec/core": 189.57521548819452, "core_hours_Tesla V100-SXM2-32GB": 140.85223772462638, "core_hours": 140.85223772462638}
{"step": 93950, "global_schedule": 0.07182669639587402, "l2_grads": 2.3764262199401855, "l2_params": 248.75772094726562, "l2_updates": 0.07911555469036102, "training_loss": 3.06533145904541, "uptime": 34131.61538186099, "examples_seen": 96204800.0, "progress": 0.8427747427720517, "epoch": 75.85005775197007, "img/sec/core": 189.53863909795407, "core_hours_Tesla V100-SXM2-32GB": 140.92727372936878, "core_hours": 140.92727372936878}
{"step": 94000, "global_schedule": 0.07142758369445801, "l2_grads": 2.4376614093780518, "l2_params": 248.7209014892578, "l2_updates": 0.07791133224964142, "training_loss": 3.6110262870788574, "uptime": 34148.505980521964, "examples_seen": 96256000.0, "progress": 0.8432232657857675, "epoch": 75.89042499931013, "img/sec/core": 189.4545044986131, "core_hours_Tesla V100-SXM2-32GB": 141.0023430567509, "core_hours": 141.0023430567509}
{"step": 94050, "global_schedule": 0.07102939486503601, "l2_grads": 2.4566292762756348, "l2_params": 248.68199157714844, "l2_updates": 0.07724785059690475, "training_loss": 2.412541389465332, "uptime": 34165.923095546954, "examples_seen": 96307200.0, "progress": 0.8436717887994833, "epoch": 75.93079224665019, "img/sec/core": 189.61398742542318, "core_hours_Tesla V100-SXM2-32GB": 141.07734924387523, "core_hours": 141.07734924387523}
{"step": 94100, "global_schedule": 0.07063233852386475, "l2_grads": 2.6079039573669434, "l2_params": 248.6459197998047, "l2_updates": 0.07652044296264648, "training_loss": 2.136652708053589, "uptime": 34182.792741336976, "examples_seen": 96358400.0, "progress": 0.8441203118131991, "epoch": 75.97115949399024, "img/sec/core": 189.6898156505848, "core_hours_Tesla V100-SXM2-32GB": 141.15232544738643, "core_hours": 141.15232544738643}
{"step": 94150, "global_schedule": 0.0702362060546875, "l2_grads": 2.4624454975128174, "l2_params": 248.60955810546875, "l2_updates": 0.07682716101408005, "training_loss": 1.5866949558258057, "uptime": 34199.668080239964, "examples_seen": 96409600.0, "progress": 0.8445688348269149, "epoch": 76.0115267413303, "img/sec/core": 189.62582134770622, "core_hours_Tesla V100-SXM2-32GB": 141.22732695362194, "core_hours": 141.22732695362194}
{"step": 94200, "global_schedule": 0.06984120607376099, "l2_grads": 2.6087148189544678, "l2_params": 248.57260131835938, "l2_updates": 0.07634300738573074, "training_loss": 1.6657614707946777, "uptime": 34216.552811943984, "examples_seen": 96460800.0, "progress": 0.8450173578406308, "epoch": 76.05189398867036, "img/sec/core": 189.52033447106177, "core_hours_Tesla V100-SXM2-32GB": 141.30237020563982, "core_hours": 141.30237020563982}
{"step": 94250, "global_schedule": 0.06944712996482849, "l2_grads": 2.562969207763672, "l2_params": 248.5348358154297, "l2_updates": 0.0765433982014656, "training_loss": 1.9445624351501465, "uptime": 34233.433549929, "examples_seen": 96512000.0, "progress": 0.8454658808543466, "epoch": 76.09226123601043, "img/sec/core": 189.56517202268904, "core_hours_Tesla V100-SXM2-32GB": 141.37739570779544, "core_hours": 141.37739570779544}
{"step": 94300, "global_schedule": 0.06905418634414673, "l2_grads": 2.524773359298706, "l2_params": 248.499267578125, "l2_updates": 0.07486969977617264, "training_loss": 2.139880418777466, "uptime": 34250.30813007796, "examples_seen": 96563200.0, "progress": 0.8459144038680625, "epoch": 76.13262848335049, "img/sec/core": 189.63434774392525, "core_hours_Tesla V100-SXM2-32GB": 141.45239384179084, "core_hours": 141.45239384179084}
{"step": 94351, "global_schedule": 0.06866219639778137, "l2_grads": 2.4879796504974365, "l2_params": 248.46400451660156, "l2_updates": 0.07556655257940292, "training_loss": 1.6396862268447876, "uptime": 34267.19873337197, "examples_seen": 96614400.0, "progress": 0.8463629268817783, "epoch": 76.17299573069054, "img/sec/core": 189.454452531845, "core_hours_Tesla V100-SXM2-32GB": 141.5274631897642, "core_hours": 141.5274631897642}
{"step": 94400, "global_schedule": 0.06827130913734436, "l2_grads": 2.352818489074707, "l2_params": 248.4265594482422, "l2_updates": 0.07436776161193848, "training_loss": 2.5703694820404053, "uptime": 34284.075120377005, "examples_seen": 96665600.0, "progress": 0.8468114498954942, "epoch": 76.2133629780306, "img/sec/core": 189.6140447031668, "core_hours_Tesla V100-SXM2-32GB": 141.602469354231, "core_hours": 141.602469354231}
{"step": 94450, "global_schedule": 0.06788137555122375, "l2_grads": 2.4565329551696777, "l2_params": 248.390869140625, "l2_updates": 0.07322542369365692, "training_loss": 2.679957151412964, "uptime": 34300.97673478798, "examples_seen": 96716800.0, "progress": 0.84725997290921, "epoch": 76.25373022537066, "img/sec/core": 189.3310261487002, "core_hours_Tesla V100-SXM2-32GB": 141.67758764050203, "core_hours": 141.67758764050203}
{"step": 94500, "global_schedule": 0.06749257445335388, "l2_grads": 2.32007098197937, "l2_params": 248.35336303710938, "l2_updates": 0.0735536515712738, "training_loss": 3.0346338748931885, "uptime": 34317.86618733499, "examples_seen": 96768000.0, "progress": 0.8477084959229259, "epoch": 76.29409747271072, "img/sec/core": 189.46736083323134, "core_hours_Tesla V100-SXM2-32GB": 141.7526518740443, "core_hours": 141.7526518740443}
{"step": 94550, "global_schedule": 0.06710472702980042, "l2_grads": 2.48539137840271, "l2_params": 248.31761169433594, "l2_updates": 0.0739157423377037, "training_loss": 1.5777522325515747, "uptime": 34334.748470766994, "examples_seen": 96819200.0, "progress": 0.8481570189366416, "epoch": 76.33446472005078, "img/sec/core": 189.54781874673097, "core_hours_Tesla V100-SXM2-32GB": 141.82768424485317, "core_hours": 141.82768424485317}
{"step": 94600, "global_schedule": 0.06671798229217529, "l2_grads": 2.5857362747192383, "l2_params": 248.28225708007812, "l2_updates": 0.07374446839094162, "training_loss": 1.59192955493927, "uptime": 34351.60873891995, "examples_seen": 96870400.0, "progress": 0.8486055419503574, "epoch": 76.37483196739083, "img/sec/core": 189.79532063007917, "core_hours_Tesla V100-SXM2-32GB": 141.90261876997744, "core_hours": 141.90261876997744}
{"step": 94650, "global_schedule": 0.06633219122886658, "l2_grads": 2.374429941177368, "l2_params": 248.2450714111328, "l2_updates": 0.07238633185625076, "training_loss": 2.324352741241455, "uptime": 34368.51458967, "examples_seen": 96921600.0, "progress": 0.8490540649640733, "epoch": 76.41519921473089, "img/sec/core": 189.28358278517854, "core_hours_Tesla V100-SXM2-32GB": 141.9777558844221, "core_hours": 141.9777558844221}
{"step": 94700, "global_schedule": 0.0659475326538086, "l2_grads": 2.459331512451172, "l2_params": 248.21287536621094, "l2_updates": 0.07289879769086838, "training_loss": 1.6857049465179443, "uptime": 34385.407359784, "examples_seen": 96972800.0, "progress": 0.8495025879777891, "epoch": 76.45556646207095, "img/sec/core": 189.43015138452205, "core_hours_Tesla V100-SXM2-32GB": 142.05283486270656, "core_hours": 142.05283486270656}
{"step": 94750, "global_schedule": 0.06556382775306702, "l2_grads": 2.5786290168762207, "l2_params": 248.1790313720703, "l2_updates": 0.07197173684835434, "training_loss": 1.7812728881835938, "uptime": 34402.27810058399, "examples_seen": 97024000.0, "progress": 0.849951110991505, "epoch": 76.495933709411, "img/sec/core": 189.67750366966064, "core_hours_Tesla V100-SXM2-32GB": 142.12781593292874, "core_hours": 142.12781593292874}
{"step": 94800, "global_schedule": 0.06518125534057617, "l2_grads": 2.5313503742218018, "l2_params": 248.14479064941406, "l2_updates": 0.07172167301177979, "training_loss": 1.6558456420898438, "uptime": 34419.153580198996, "examples_seen": 97075200.0, "progress": 0.8503996340052208, "epoch": 76.53630095675106, "img/sec/core": 189.62424019967884, "core_hours_Tesla V100-SXM2-32GB": 142.202818064551, "core_hours": 142.202818064551}
{"step": 94850, "global_schedule": 0.06479963660240173, "l2_grads": 2.3587896823883057, "l2_params": 248.10809326171875, "l2_updates": 0.07072389125823975, "training_loss": 2.538609266281128, "uptime": 34436.048459465965, "examples_seen": 97126400.0, "progress": 0.8508481570189367, "epoch": 76.57666820409112, "img/sec/core": 189.40650296662963, "core_hours_Tesla V100-SXM2-32GB": 142.2779064168486, "core_hours": 142.2779064168486}
{"step": 94900, "global_schedule": 0.06441912055015564, "l2_grads": 2.5365772247314453, "l2_params": 248.0714874267578, "l2_updates": 0.07077977061271667, "training_loss": 1.6404733657836914, "uptime": 34452.93643783999, "examples_seen": 97177600.0, "progress": 0.8512966800326525, "epoch": 76.61703545143118, "img/sec/core": 189.4838996786921, "core_hours_Tesla V100-SXM2-32GB": 142.35296409851097, "core_hours": 142.35296409851097}
{"step": 94950, "global_schedule": 0.06403961777687073, "l2_grads": 2.53851056098938, "l2_params": 248.03790283203125, "l2_updates": 0.06985322386026382, "training_loss": 1.5109071731567383, "uptime": 34469.81094562495, "examples_seen": 97228800.0, "progress": 0.8517452030463684, "epoch": 76.65740269877125, "img/sec/core": 189.63516096464392, "core_hours_Tesla V100-SXM2-32GB": 142.42796191088854, "core_hours": 142.42796191088854}
{"step": 95001, "global_schedule": 0.06366118788719177, "l2_grads": 2.545963764190674, "l2_params": 248.00381469726562, "l2_updates": 0.06862053275108337, "training_loss": 1.9718053340911865, "uptime": 34486.68338688696, "examples_seen": 97280000.0, "progress": 0.8521937260600841, "epoch": 76.69776994611131, "img/sec/core": 189.65838732571183, "core_hours_Tesla V100-SXM2-32GB": 142.5029505387197, "core_hours": 142.5029505387197, "minival/prec@1": 0.7851233218857321, "minival/loss": 0.8611165694880776, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.9233976859832183, "real/prec@1": 0.8213805324850012, "real/loss": 1.6596981624978984, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.168611030036118, "train/prec@1": 0.8344846427038208, "train/loss": 0.6351899825842269, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.596505285007879, "v2/prec@1": 0.6267, "v2/loss": 1.6135721435546875, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3555699579883367, "val/prec@1": 0.75326, "val/loss": 0.9923138635253906, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.4564563119784}
{"step": 95050, "global_schedule": 0.063283771276474, "l2_grads": 2.598118543624878, "l2_params": 247.96746826171875, "l2_updates": 0.06864441931247711, "training_loss": 1.6769964694976807, "uptime": 34540.68527940399, "examples_seen": 97331200.0, "progress": 0.8526422490737999, "epoch": 76.73813719345137, "img/sec/core": 188.95925288044072, "core_hours_Tesla V100-SXM2-32GB": 142.57821661860422, "core_hours": 142.57821661860422}
{"step": 95100, "global_schedule": 0.06290742754936218, "l2_grads": 2.6721038818359375, "l2_params": 247.93490600585938, "l2_updates": 0.06836359202861786, "training_loss": 1.6427212953567505, "uptime": 34557.58358749299, "examples_seen": 97382400.0, "progress": 0.8530907720875158, "epoch": 76.77850444079142, "img/sec/core": 189.36807064622565, "core_hours_Tesla V100-SXM2-32GB": 142.6533202101109, "core_hours": 142.6533202101109}
{"step": 95150, "global_schedule": 0.06253209710121155, "l2_grads": 2.558211088180542, "l2_params": 247.90191650390625, "l2_updates": 0.06738925725221634, "training_loss": 1.613566279411316, "uptime": 34574.46046172996, "examples_seen": 97433600.0, "progress": 0.8535392951012316, "epoch": 76.81887168813148, "img/sec/core": 189.60857058410605, "core_hours_Tesla V100-SXM2-32GB": 142.728328540053, "core_hours": 142.728328540053}
{"step": 95200, "global_schedule": 0.06215786933898926, "l2_grads": 2.5190536975860596, "l2_params": 247.86788940429688, "l2_updates": 0.06796138733625412, "training_loss": 3.7201485633850098, "uptime": 34591.34049320995, "examples_seen": 97484800.0, "progress": 0.8539878181149475, "epoch": 76.85923893547154, "img/sec/core": 189.57310617540554, "core_hours_Tesla V100-SXM2-32GB": 142.80335090218628, "core_hours": 142.80335090218628}
{"step": 95250, "global_schedule": 0.06178462505340576, "l2_grads": 2.481604814529419, "l2_params": 247.83499145507812, "l2_updates": 0.06815409660339355, "training_loss": 1.8620036840438843, "uptime": 34608.23721318797, "examples_seen": 97536000.0, "progress": 0.8544363411286633, "epoch": 76.8996061828116, "img/sec/core": 189.38586921978913, "core_hours_Tesla V100-SXM2-32GB": 142.87844743542192, "core_hours": 142.87844743542192}
{"step": 95300, "global_schedule": 0.06141248345375061, "l2_grads": 2.403693437576294, "l2_params": 247.8036346435547, "l2_updates": 0.06625854223966599, "training_loss": 2.323883533477783, "uptime": 34625.128867711, "examples_seen": 97587200.0, "progress": 0.8548848641423792, "epoch": 76.93997343015165, "img/sec/core": 189.4426620930996, "core_hours_Tesla V100-SXM2-32GB": 142.95352145552428, "core_hours": 142.95352145552428}
{"step": 95350, "global_schedule": 0.06104135513305664, "l2_grads": 2.5199384689331055, "l2_params": 247.76995849609375, "l2_updates": 0.06664488464593887, "training_loss": 1.8291919231414795, "uptime": 34642.008056108956, "examples_seen": 97638400.0, "progress": 0.855333387156095, "epoch": 76.98034067749171, "img/sec/core": 189.58257497660412, "core_hours_Tesla V100-SXM2-32GB": 143.0285400706263, "core_hours": 143.0285400706263}
{"step": 95400, "global_schedule": 0.060671329498291016, "l2_grads": 2.7850003242492676, "l2_params": 247.73526000976562, "l2_updates": 0.0656273365020752, "training_loss": 3.9098613262176514, "uptime": 34658.88644605997, "examples_seen": 97689600.0, "progress": 0.8557819101698109, "epoch": 77.02070792483177, "img/sec/core": 189.5915433454789, "core_hours_Tesla V100-SXM2-32GB": 143.10355513707526, "core_hours": 143.10355513707526}
{"step": 95450, "global_schedule": 0.060302287340164185, "l2_grads": 2.3985142707824707, "l2_params": 247.70217895507812, "l2_updates": 0.06610371917486191, "training_loss": 2.2028706073760986, "uptime": 34675.77264075499, "examples_seen": 97740800.0, "progress": 0.8562304331835267, "epoch": 77.06107517217183, "img/sec/core": 189.50391475373144, "core_hours_Tesla V100-SXM2-32GB": 143.17860489127537, "core_hours": 143.17860489127537}
{"step": 95500, "global_schedule": 0.0599343478679657, "l2_grads": 2.6991066932678223, "l2_params": 247.66888427734375, "l2_updates": 0.06399250030517578, "training_loss": 3.52504563331604, "uptime": 34692.66260846995, "examples_seen": 97792000.0, "progress": 0.8566789561972424, "epoch": 77.10144241951188, "img/sec/core": 189.4615818102253, "core_hours_Tesla V100-SXM2-32GB": 143.25367141445298, "core_hours": 143.25367141445298}
{"step": 95550, "global_schedule": 0.059567421674728394, "l2_grads": 2.578059673309326, "l2_params": 247.6355743408203, "l2_updates": 0.065098837018013, "training_loss": 1.6687456369400024, "uptime": 34709.54908513598, "examples_seen": 97843200.0, "progress": 0.8571274792109583, "epoch": 77.14180966685194, "img/sec/core": 189.50075041041833, "core_hours_Tesla V100-SXM2-32GB": 143.32872242185752, "core_hours": 143.32872242185752}
{"step": 95600, "global_schedule": 0.05920162796974182, "l2_grads": 2.6136670112609863, "l2_params": 247.6036376953125, "l2_updates": 0.06541930884122849, "training_loss": 1.6355689764022827, "uptime": 34726.40015744895, "examples_seen": 97894400.0, "progress": 0.8575760022246741, "epoch": 77.182176914192, "img/sec/core": 189.89889429982722, "core_hours_Tesla V100-SXM2-32GB": 143.40361607658184, "core_hours": 143.40361607658184}
{"step": 95650, "global_schedule": 0.05883681774139404, "l2_grads": 2.6803982257843018, "l2_params": 247.5707550048828, "l2_updates": 0.06392519921064377, "training_loss": 1.7988731861114502, "uptime": 34743.295470564975, "examples_seen": 97945600.0, "progress": 0.85802452523839, "epoch": 77.22254416153206, "img/sec/core": 189.40163926084077, "core_hours_Tesla V100-SXM2-32GB": 143.4787063570975, "core_hours": 143.4787063570975}
{"step": 95700, "global_schedule": 0.05847311019897461, "l2_grads": 2.5190727710723877, "l2_params": 247.53848266601562, "l2_updates": 0.06495937705039978, "training_loss": 1.6523789167404175, "uptime": 34760.170673519955, "examples_seen": 97996800.0, "progress": 0.8584730482521058, "epoch": 77.26291140887213, "img/sec/core": 189.62734898875567, "core_hours_Tesla V100-SXM2-32GB": 143.55370725911965, "core_hours": 143.55370725911965}
{"step": 95750, "global_schedule": 0.05811041593551636, "l2_grads": 2.5453085899353027, "l2_params": 247.50648498535156, "l2_updates": 0.063457190990448, "training_loss": 1.6525969505310059, "uptime": 34777.06487037998, "examples_seen": 98048000.0, "progress": 0.8589215712658217, "epoch": 77.30327865621219, "img/sec/core": 189.41415365956425, "core_hours_Tesla V100-SXM2-32GB": 143.62879257849755, "core_hours": 143.62879257849755}
{"step": 95800, "global_schedule": 0.05774882435798645, "l2_grads": 2.4420390129089355, "l2_params": 247.4728546142578, "l2_updates": 0.06312623620033264, "training_loss": 2.4500396251678467, "uptime": 34793.946119987, "examples_seen": 98099200.0, "progress": 0.8593700942795375, "epoch": 77.34364590355224, "img/sec/core": 189.55942684894012, "core_hours_Tesla V100-SXM2-32GB": 143.70382035452874, "core_hours": 143.70382035452874}
{"step": 95850, "global_schedule": 0.057388246059417725, "l2_grads": 2.5643396377563477, "l2_params": 247.44163513183594, "l2_updates": 0.06172943115234375, "training_loss": 1.7896051406860352, "uptime": 34810.848138612, "examples_seen": 98150400.0, "progress": 0.8598186172932533, "epoch": 77.3840131508923, "img/sec/core": 189.3264982720576, "core_hours_Tesla V100-SXM2-32GB": 143.7789404373065, "core_hours": 143.7789404373065}
{"step": 95900, "global_schedule": 0.057028770446777344, "l2_grads": 2.5181221961975098, "l2_params": 247.40948486328125, "l2_updates": 0.06170324236154556, "training_loss": 1.7504695653915405, "uptime": 34827.72574025899, "examples_seen": 98201600.0, "progress": 0.8602671403069692, "epoch": 77.42438039823236, "img/sec/core": 189.60039861884985, "core_hours_Tesla V100-SXM2-32GB": 143.853952000182, "core_hours": 143.853952000182}
{"step": 95950, "global_schedule": 0.056670308113098145, "l2_grads": 2.5673460960388184, "l2_params": 247.3785400390625, "l2_updates": 0.06279412657022476, "training_loss": 1.5714809894561768, "uptime": 34844.635598250956, "examples_seen": 98252800.0, "progress": 0.8607156633206849, "epoch": 77.46474764557242, "img/sec/core": 189.23872699109978, "core_hours_Tesla V100-SXM2-32GB": 143.92910692459074, "core_hours": 143.92910692459074}
{"step": 96000, "global_schedule": 0.0563129186630249, "l2_grads": 2.744852304458618, "l2_params": 247.34695434570312, "l2_updates": 0.06112518534064293, "training_loss": 3.841834545135498, "uptime": 34861.53095524397, "examples_seen": 98304000.0, "progress": 0.8611641863344008, "epoch": 77.50511489291247, "img/sec/core": 189.40114738757617, "core_hours_Tesla V100-SXM2-32GB": 144.00419740011526, "core_hours": 144.00419740011526}
{"step": 96050, "global_schedule": 0.055956631898880005, "l2_grads": 2.722590446472168, "l2_params": 247.31886291503906, "l2_updates": 0.060990843921899796, "training_loss": 1.6676716804504395, "uptime": 34879.235711218964, "examples_seen": 98355200.0, "progress": 0.8616127093481166, "epoch": 77.54548214025253, "img/sec/core": 189.4974523322453, "core_hours_Tesla V100-SXM2-32GB": 144.07924971373313, "core_hours": 144.07924971373313}
{"step": 96100, "global_schedule": 0.05560138821601868, "l2_grads": 2.6039047241210938, "l2_params": 247.28875732421875, "l2_updates": 0.06067715585231781, "training_loss": 1.8412384986877441, "uptime": 34896.12337156298, "examples_seen": 98406400.0, "progress": 0.8620612323618325, "epoch": 77.58584938759259, "img/sec/core": 189.4874680573562, "core_hours_Tesla V100-SXM2-32GB": 144.15430598192873, "core_hours": 144.15430598192873}
{"step": 96150, "global_schedule": 0.055247217416763306, "l2_grads": 2.4251205921173096, "l2_params": 247.25697326660156, "l2_updates": 0.061068277806043625, "training_loss": 1.5211025476455688, "uptime": 34913.03098579997, "examples_seen": 98457600.0, "progress": 0.8625097553755483, "epoch": 77.62621663493265, "img/sec/core": 189.26384025248203, "core_hours_Tesla V100-SXM2-32GB": 144.22945093409314, "core_hours": 144.22945093409314}
{"step": 96200, "global_schedule": 0.054894089698791504, "l2_grads": 2.732374429702759, "l2_params": 247.22605895996094, "l2_updates": 0.05962304025888443, "training_loss": 1.6995445489883423, "uptime": 34929.891726067, "examples_seen": 98508800.0, "progress": 0.8629582783892642, "epoch": 77.6665838822727, "img/sec/core": 189.79000621088497, "core_hours_Tesla V100-SXM2-32GB": 144.30438755750217, "core_hours": 144.30438755750217}
{"step": 96250, "global_schedule": 0.05454206466674805, "l2_grads": 2.5194592475891113, "l2_params": 247.19729614257812, "l2_updates": 0.059292253106832504, "training_loss": 2.043083429336548, "uptime": 34946.79090973496, "examples_seen": 98560000.0, "progress": 0.86340680140298, "epoch": 77.70695112961276, "img/sec/core": 189.35825912504876, "core_hours_Tesla V100-SXM2-32GB": 144.37949504047089, "core_hours": 144.37949504047089}
{"step": 96300, "global_schedule": 0.05419105291366577, "l2_grads": 2.5254733562469482, "l2_params": 247.1665802001953, "l2_updates": 0.059730950742959976, "training_loss": 1.5910700559616089, "uptime": 34963.65909559198, "examples_seen": 98611200.0, "progress": 0.8638553244166958, "epoch": 77.74731837695282, "img/sec/core": 189.70623320872946, "core_hours_Tesla V100-SXM2-32GB": 144.454464755391, "core_hours": 144.454464755391}
{"step": 96350, "global_schedule": 0.05384117364883423, "l2_grads": 2.5084824562072754, "l2_params": 247.1370086669922, "l2_updates": 0.058925267308950424, "training_loss": 3.670689344406128, "uptime": 34980.554350255, "examples_seen": 98662400.0, "progress": 0.8643038474304117, "epoch": 77.78768562429288, "img/sec/core": 189.40229453922606, "core_hours_Tesla V100-SXM2-32GB": 144.5295547761155, "core_hours": 144.5295547761155}
{"step": 96400, "global_schedule": 0.05349230766296387, "l2_grads": 2.4840781688690186, "l2_params": 247.10763549804688, "l2_updates": 0.05844353884458542, "training_loss": 1.5366517305374146, "uptime": 34997.435424441996, "examples_seen": 98713600.0, "progress": 0.8647523704441274, "epoch": 77.82805287163295, "img/sec/core": 189.56139665951773, "core_hours_Tesla V100-SXM2-32GB": 144.60458177250214, "core_hours": 144.60458177250214}
{"step": 96450, "global_schedule": 0.05314457416534424, "l2_grads": 2.5425243377685547, "l2_params": 247.07830810546875, "l2_updates": 0.058219581842422485, "training_loss": 2.2145848274230957, "uptime": 35014.33539913298, "examples_seen": 98764800.0, "progress": 0.8652008934578433, "epoch": 77.868420118973, "img/sec/core": 189.3493959909508, "core_hours_Tesla V100-SXM2-32GB": 144.67969277112874, "core_hours": 144.67969277112874}
{"step": 96500, "global_schedule": 0.05279785394668579, "l2_grads": 2.645538330078125, "l2_params": 247.0493621826172, "l2_updates": 0.05711446702480316, "training_loss": 1.831528663635254, "uptime": 35031.224203018995, "examples_seen": 98816000.0, "progress": 0.8656494164715591, "epoch": 77.90878736631306, "img/sec/core": 189.47463784865522, "core_hours_Tesla V100-SXM2-32GB": 144.75475412173324, "core_hours": 144.75475412173324}
{"step": 96550, "global_schedule": 0.05245223641395569, "l2_grads": 2.49865984916687, "l2_params": 247.01803588867188, "l2_updates": 0.058045949786901474, "training_loss": 1.626786231994629, "uptime": 35048.14169424196, "examples_seen": 98867200.0, "progress": 0.866097939485275, "epoch": 77.94915461365312, "img/sec/core": 189.1533418179741, "core_hours_Tesla V100-SXM2-32GB": 144.8299429716131, "core_hours": 144.8299429716131}
{"step": 96600, "global_schedule": 0.052107661962509155, "l2_grads": 2.7253410816192627, "l2_params": 246.9882354736328, "l2_updates": 0.05679488927125931, "training_loss": 1.759374737739563, "uptime": 35065.01602575695, "examples_seen": 98918400.0, "progress": 0.8665464624989908, "epoch": 77.98952186099318, "img/sec/core": 189.6371419014189, "core_hours_Tesla V100-SXM2-32GB": 144.90494000056864, "core_hours": 144.90494000056864}
{"step": 96650, "global_schedule": 0.051764219999313354, "l2_grads": 2.63458514213562, "l2_params": 246.95932006835938, "l2_updates": 0.05711064487695694, "training_loss": 1.736224889755249, "uptime": 35081.914719077, "examples_seen": 98969600.0, "progress": 0.8669949855127067, "epoch": 78.02988910833324, "img/sec/core": 189.36375371716977, "core_hours_Tesla V100-SXM2-32GB": 144.9800453042133, "core_hours": 144.9800453042133}
{"step": 96700, "global_schedule": 0.05142176151275635, "l2_grads": 2.4981002807617188, "l2_params": 246.93035888671875, "l2_updates": 0.05606485903263092, "training_loss": 2.941694736480713, "uptime": 35098.80763616797, "examples_seen": 99020800.0, "progress": 0.8674435085264225, "epoch": 78.0702563556733, "img/sec/core": 189.42850324594244, "core_hours_Tesla V100-SXM2-32GB": 145.05512493572868, "core_hours": 145.05512493572868}
{"step": 96750, "global_schedule": 0.05108046531677246, "l2_grads": 2.7441461086273193, "l2_params": 246.90211486816406, "l2_updates": 0.05571875348687172, "training_loss": 3.8914082050323486, "uptime": 35115.71935729997, "examples_seen": 99072000.0, "progress": 0.8678920315401383, "epoch": 78.11062360301335, "img/sec/core": 189.2178788323065, "core_hours_Tesla V100-SXM2-32GB": 145.1302881407598, "core_hours": 145.1302881407598}
{"step": 96800, "global_schedule": 0.050740182399749756, "l2_grads": 2.531682014465332, "l2_params": 246.87429809570312, "l2_updates": 0.05511348322033882, "training_loss": 1.9143325090408325, "uptime": 35132.61378765199, "examples_seen": 99123200.0, "progress": 0.8683405545538542, "epoch": 78.15099085035341, "img/sec/core": 189.41153583295073, "core_hours_Tesla V100-SXM2-32GB": 145.20537449787992, "core_hours": 145.20537449787992}
{"step": 96850, "global_schedule": 0.05040103197097778, "l2_grads": 2.5658555030822754, "l2_params": 246.8473663330078, "l2_updates": 0.055412452667951584, "training_loss": 1.5401880741119385, "uptime": 35149.51926929696, "examples_seen": 99174400.0, "progress": 0.86878907756757, "epoch": 78.19135809769347, "img/sec/core": 189.2877154998535, "core_hours_Tesla V100-SXM2-32GB": 145.28050997185753, "core_hours": 145.28050997185753}
{"step": 96900, "global_schedule": 0.05006289482116699, "l2_grads": 2.5295395851135254, "l2_params": 246.81881713867188, "l2_updates": 0.054830458015203476, "training_loss": 3.2994537353515625, "uptime": 35166.400958715996, "examples_seen": 99225600.0, "progress": 0.8692376005812859, "epoch": 78.23172534503352, "img/sec/core": 189.55448833166835, "core_hours_Tesla V100-SXM2-32GB": 145.35553970260884, "core_hours": 145.35553970260884}
{"step": 96950, "global_schedule": 0.049725890159606934, "l2_grads": 2.447939157485962, "l2_params": 246.7918243408203, "l2_updates": 0.05431872233748436, "training_loss": 2.559889316558838, "uptime": 35183.29975986399, "examples_seen": 99276800.0, "progress": 0.8696861235950016, "epoch": 78.27209259237358, "img/sec/core": 189.36254542408685, "core_hours_Tesla V100-SXM2-32GB": 145.43064548548878, "core_hours": 145.43064548548878}
{"step": 97000, "global_schedule": 0.049389928579330444, "l2_grads": 2.649582862854004, "l2_params": 246.76248168945312, "l2_updates": 0.05373377725481987, "training_loss": 1.69948148727417, "uptime": 35200.193211795005, "examples_seen": 99328000.0, "progress": 0.8701346466087175, "epoch": 78.31245983971364, "img/sec/core": 189.42250601402492, "core_hours_Tesla V100-SXM2-32GB": 145.50572749407107, "core_hours": 145.50572749407107}
{"step": 97050, "global_schedule": 0.0490550696849823, "l2_grads": 2.4366979598999023, "l2_params": 246.73385620117188, "l2_updates": 0.05355606600642204, "training_loss": 2.535086154937744, "uptime": 35217.59727985598, "examples_seen": 99379200.0, "progress": 0.8705831696224333, "epoch": 78.3528270870537, "img/sec/core": 189.25771912371994, "core_hours_Tesla V100-SXM2-32GB": 145.5808748766353, "core_hours": 145.5808748766353}
{"step": 97100, "global_schedule": 0.04872128367424011, "l2_grads": 2.539924383163452, "l2_params": 246.70558166503906, "l2_updates": 0.05364326387643814, "training_loss": 1.560495138168335, "uptime": 35234.525596476975, "examples_seen": 99430400.0, "progress": 0.8710316926361492, "epoch": 78.39319433439377, "img/sec/core": 189.0323811660967, "core_hours_Tesla V100-SXM2-32GB": 145.65611183939527, "core_hours": 145.65611183939527}
{"step": 97150, "global_schedule": 0.04838860034942627, "l2_grads": 2.6052372455596924, "l2_params": 246.67929077148438, "l2_updates": 0.052407730370759964, "training_loss": 1.5917242765426636, "uptime": 35251.434445906954, "examples_seen": 99481600.0, "progress": 0.871480215649865, "epoch": 78.43356158173383, "img/sec/core": 189.25001451171408, "core_hours_Tesla V100-SXM2-32GB": 145.7312622813063, "core_hours": 145.7312622813063}
{"step": 97200, "global_schedule": 0.04805693030357361, "l2_grads": 2.5373940467834473, "l2_params": 246.65199279785156, "l2_updates": 0.05270516499876976, "training_loss": 3.4719696044921875, "uptime": 35268.34369340795, "examples_seen": 99532800.0, "progress": 0.8719287386635808, "epoch": 78.47392882907388, "img/sec/core": 189.24555926048177, "core_hours_Tesla V100-SXM2-32GB": 145.80641449242185, "core_hours": 145.80641449242185}
{"step": 97250, "global_schedule": 0.04772642254829407, "l2_grads": 2.3693745136260986, "l2_params": 246.62425231933594, "l2_updates": 0.05201057717204094, "training_loss": 2.2264699935913086, "uptime": 35285.261909861, "examples_seen": 99584000.0, "progress": 0.8723772616772967, "epoch": 78.51429607641394, "img/sec/core": 189.14523341631897, "core_hours_Tesla V100-SXM2-32GB": 145.8816065655465, "core_hours": 145.8816065655465}
{"step": 97300, "global_schedule": 0.047396957874298096, "l2_grads": 2.6708295345306396, "l2_params": 246.59735107421875, "l2_updates": 0.05202052742242813, "training_loss": 3.862452507019043, "uptime": 35302.18344543397, "examples_seen": 99635200.0, "progress": 0.8728257846910125, "epoch": 78.554663323754, "img/sec/core": 189.10813301789767, "core_hours_Tesla V100-SXM2-32GB": 145.95681339031526, "core_hours": 145.95681339031526}
{"step": 97350, "global_schedule": 0.04706859588623047, "l2_grads": 2.6159884929656982, "l2_params": 246.570556640625, "l2_updates": 0.05115806683897972, "training_loss": 3.512578010559082, "uptime": 35319.09828574798, "examples_seen": 99686400.0, "progress": 0.8732743077047284, "epoch": 78.59503057109406, "img/sec/core": 189.18298609942536, "core_hours_Tesla V100-SXM2-32GB": 146.03199045837752, "core_hours": 146.03199045837752}
{"step": 97400, "global_schedule": 0.04674127697944641, "l2_grads": 2.5973010063171387, "l2_params": 246.54373168945312, "l2_updates": 0.05142022669315338, "training_loss": 1.5500943660736084, "uptime": 35336.01715215697, "examples_seen": 99737600.0, "progress": 0.8737228307184441, "epoch": 78.63539781843411, "img/sec/core": 189.13796720446177, "core_hours_Tesla V100-SXM2-32GB": 146.10718542019524, "core_hours": 146.10718542019524}
{"step": 97450, "global_schedule": 0.046415120363235474, "l2_grads": 2.6179885864257812, "l2_params": 246.5172119140625, "l2_updates": 0.050448980182409286, "training_loss": 1.5442726612091064, "uptime": 35352.92043681099, "examples_seen": 99788800.0, "progress": 0.87417135373216, "epoch": 78.67576506577417, "img/sec/core": 189.31231801972436, "core_hours_Tesla V100-SXM2-32GB": 146.1823111297687, "core_hours": 146.1823111297687}
{"step": 97500, "global_schedule": 0.04608997702598572, "l2_grads": 2.5417919158935547, "l2_params": 246.49197387695312, "l2_updates": 0.049856510013341904, "training_loss": 2.2835824489593506, "uptime": 35369.820762219955, "examples_seen": 99840000.0, "progress": 0.8746198767458758, "epoch": 78.71613231311423, "img/sec/core": 189.34546658510308, "core_hours_Tesla V100-SXM2-32GB": 146.25742368714185, "core_hours": 146.25742368714185, "minival/prec@1": 0.7855916328442085, "minival/loss": 0.8511529446690298, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.895139525004197, "real/prec@1": 0.8237077524179601, "real/loss": 1.6459114209419103, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.158784702012781, "train/prec@1": 0.8410412520001561, "train/loss": 0.6152766254929596, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.607338438974693, "v2/prec@1": 0.6309, "v2/loss": 1.5919787719726564, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3975704389740713, "val/prec@1": 0.75564, "val/loss": 0.9767684631347656, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.339999978023116}
{"step": 97550, "global_schedule": 0.045765966176986694, "l2_grads": 2.4235997200012207, "l2_params": 246.46649169921875, "l2_updates": 0.04984503239393234, "training_loss": 2.0117719173431396, "uptime": 35423.13779481099, "examples_seen": 99891200.0, "progress": 0.8750683997595917, "epoch": 78.75649956045429, "img/sec/core": 189.16774807072792, "core_hours_Tesla V100-SXM2-32GB": 146.33260681094214, "core_hours": 146.33260681094214}
{"step": 97600, "global_schedule": 0.04544299840927124, "l2_grads": 2.689502000808716, "l2_params": 246.438720703125, "l2_updates": 0.04953642934560776, "training_loss": 1.5534098148345947, "uptime": 35440.01771474298, "examples_seen": 99942400.0, "progress": 0.8755169227733075, "epoch": 78.79686680779434, "img/sec/core": 189.5743589361062, "core_hours_Tesla V100-SXM2-32GB": 146.40762867730655, "core_hours": 146.40762867730655}
{"step": 97650, "global_schedule": 0.045121192932128906, "l2_grads": 2.779982566833496, "l2_params": 246.41419982910156, "l2_updates": 0.04901951551437378, "training_loss": 1.6225827932357788, "uptime": 35456.87625653099, "examples_seen": 99993600.0, "progress": 0.8759654457870233, "epoch": 78.8372340551344, "img/sec/core": 189.81475623686393, "core_hours_Tesla V100-SXM2-32GB": 146.4825555296977, "core_hours": 146.4825555296977}
{"step": 97700, "global_schedule": 0.044800400733947754, "l2_grads": 2.628753185272217, "l2_params": 246.3881378173828, "l2_updates": 0.049065954983234406, "training_loss": 3.8447327613830566, "uptime": 35473.75421651499, "examples_seen": 100044800.0, "progress": 0.8764139688007392, "epoch": 78.87760130247446, "img/sec/core": 189.59637320105705, "core_hours_Tesla V100-SXM2-32GB": 146.55756868518216, "core_hours": 146.55756868518216}
{"step": 97750, "global_schedule": 0.044480741024017334, "l2_grads": 2.6575875282287598, "l2_params": 246.36192321777344, "l2_updates": 0.048251014202833176, "training_loss": 1.5367013216018677, "uptime": 35490.627759178984, "examples_seen": 100096000.0, "progress": 0.876862491814455, "epoch": 78.91796854981452, "img/sec/core": 189.6460075825721, "core_hours_Tesla V100-SXM2-32GB": 146.63256220813324, "core_hours": 146.63256220813324}
{"step": 97800, "global_schedule": 0.04416215419769287, "l2_grads": 2.804311990737915, "l2_params": 246.3366241455078, "l2_updates": 0.04817674681544304, "training_loss": 1.7618193626403809, "uptime": 35507.524331705994, "examples_seen": 100147200.0, "progress": 0.8773110148281709, "epoch": 78.95833579715458, "img/sec/core": 189.3875219299443, "core_hours_Tesla V100-SXM2-32GB": 146.70765808603107, "core_hours": 146.70765808603107}
{"step": 97851, "global_schedule": 0.04384469985961914, "l2_grads": 2.6513960361480713, "l2_params": 246.31204223632812, "l2_updates": 0.04845855012536049, "training_loss": 1.6619226932525635, "uptime": 35524.398723665974, "examples_seen": 100198400.0, "progress": 0.8777595378418867, "epoch": 78.99870304449465, "img/sec/core": 189.6364626108737, "core_hours_Tesla V100-SXM2-32GB": 146.78265538363095, "core_hours": 146.78265538363095}
{"step": 97900, "global_schedule": 0.04352828860282898, "l2_grads": 2.498342275619507, "l2_params": 246.28773498535156, "l2_updates": 0.04780559986829758, "training_loss": 2.148509979248047, "uptime": 35541.29168441199, "examples_seen": 100249600.0, "progress": 0.8782080608556025, "epoch": 79.0390702918347, "img/sec/core": 189.4280137219109, "core_hours_Tesla V100-SXM2-32GB": 146.85773520916882, "core_hours": 146.85773520916882}
{"step": 97950, "global_schedule": 0.04321300983428955, "l2_grads": 2.8126978874206543, "l2_params": 246.26260375976562, "l2_updates": 0.04727637767791748, "training_loss": 1.644354224205017, "uptime": 35558.15109959396, "examples_seen": 100300800.0, "progress": 0.8786565838693183, "epoch": 79.07943753917476, "img/sec/core": 189.80492297396245, "core_hours_Tesla V100-SXM2-32GB": 146.9326659433109, "core_hours": 146.9326659433109}
{"step": 98000, "global_schedule": 0.04289877414703369, "l2_grads": 2.9280409812927246, "l2_params": 246.23780822753906, "l2_updates": 0.04686151444911957, "training_loss": 3.8880105018615723, "uptime": 35575.05318254995, "examples_seen": 100352000.0, "progress": 0.8791051068830341, "epoch": 79.11980478651482, "img/sec/core": 189.3257776767807, "core_hours_Tesla V100-SXM2-32GB": 147.00778631200419, "core_hours": 147.00778631200419}
{"step": 98050, "global_schedule": 0.04258570075035095, "l2_grads": 2.7218101024627686, "l2_params": 246.21304321289062, "l2_updates": 0.04655323922634125, "training_loss": 1.6893733739852905, "uptime": 35592.44434521196, "examples_seen": 100403200.0, "progress": 0.87955362989675, "epoch": 79.16017203385488, "img/sec/core": 189.6298003021646, "core_hours_Tesla V100-SXM2-32GB": 147.08278624450193, "core_hours": 147.08278624450193}
{"step": 98100, "global_schedule": 0.042273640632629395, "l2_grads": 2.4872591495513916, "l2_params": 246.18711853027344, "l2_updates": 0.04609754681587219, "training_loss": 2.0689048767089844, "uptime": 35609.315605624986, "examples_seen": 100454400.0, "progress": 0.8800021529104658, "epoch": 79.20053928119493, "img/sec/core": 189.67166184745543, "core_hours_Tesla V100-SXM2-32GB": 147.15776962411536, "core_hours": 147.15776962411536}
{"step": 98150, "global_schedule": 0.04196271300315857, "l2_grads": 2.54327130317688, "l2_params": 246.16212463378906, "l2_updates": 0.04577530175447464, "training_loss": 2.3353800773620605, "uptime": 35626.19194110698, "examples_seen": 100505600.0, "progress": 0.8804506759241817, "epoch": 79.24090652853499, "img/sec/core": 189.6146235901567, "core_hours_Tesla V100-SXM2-32GB": 147.23277555959095, "core_hours": 147.23277555959095}
{"step": 98200, "global_schedule": 0.04165291786193848, "l2_grads": 2.6337273120880127, "l2_params": 246.1370849609375, "l2_updates": 0.04560057818889618, "training_loss": 2.6060116291046143, "uptime": 35643.10159128497, "examples_seen": 100556800.0, "progress": 0.8808991989378975, "epoch": 79.28127377587505, "img/sec/core": 189.2410526721583, "core_hours_Tesla V100-SXM2-32GB": 147.30792956038198, "core_hours": 147.30792956038198}
{"step": 98250, "global_schedule": 0.04134416580200195, "l2_grads": 2.5147552490234375, "l2_params": 246.11390686035156, "l2_updates": 0.04610123112797737, "training_loss": 1.5518791675567627, "uptime": 35659.98897142196, "examples_seen": 100608000.0, "progress": 0.8813477219516134, "epoch": 79.32164102321511, "img/sec/core": 189.49061216371814, "core_hours_Tesla V100-SXM2-32GB": 147.38298458321304, "core_hours": 147.38298458321304}
{"step": 98301, "global_schedule": 0.04103657603263855, "l2_grads": 2.5227904319763184, "l2_params": 246.09173583984375, "l2_updates": 0.04435361176729202, "training_loss": 3.0420165061950684, "uptime": 35676.89257476898, "examples_seen": 100659200.0, "progress": 0.8817962449653292, "epoch": 79.36200827055517, "img/sec/core": 189.3087488097294, "core_hours_Tesla V100-SXM2-32GB": 147.45811170919978, "core_hours": 147.45811170919978}
{"step": 98350, "global_schedule": 0.040730029344558716, "l2_grads": 2.5618722438812256, "l2_params": 246.0681915283203, "l2_updates": 0.045163869857788086, "training_loss": 1.536478042602539, "uptime": 35693.75498292199, "examples_seen": 100710400.0, "progress": 0.882244767979045, "epoch": 79.40237551789522, "img/sec/core": 189.77123379782387, "core_hours_Tesla V100-SXM2-32GB": 147.5330557454354, "core_hours": 147.5330557454354}
{"step": 98400, "global_schedule": 0.040424644947052, "l2_grads": 2.729386806488037, "l2_params": 246.04396057128906, "l2_updates": 0.044686250388622284, "training_loss": 1.5496217012405396, "uptime": 35710.64456897596, "examples_seen": 100761600.0, "progress": 0.8826932909927608, "epoch": 79.44274276523528, "img/sec/core": 189.46586315234723, "core_hours_Tesla V100-SXM2-32GB": 147.6081205723419, "core_hours": 147.6081205723419}
{"step": 98450, "global_schedule": 0.04012030363082886, "l2_grads": 2.661745309829712, "l2_params": 246.0208740234375, "l2_updates": 0.04374893009662628, "training_loss": 1.6097954511642456, "uptime": 35727.52701400098, "examples_seen": 100812800.0, "progress": 0.8831418140064766, "epoch": 79.48311001257534, "img/sec/core": 189.5460044594621, "core_hours_Tesla V100-SXM2-32GB": 147.68315366134203, "core_hours": 147.68315366134203}
{"step": 98500, "global_schedule": 0.039817094802856445, "l2_grads": 2.6866276264190674, "l2_params": 245.99673461914062, "l2_updates": 0.04358110576868057, "training_loss": 1.7007734775543213, "uptime": 35744.40502507199, "examples_seen": 100864000.0, "progress": 0.8835903370201925, "epoch": 79.5234772599154, "img/sec/core": 189.59579932359418, "core_hours_Tesla V100-SXM2-32GB": 147.75816704387984, "core_hours": 147.75816704387984}
{"step": 98550, "global_schedule": 0.03951495885848999, "l2_grads": 2.5526742935180664, "l2_params": 245.97291564941406, "l2_updates": 0.04269213601946831, "training_loss": 2.1954636573791504, "uptime": 35761.268967249955, "examples_seen": 100915200.0, "progress": 0.8840388600339083, "epoch": 79.56384450725547, "img/sec/core": 189.75397129747006, "core_hours_Tesla V100-SXM2-32GB": 147.83311789800413, "core_hours": 147.83311789800413}
{"step": 98600, "global_schedule": 0.039213985204696655, "l2_grads": 2.597227096557617, "l2_params": 245.9515838623047, "l2_updates": 0.04296201840043068, "training_loss": 3.287191390991211, "uptime": 35778.176119546, "examples_seen": 100966400.0, "progress": 0.8844873830476242, "epoch": 79.60421175459553, "img/sec/core": 189.26901136087602, "core_hours_Tesla V100-SXM2-32GB": 147.90826079709765, "core_hours": 147.90826079709765}
{"step": 98650, "global_schedule": 0.03891405463218689, "l2_grads": 2.8184359073638916, "l2_params": 245.9287567138672, "l2_updates": 0.04244432970881462, "training_loss": 3.7418293952941895, "uptime": 35795.056434753, "examples_seen": 101017600.0, "progress": 0.88493590606134, "epoch": 79.64457900193558, "img/sec/core": 189.56991980057418, "core_hours_Tesla V100-SXM2-32GB": 147.98328442023987, "core_hours": 147.98328442023987}
{"step": 98700, "global_schedule": 0.038615256547927856, "l2_grads": 2.7675347328186035, "l2_params": 245.9072723388672, "l2_updates": 0.04211342707276344, "training_loss": 1.972893238067627, "uptime": 35811.92346350697, "examples_seen": 101068800.0, "progress": 0.8853844290750559, "epoch": 79.68494624927564, "img/sec/core": 189.71924733610805, "core_hours_Tesla V100-SXM2-32GB": 148.05824899247975, "core_hours": 148.05824899247975}
{"step": 98750, "global_schedule": 0.03831756114959717, "l2_grads": 2.6641650199890137, "l2_params": 245.8846435546875, "l2_updates": 0.04224314168095589, "training_loss": 1.6180939674377441, "uptime": 35828.81834335596, "examples_seen": 101120000.0, "progress": 0.8858329520887717, "epoch": 79.7253134966157, "img/sec/core": 189.40649644169008, "core_hours_Tesla V100-SXM2-32GB": 148.13333734736415, "core_hours": 148.13333734736415}
{"step": 98800, "global_schedule": 0.038020968437194824, "l2_grads": 2.5698275566101074, "l2_params": 245.86276245117188, "l2_updates": 0.041578080505132675, "training_loss": 1.6446192264556885, "uptime": 35845.708603470004, "examples_seen": 101171200.0, "progress": 0.8862814751024876, "epoch": 79.76568074395576, "img/sec/core": 189.45830190852686, "core_hours_Tesla V100-SXM2-32GB": 148.20840517009324, "core_hours": 148.20840517009324}
{"step": 98850, "global_schedule": 0.037725478410720825, "l2_grads": 2.6195335388183594, "l2_params": 245.8407440185547, "l2_updates": 0.04104732349514961, "training_loss": 2.901797294616699, "uptime": 35862.58313837997, "examples_seen": 101222400.0, "progress": 0.8867299981162033, "epoch": 79.80604799129581, "img/sec/core": 189.63485613524847, "core_hours_Tesla V100-SXM2-32GB": 148.28340310302642, "core_hours": 148.28340310302642}
{"step": 98900, "global_schedule": 0.03743112087249756, "l2_grads": 2.671311616897583, "l2_params": 245.81822204589844, "l2_updates": 0.04083843156695366, "training_loss": 2.762249231338501, "uptime": 35879.479906063, "examples_seen": 101273600.0, "progress": 0.8871785211299191, "epoch": 79.84641523863587, "img/sec/core": 189.3853345224544, "core_hours_Tesla V100-SXM2-32GB": 148.35849984828434, "core_hours": 148.35849984828434}
{"step": 98950, "global_schedule": 0.03713783621788025, "l2_grads": 2.5963354110717773, "l2_params": 245.7953338623047, "l2_updates": 0.04071986675262451, "training_loss": 2.515836238861084, "uptime": 35896.35859851597, "examples_seen": 101324800.0, "progress": 0.887627044143635, "epoch": 79.88678248597593, "img/sec/core": 189.5881454630594, "core_hours_Tesla V100-SXM2-32GB": 148.43351625918643, "core_hours": 148.43351625918643}
{"step": 99000, "global_schedule": 0.03684568405151367, "l2_grads": 2.463656187057495, "l2_params": 245.77395629882812, "l2_updates": 0.03996056690812111, "training_loss": 2.3225252628326416, "uptime": 35913.23107129795, "examples_seen": 101376000.0, "progress": 0.8880755671573508, "epoch": 79.92714973331599, "img/sec/core": 189.65803301919235, "core_hours_Tesla V100-SXM2-32GB": 148.50850502710634, "core_hours": 148.50850502710634}
{"step": 99050, "global_schedule": 0.03655466437339783, "l2_grads": 2.6728928089141846, "l2_params": 245.75241088867188, "l2_updates": 0.04042443633079529, "training_loss": 1.614635705947876, "uptime": 35930.70558634598, "examples_seen": 101427200.0, "progress": 0.8885240901710667, "epoch": 79.96751698065604, "img/sec/core": 189.1028527320109, "core_hours_Tesla V100-SXM2-32GB": 148.5837139518621, "core_hours": 148.5837139518621}
{"step": 99100, "global_schedule": 0.03626471757888794, "l2_grads": 2.6322035789489746, "l2_params": 245.73143005371094, "l2_updates": 0.039554327726364136, "training_loss": 1.4778584241867065, "uptime": 35947.60343223397, "examples_seen": 101478400.0, "progress": 0.8889726131847825, "epoch": 80.0078842279961, "img/sec/core": 189.3732503664884, "core_hours_Tesla V100-SXM2-32GB": 148.65881548914203, "core_hours": 148.65881548914203}
{"step": 99150, "global_schedule": 0.035975903272628784, "l2_grads": 2.7139039039611816, "l2_params": 245.70973205566406, "l2_updates": 0.03945884481072426, "training_loss": 1.6175930500030518, "uptime": 35964.50380225899, "examples_seen": 101529600.0, "progress": 0.8894211361984984, "epoch": 80.04825147533616, "img/sec/core": 189.344966723392, "core_hours_Tesla V100-SXM2-32GB": 148.7339282448088, "core_hours": 148.7339282448088}
{"step": 99200, "global_schedule": 0.035688161849975586, "l2_grads": 2.5344817638397217, "l2_params": 245.68734741210938, "l2_updates": 0.038914717733860016, "training_loss": 2.3181209564208984, "uptime": 35981.42594538897, "examples_seen": 101580800.0, "progress": 0.8898696592122142, "epoch": 80.08861872267622, "img/sec/core": 189.10134345398185, "core_hours_Tesla V100-SXM2-32GB": 148.80913776983093, "core_hours": 148.80913776983093}
{"step": 99250, "global_schedule": 0.03540158271789551, "l2_grads": 2.570347309112549, "l2_params": 245.6673583984375, "l2_updates": 0.03888452798128128, "training_loss": 1.7527523040771484, "uptime": 35998.31436833396, "examples_seen": 101632000.0, "progress": 0.8903181822259301, "epoch": 80.12898597001629, "img/sec/core": 189.47891170319153, "core_hours_Tesla V100-SXM2-32GB": 148.88419742736423, "core_hours": 148.88419742736423}
{"step": 99300, "global_schedule": 0.03511607646942139, "l2_grads": 2.6368465423583984, "l2_params": 245.64697265625, "l2_updates": 0.03847191110253334, "training_loss": 3.4214959144592285, "uptime": 36015.21588943596, "examples_seen": 101683200.0, "progress": 0.8907667052396459, "epoch": 80.16935321735635, "img/sec/core": 189.33207139687954, "core_hours_Tesla V100-SXM2-32GB": 148.9593152989287, "core_hours": 148.9593152989287}
{"step": 99350, "global_schedule": 0.034831702709198, "l2_grads": 2.884493827819824, "l2_params": 245.62425231933594, "l2_updates": 0.03712703660130501, "training_loss": 1.6975817680358887, "uptime": 36032.125230189995, "examples_seen": 101734400.0, "progress": 0.8912152282533616, "epoch": 80.2097204646964, "img/sec/core": 189.2445155933363, "core_hours_Tesla V100-SXM2-32GB": 149.03446792450217, "core_hours": 149.03446792450217}
{"step": 99400, "global_schedule": 0.034548431634902954, "l2_grads": 2.4512507915496826, "l2_params": 245.60333251953125, "l2_updates": 0.0380653478205204, "training_loss": 2.2428393363952637, "uptime": 36049.00530851999, "examples_seen": 101785600.0, "progress": 0.8916637512670775, "epoch": 80.25008771203646, "img/sec/core": 189.57258002254824, "core_hours_Tesla V100-SXM2-32GB": 149.1094904948577, "core_hours": 149.1094904948577}
{"step": 99450, "global_schedule": 0.03426632285118103, "l2_grads": 2.7391161918640137, "l2_params": 245.58287048339844, "l2_updates": 0.03756270557641983, "training_loss": 1.5153062343597412, "uptime": 36065.919946882, "examples_seen": 101836800.0, "progress": 0.8921122742807933, "epoch": 80.29045495937652, "img/sec/core": 189.18524484609412, "core_hours_Tesla V100-SXM2-32GB": 149.1846666653555, "core_hours": 149.1846666653555}
{"step": 99500, "global_schedule": 0.033985257148742676, "l2_grads": 2.8892745971679688, "l2_params": 245.56239318847656, "l2_updates": 0.037550605833530426, "training_loss": 1.6922075748443604, "uptime": 36082.818918644974, "examples_seen": 101888000.0, "progress": 0.8925607972945092, "epoch": 80.33082220671658, "img/sec/core": 189.36063358667192, "core_hours_Tesla V100-SXM2-32GB": 149.25977320652427, "core_hours": 149.25977320652427}
{"step": 99550, "global_schedule": 0.03370535373687744, "l2_grads": 2.88665509223938, "l2_params": 245.54281616210938, "l2_updates": 0.03721323236823082, "training_loss": 3.7996749877929688, "uptime": 36099.71551945497, "examples_seen": 101939200.0, "progress": 0.893009320308225, "epoch": 80.37118945405663, "img/sec/core": 189.387204916795, "core_hours_Tesla V100-SXM2-32GB": 149.33486921012428, "core_hours": 149.33486921012428}
{"step": 99600, "global_schedule": 0.03342655301094055, "l2_grads": 2.5585522651672363, "l2_params": 245.523193359375, "l2_updates": 0.03667225316166878, "training_loss": 3.3244810104370117, "uptime": 36116.618584804004, "examples_seen": 101990400.0, "progress": 0.8934578433219409, "epoch": 80.41155670139669, "img/sec/core": 189.3147742094578, "core_hours_Tesla V100-SXM2-32GB": 149.40999394500886, "core_hours": 149.40999394500886}
{"step": 99650, "global_schedule": 0.033148884773254395, "l2_grads": 2.6911020278930664, "l2_params": 245.5028533935547, "l2_updates": 0.03629105165600777, "training_loss": 1.646087884902954, "uptime": 36133.53711707296, "examples_seen": 102041600.0, "progress": 0.8939063663356567, "epoch": 80.45192394873675, "img/sec/core": 189.14170266832951, "core_hours_Tesla V100-SXM2-32GB": 149.4851874217598, "core_hours": 149.4851874217598}
{"step": 99700, "global_schedule": 0.03287231922149658, "l2_grads": 2.588334321975708, "l2_params": 245.484130859375, "l2_updates": 0.036077335476875305, "training_loss": 2.0229897499084473, "uptime": 36150.43237721396, "examples_seen": 102092800.0, "progress": 0.8943548893493725, "epoch": 80.4922911960768, "img/sec/core": 189.40223312897282, "core_hours_Tesla V100-SXM2-32GB": 149.5602774668309, "core_hours": 149.5602774668309}
{"step": 99750, "global_schedule": 0.0325968861579895, "l2_grads": 2.817641496658325, "l2_params": 245.46534729003906, "l2_updates": 0.03554560989141464, "training_loss": 3.8051257133483887, "uptime": 36167.330920348, "examples_seen": 102144000.0, "progress": 0.8948034123630884, "epoch": 80.53265844341686, "img/sec/core": 189.3654366898573, "core_hours_Tesla V100-SXM2-32GB": 149.6353821029822, "core_hours": 149.6353821029822}
{"step": 99800, "global_schedule": 0.03232255578041077, "l2_grads": 2.5443036556243896, "l2_params": 245.44656372070312, "l2_updates": 0.03533092141151428, "training_loss": 3.058795690536499, "uptime": 36184.260333099985, "examples_seen": 102195200.0, "progress": 0.8952519353768041, "epoch": 80.57302569075692, "img/sec/core": 189.02014186081416, "core_hours_Tesla V100-SXM2-32GB": 149.71062393743543, "core_hours": 149.71062393743543}
{"step": 99850, "global_schedule": 0.032049357891082764, "l2_grads": 2.5564043521881104, "l2_params": 245.42822265625, "l2_updates": 0.03461908549070358, "training_loss": 2.623906135559082, "uptime": 36201.17364062095, "examples_seen": 102246400.0, "progress": 0.89570045839052, "epoch": 80.61339293809698, "img/sec/core": 189.20013108215414, "core_hours_Tesla V100-SXM2-32GB": 149.7857941930842, "core_hours": 149.7857941930842}
{"step": 99900, "global_schedule": 0.031777262687683105, "l2_grads": 2.710636615753174, "l2_params": 245.4086151123047, "l2_updates": 0.03455458953976631, "training_loss": 3.6879801750183105, "uptime": 36218.06528983795, "examples_seen": 102297600.0, "progress": 0.8961489814042358, "epoch": 80.65376018543704, "img/sec/core": 189.4427216011751, "core_hours_Tesla V100-SXM2-32GB": 149.8608681896042, "core_hours": 149.8608681896042}
{"step": 99950, "global_schedule": 0.03150632977485657, "l2_grads": 2.6994526386260986, "l2_params": 245.38916015625, "l2_updates": 0.034659527242183685, "training_loss": 1.5549118518829346, "uptime": 36234.982760048995, "examples_seen": 102348800.0, "progress": 0.8965975044179517, "epoch": 80.6941274327771, "img/sec/core": 189.15357675111898, "core_hours_Tesla V100-SXM2-32GB": 149.93605694609772, "core_hours": 149.93605694609772}
{"step": 100000, "global_schedule": 0.03123652935028076, "l2_grads": 2.6967010498046875, "l2_params": 245.37037658691406, "l2_updates": 0.03394250571727753, "training_loss": 3.6549906730651855, "uptime": 36251.89592281898, "examples_seen": 102400000.0, "progress": 0.8970460274316675, "epoch": 80.73449468011717, "img/sec/core": 189.2017503479211, "core_hours_Tesla V100-SXM2-32GB": 150.01122655840877, "core_hours": 150.01122655840877, "minival/prec@1": 0.7915235716515766, "minival/loss": 0.8248275675849546, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.8879057239973918, "real/prec@1": 0.8260136217093323, "real/loss": 1.6271610513714785, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.11037726700306, "train/prec@1": 0.8465831479530109, "train/loss": 0.5824606347613492, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.550261892029084, "v2/prec@1": 0.6368, "v2/loss": 1.5708744262695313, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.367668605002109, "val/prec@1": 0.75908, "val/loss": 0.9526066577148438, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.28567612200277}
{"step": 100050, "global_schedule": 0.030967801809310913, "l2_grads": 2.788011074066162, "l2_params": 245.35240173339844, "l2_updates": 0.034010667353868484, "training_loss": 1.5970675945281982, "uptime": 36305.824727308995, "examples_seen": 102451200.0, "progress": 0.8974945504453834, "epoch": 80.77486192745722, "img/sec/core": 188.8138544533988, "core_hours_Tesla V100-SXM2-32GB": 150.0865505978623, "core_hours": 150.0865505978623}
{"step": 100100, "global_schedule": 0.030700236558914185, "l2_grads": 2.619382381439209, "l2_params": 245.3331298828125, "l2_updates": 0.03333858773112297, "training_loss": 1.7630302906036377, "uptime": 36322.73809873097, "examples_seen": 102502400.0, "progress": 0.8979430734590992, "epoch": 80.81522917479728, "img/sec/core": 189.1994162584062, "core_hours_Tesla V100-SXM2-32GB": 150.16172113751554, "core_hours": 150.16172113751554}
{"step": 100150, "global_schedule": 0.030433744192123413, "l2_grads": 2.6726369857788086, "l2_params": 245.3149871826172, "l2_updates": 0.0333358459174633, "training_loss": 1.5715816020965576, "uptime": 36339.62809447496, "examples_seen": 102553600.0, "progress": 0.898391596472815, "epoch": 80.85559642213734, "img/sec/core": 189.46126739785464, "core_hours_Tesla V100-SXM2-32GB": 150.23678778526659, "core_hours": 150.23678778526659}
{"step": 100200, "global_schedule": 0.03016841411590576, "l2_grads": 2.764188528060913, "l2_params": 245.29698181152344, "l2_updates": 0.033059824258089066, "training_loss": 3.7266592979431152, "uptime": 36356.53101387597, "examples_seen": 102604800.0, "progress": 0.8988401194865309, "epoch": 80.8959636694774, "img/sec/core": 189.31640884528582, "core_hours_Tesla V100-SXM2-32GB": 150.31191187149327, "core_hours": 150.31191187149327}
{"step": 100250, "global_schedule": 0.029904186725616455, "l2_grads": 2.526331663131714, "l2_params": 245.27880859375, "l2_updates": 0.03257850557565689, "training_loss": 2.3041064739227295, "uptime": 36373.42037740897, "examples_seen": 102656000.0, "progress": 0.8992886425002466, "epoch": 80.93633091681745, "img/sec/core": 189.46835940543903, "core_hours_Tesla V100-SXM2-32GB": 150.38697570941773, "core_hours": 150.38697570941773}
{"step": 100300, "global_schedule": 0.02964109182357788, "l2_grads": 2.682313919067383, "l2_params": 245.2603759765625, "l2_updates": 0.03260205313563347, "training_loss": 1.823627233505249, "uptime": 36390.312659382995, "examples_seen": 102707200.0, "progress": 0.8997371655139625, "epoch": 80.97669816415751, "img/sec/core": 189.43562538918596, "core_hours_Tesla V100-SXM2-32GB": 150.46205251819117, "core_hours": 150.46205251819117}
{"step": 100350, "global_schedule": 0.029379159212112427, "l2_grads": 2.5351483821868896, "l2_params": 245.2421875, "l2_updates": 0.032301537692546844, "training_loss": 2.786807060241699, "uptime": 36407.199821279966, "examples_seen": 102758400.0, "progress": 0.9001856885276783, "epoch": 81.01706541149757, "img/sec/core": 189.49306103199473, "core_hours_Tesla V100-SXM2-32GB": 150.5371065710666, "core_hours": 150.5371065710666}
{"step": 100400, "global_schedule": 0.02911829948425293, "l2_grads": 2.600799083709717, "l2_params": 245.2238006591797, "l2_updates": 0.03241504356265068, "training_loss": 1.6043604612350464, "uptime": 36424.08737420698, "examples_seen": 102809600.0, "progress": 0.9006342115413942, "epoch": 81.05743265883763, "img/sec/core": 189.4886733341275, "core_hours_Tesla V100-SXM2-32GB": 150.61216236185334, "core_hours": 150.61216236185334}
{"step": 100450, "global_schedule": 0.028858602046966553, "l2_grads": 2.8385846614837646, "l2_params": 245.20602416992188, "l2_updates": 0.031550440937280655, "training_loss": 1.608748197555542, "uptime": 36440.974307089986, "examples_seen": 102860800.0, "progress": 0.90108273455511, "epoch": 81.09779990617768, "img/sec/core": 189.4956308626436, "core_hours_Tesla V100-SXM2-32GB": 150.68721539688892, "core_hours": 150.68721539688892}
{"step": 100500, "global_schedule": 0.028600037097930908, "l2_grads": 2.854757308959961, "l2_params": 245.18975830078125, "l2_updates": 0.03134361281991005, "training_loss": 3.7351040840148926, "uptime": 36457.87133725098, "examples_seen": 102912000.0, "progress": 0.9015312575688259, "epoch": 81.13816715351774, "img/sec/core": 189.38239261635587, "core_hours_Tesla V100-SXM2-32GB": 150.76231330871556, "core_hours": 150.76231330871556}
{"step": 100550, "global_schedule": 0.028342604637145996, "l2_grads": 2.7345123291015625, "l2_params": 245.1725311279297, "l2_updates": 0.031177939847111702, "training_loss": 1.6000728607177734, "uptime": 36474.73668455996, "examples_seen": 102963200.0, "progress": 0.9019797805825417, "epoch": 81.1785344008578, "img/sec/core": 189.73816200607874, "core_hours_Tesla V100-SXM2-32GB": 150.83727040786658, "core_hours": 150.83727040786658}
{"step": 100600, "global_schedule": 0.02808627486228943, "l2_grads": 2.634291648864746, "l2_params": 245.15582275390625, "l2_updates": 0.030827051028609276, "training_loss": 3.0147883892059326, "uptime": 36491.638548750954, "examples_seen": 103014400.0, "progress": 0.9024283035962575, "epoch": 81.21890164819786, "img/sec/core": 189.32822816699772, "core_hours_Tesla V100-SXM2-32GB": 150.912389804271, "core_hours": 150.912389804271}
{"step": 100650, "global_schedule": 0.02783110737800598, "l2_grads": 2.679340124130249, "l2_params": 245.1390838623047, "l2_updates": 0.03047739714384079, "training_loss": 1.648566722869873, "uptime": 36508.536947772955, "examples_seen": 103065600.0, "progress": 0.9028768266099734, "epoch": 81.25926889553791, "img/sec/core": 189.36705162624304, "core_hours_Tesla V100-SXM2-32GB": 150.98749379992432, "core_hours": 150.98749379992432}
{"step": 100701, "global_schedule": 0.02757704257965088, "l2_grads": 2.7050583362579346, "l2_params": 245.12185668945312, "l2_updates": 0.030395105481147766, "training_loss": 3.5493175983428955, "uptime": 36525.42328633199, "examples_seen": 103116800.0, "progress": 0.9033253496236892, "epoch": 81.29963614287799, "img/sec/core": 189.50230026552236, "core_hours_Tesla V100-SXM2-32GB": 151.06254419352004, "core_hours": 151.06254419352004}
{"step": 100750, "global_schedule": 0.027324140071868896, "l2_grads": 2.860250949859619, "l2_params": 245.1062774658203, "l2_updates": 0.029720930382609367, "training_loss": 3.870298147201538, "uptime": 36542.29284127097, "examples_seen": 103168000.0, "progress": 0.903773872637405, "epoch": 81.34000339021804, "img/sec/core": 189.6908372256818, "core_hours_Tesla V100-SXM2-32GB": 151.13751999324887, "core_hours": 151.13751999324887}
{"step": 100800, "global_schedule": 0.02707231044769287, "l2_grads": 2.549558401107788, "l2_params": 245.09011840820312, "l2_updates": 0.029524754732847214, "training_loss": 2.258512258529663, "uptime": 36559.17838285299, "examples_seen": 103219200.0, "progress": 0.9042223956511208, "epoch": 81.3803706375581, "img/sec/core": 189.51124454358464, "core_hours_Tesla V100-SXM2-32GB": 151.21256684472448, "core_hours": 151.21256684472448}
{"step": 100850, "global_schedule": 0.02682170271873474, "l2_grads": 2.824371576309204, "l2_params": 245.07440185546875, "l2_updates": 0.0293562188744545, "training_loss": 1.6281859874725342, "uptime": 36576.079279359954, "examples_seen": 103270400.0, "progress": 0.9046709186648367, "epoch": 81.42073788489816, "img/sec/core": 189.33906841456883, "core_hours_Tesla V100-SXM2-32GB": 151.287681940311, "core_hours": 151.287681940311}
{"step": 100900, "global_schedule": 0.02657213807106018, "l2_grads": 2.5943796634674072, "l2_params": 245.05812072753906, "l2_updates": 0.02888508513569832, "training_loss": 1.9774600267410278, "uptime": 36592.967876648996, "examples_seen": 103321600.0, "progress": 0.9051194416785525, "epoch": 81.46110513223822, "img/sec/core": 189.4769556780345, "core_hours_Tesla V100-SXM2-32GB": 151.36274237270672, "core_hours": 151.36274237270672}
{"step": 100950, "global_schedule": 0.026323795318603516, "l2_grads": 2.65693998336792, "l2_params": 245.04074096679688, "l2_updates": 0.029090501368045807, "training_loss": 3.5380373001098633, "uptime": 36609.87123772397, "examples_seen": 103372800.0, "progress": 0.9055679646922684, "epoch": 81.50147237957827, "img/sec/core": 189.31146212911398, "core_hours_Tesla V100-SXM2-32GB": 151.43786842192884, "core_hours": 151.43786842192884}
{"step": 101000, "global_schedule": 0.026076525449752808, "l2_grads": 2.6423423290252686, "l2_params": 245.02529907226562, "l2_updates": 0.02861836552619934, "training_loss": 1.8536441326141357, "uptime": 36626.756808037, "examples_seen": 103424000.0, "progress": 0.9060164877059842, "epoch": 81.54183962691833, "img/sec/core": 189.51092208781708, "core_hours_Tesla V100-SXM2-32GB": 151.51291540109784, "core_hours": 151.51291540109784}
{"step": 101050, "global_schedule": 0.02583041787147522, "l2_grads": 2.7035629749298096, "l2_params": 245.00929260253906, "l2_updates": 0.028603017330169678, "training_loss": 1.692651629447937, "uptime": 36644.17979267897, "examples_seen": 103475200.0, "progress": 0.9064650107197, "epoch": 81.58220687425839, "img/sec/core": 189.53271886124983, "core_hours_Tesla V100-SXM2-32GB": 151.587953749662, "core_hours": 151.587953749662}
{"step": 101100, "global_schedule": 0.025585412979125977, "l2_grads": 2.852128505706787, "l2_params": 244.99241638183594, "l2_updates": 0.02820846065878868, "training_loss": 1.70891273021698, "uptime": 36661.09854927298, "examples_seen": 103526400.0, "progress": 0.9069135337334159, "epoch": 81.62257412159845, "img/sec/core": 189.13919484681665, "core_hours_Tesla V100-SXM2-32GB": 151.66314822341317, "core_hours": 151.66314822341317}
{"step": 101150, "global_schedule": 0.02534160017967224, "l2_grads": 2.571333885192871, "l2_params": 244.97659301757812, "l2_updates": 0.027936700731515884, "training_loss": 1.5900182723999023, "uptime": 36677.98064796196, "examples_seen": 103577600.0, "progress": 0.9073620567471317, "epoch": 81.6629413689385, "img/sec/core": 189.54989299342498, "core_hours_Tesla V100-SXM2-32GB": 151.73817977314192, "core_hours": 151.73817977314192}
{"step": 101200, "global_schedule": 0.025098860263824463, "l2_grads": 2.8351755142211914, "l2_params": 244.96188354492188, "l2_updates": 0.02751646190881729, "training_loss": 3.6326522827148438, "uptime": 36694.881721831975, "examples_seen": 103628800.0, "progress": 0.9078105797608476, "epoch": 81.70330861627856, "img/sec/core": 189.33708145474907, "core_hours_Tesla V100-SXM2-32GB": 151.8132956570087, "core_hours": 151.8132956570087}
{"step": 101250, "global_schedule": 0.024857312440872192, "l2_grads": 2.653862476348877, "l2_params": 244.94630432128906, "l2_updates": 0.027346700429916382, "training_loss": 2.459641933441162, "uptime": 36711.78276338399, "examples_seen": 103680000.0, "progress": 0.9082591027745633, "epoch": 81.74367586361862, "img/sec/core": 189.3374435031852, "core_hours_Tesla V100-SXM2-32GB": 151.88841139723988, "core_hours": 151.88841139723988}
{"step": 101300, "global_schedule": 0.024616867303848267, "l2_grads": 2.708343982696533, "l2_params": 244.93173217773438, "l2_updates": 0.02726537548005581, "training_loss": 1.557295560836792, "uptime": 36728.65762282, "examples_seen": 103731200.0, "progress": 0.9087076257882792, "epoch": 81.78404311095868, "img/sec/core": 189.6312092041383, "core_hours_Tesla V100-SXM2-32GB": 151.963410772511, "core_hours": 151.963410772511}
{"step": 101350, "global_schedule": 0.02437761425971985, "l2_grads": 2.675475835800171, "l2_params": 244.91685485839844, "l2_updates": 0.02674214169383049, "training_loss": 3.4255876541137695, "uptime": 36745.555731309985, "examples_seen": 103782400.0, "progress": 0.909156148801995, "epoch": 81.82441035829873, "img/sec/core": 189.37030744573252, "core_hours_Tesla V100-SXM2-32GB": 152.03851347691094, "core_hours": 152.03851347691094}
{"step": 101400, "global_schedule": 0.024139434099197388, "l2_grads": 2.7439799308776855, "l2_params": 244.9019012451172, "l2_updates": 0.026372209191322327, "training_loss": 1.563701868057251, "uptime": 36762.44246088597, "examples_seen": 103833600.0, "progress": 0.9096046718157109, "epoch": 81.8647776056388, "img/sec/core": 189.49791228674968, "core_hours_Tesla V100-SXM2-32GB": 152.11356560835978, "core_hours": 152.11356560835978}
{"step": 101450, "global_schedule": 0.023902446031570435, "l2_grads": 2.635096788406372, "l2_params": 244.8866424560547, "l2_updates": 0.026070015504956245, "training_loss": 3.3943674564361572, "uptime": 36779.332124937966, "examples_seen": 103884800.0, "progress": 0.9100531948294267, "epoch": 81.90514485297886, "img/sec/core": 189.4649881814442, "core_hours_Tesla V100-SXM2-32GB": 152.1886307819242, "core_hours": 152.1886307819242}
{"step": 101500, "global_schedule": 0.023666560649871826, "l2_grads": 2.8185205459594727, "l2_params": 244.870849609375, "l2_updates": 0.025697946548461914, "training_loss": 2.169724702835083, "uptime": 36796.21866975096, "examples_seen": 103936000.0, "progress": 0.9105017178431425, "epoch": 81.94551210031892, "img/sec/core": 189.49998566536442, "core_hours_Tesla V100-SXM2-32GB": 152.2636820922042, "core_hours": 152.2636820922042}
{"step": 101550, "global_schedule": 0.023431837558746338, "l2_grads": 2.688197612762451, "l2_params": 244.85765075683594, "l2_updates": 0.025696180760860443, "training_loss": 2.037039041519165, "uptime": 36813.12257417897, "examples_seen": 103987200.0, "progress": 0.9109502408568584, "epoch": 81.98587934765898, "img/sec/core": 189.30537696948338, "core_hours_Tesla V100-SXM2-32GB": 152.33881055632864, "core_hours": 152.33881055632864}
{"step": 101600, "global_schedule": 0.023198246955871582, "l2_grads": 2.60624098777771, "l2_params": 244.84312438964844, "l2_updates": 0.025254257023334503, "training_loss": 1.781752347946167, "uptime": 36829.99833115295, "examples_seen": 104038400.0, "progress": 0.9113987638705742, "epoch": 82.02624659499904, "img/sec/core": 189.62112365883277, "core_hours_Tesla V100-SXM2-32GB": 152.41381392065747, "core_hours": 152.41381392065747}
{"step": 101650, "global_schedule": 0.022965818643569946, "l2_grads": 2.7876529693603516, "l2_params": 244.82760620117188, "l2_updates": 0.0248174536973238, "training_loss": 1.5949506759643555, "uptime": 36846.889244789956, "examples_seen": 104089600.0, "progress": 0.9118472868842901, "epoch": 82.0666138423391, "img/sec/core": 189.4509716152494, "core_hours_Tesla V100-SXM2-32GB": 152.48888464793305, "core_hours": 152.48888464793305}
{"step": 101700, "global_schedule": 0.022734493017196655, "l2_grads": 2.577392816543579, "l2_params": 244.8140411376953, "l2_updates": 0.02439660020172596, "training_loss": 2.2421181201934814, "uptime": 36863.78858389199, "examples_seen": 104140800.0, "progress": 0.9122958098980058, "epoch": 82.10698108967915, "img/sec/core": 189.35651747557694, "core_hours_Tesla V100-SXM2-32GB": 152.56399282171984, "core_hours": 152.56399282171984}
{"step": 101750, "global_schedule": 0.022504359483718872, "l2_grads": 2.7454586029052734, "l2_params": 244.80064392089844, "l2_updates": 0.024857889860868454, "training_loss": 1.4972350597381592, "uptime": 36880.678569465, "examples_seen": 104192000.0, "progress": 0.9127443329117217, "epoch": 82.14734833701921, "img/sec/core": 189.4613814894615, "core_hours_Tesla V100-SXM2-32GB": 152.63905942426658, "core_hours": 152.63905942426658}
{"step": 101800, "global_schedule": 0.022275328636169434, "l2_grads": 2.7445690631866455, "l2_params": 244.7863311767578, "l2_updates": 0.024232633411884308, "training_loss": 1.5923819541931152, "uptime": 36897.57369877695, "examples_seen": 104243200.0, "progress": 0.9131928559254375, "epoch": 82.18771558435927, "img/sec/core": 189.40369978330628, "core_hours_Tesla V100-SXM2-32GB": 152.7141488878752, "core_hours": 152.7141488878752}
{"step": 101850, "global_schedule": 0.022047489881515503, "l2_grads": 2.697272539138794, "l2_params": 244.7730255126953, "l2_updates": 0.024281825870275497, "training_loss": 1.6486762762069702, "uptime": 36914.470421159, "examples_seen": 104294400.0, "progress": 0.9136413789391533, "epoch": 82.22808283169933, "img/sec/core": 189.38584227431576, "core_hours_Tesla V100-SXM2-32GB": 152.78924543179545, "core_hours": 152.78924543179545}
{"step": 101900, "global_schedule": 0.021820753812789917, "l2_grads": 2.53682279586792, "l2_params": 244.75962829589844, "l2_updates": 0.023716198280453682, "training_loss": 2.9269862174987793, "uptime": 36931.37386307499, "examples_seen": 104345600.0, "progress": 0.9140899019528692, "epoch": 82.26845007903938, "img/sec/core": 189.31055674368193, "core_hours_Tesla V100-SXM2-32GB": 152.86437184031095, "core_hours": 152.86437184031095}
{"step": 101950, "global_schedule": 0.02159518003463745, "l2_grads": 2.6738314628601074, "l2_params": 244.74636840820312, "l2_updates": 0.02332303300499916, "training_loss": 1.9505654573440552, "uptime": 36948.27652772097, "examples_seen": 104396800.0, "progress": 0.914538424966585, "epoch": 82.30881732637944, "img/sec/core": 189.3192622005076, "core_hours_Tesla V100-SXM2-32GB": 152.93949479429313, "core_hours": 152.93949479429313}
{"step": 102000, "global_schedule": 0.021370738744735718, "l2_grads": 2.7921149730682373, "l2_params": 244.7333984375, "l2_updates": 0.023466682061553, "training_loss": 1.7244327068328857, "uptime": 36965.19779311796, "examples_seen": 104448000.0, "progress": 0.9149869479803009, "epoch": 82.3491845737195, "img/sec/core": 189.11115244192075, "core_hours_Tesla V100-SXM2-32GB": 153.0147004182797, "core_hours": 153.0147004182797}
{"step": 102050, "global_schedule": 0.021147459745407104, "l2_grads": 2.61201548576355, "l2_params": 244.7205810546875, "l2_updates": 0.023248549550771713, "training_loss": 2.541531562805176, "uptime": 36982.60479956999, "examples_seen": 104499200.0, "progress": 0.9154354709940167, "epoch": 82.38955182105956, "img/sec/core": 189.28149314679473, "core_hours_Tesla V100-SXM2-32GB": 153.0898383622265, "core_hours": 153.0898383622265}
{"step": 102100, "global_schedule": 0.020925313234329224, "l2_grads": 2.8065543174743652, "l2_params": 244.70730590820312, "l2_updates": 0.022783882915973663, "training_loss": 2.1634202003479004, "uptime": 36999.53953168896, "examples_seen": 104550400.0, "progress": 0.9158839940077326, "epoch": 82.42991906839961, "img/sec/core": 188.96076876322593, "core_hours_Tesla V100-SXM2-32GB": 153.16510383831078, "core_hours": 153.16510383831078}
{"step": 102150, "global_schedule": 0.02070435881614685, "l2_grads": 2.718588352203369, "l2_params": 244.69422912597656, "l2_updates": 0.022478193044662476, "training_loss": 1.9237889051437378, "uptime": 37016.45245080296, "examples_seen": 104601600.0, "progress": 0.9163325170214484, "epoch": 82.47028631573968, "img/sec/core": 189.2044760831478, "core_hours_Tesla V100-SXM2-32GB": 153.24027236770632, "core_hours": 153.24027236770632}
{"step": 102201, "global_schedule": 0.020484477281570435, "l2_grads": 2.6566247940063477, "l2_params": 244.68124389648438, "l2_updates": 0.02228464186191559, "training_loss": 1.6574244499206543, "uptime": 37033.358623798005, "examples_seen": 104652800.0, "progress": 0.9167810400351643, "epoch": 82.51065356307974, "img/sec/core": 189.27997489066826, "core_hours_Tesla V100-SXM2-32GB": 153.315410914351, "core_hours": 153.315410914351}
{"step": 102250, "global_schedule": 0.020265817642211914, "l2_grads": 2.75705885887146, "l2_params": 244.66957092285156, "l2_updates": 0.02216917835175991, "training_loss": 1.542415976524353, "uptime": 37050.264333055005, "examples_seen": 104704000.0, "progress": 0.91722956304888, "epoch": 82.5510208104198, "img/sec/core": 189.28516700208718, "core_hours_Tesla V100-SXM2-32GB": 153.39054739993765, "core_hours": 153.39054739993765}
{"step": 102300, "global_schedule": 0.02004826068878174, "l2_grads": 2.5154287815093994, "l2_params": 244.65647888183594, "l2_updates": 0.022019023075699806, "training_loss": 2.3639955520629883, "uptime": 37067.199538545974, "examples_seen": 104755200.0, "progress": 0.9176780860625958, "epoch": 82.59138805775986, "img/sec/core": 188.9554869414795, "core_hours_Tesla V100-SXM2-32GB": 153.4658149798975, "core_hours": 153.4658149798975}
{"step": 102350, "global_schedule": 0.01983189582824707, "l2_grads": 2.5899412631988525, "l2_params": 244.64337158203125, "l2_updates": 0.021878264844417572, "training_loss": 1.4189927577972412, "uptime": 37084.088535722985, "examples_seen": 104806400.0, "progress": 0.9181266090763117, "epoch": 82.63175530509992, "img/sec/core": 189.4724693515681, "core_hours_Tesla V100-SXM2-32GB": 153.5408771895731, "core_hours": 153.5408771895731}
{"step": 102400, "global_schedule": 0.019616633653640747, "l2_grads": 2.6215004920959473, "l2_params": 244.63104248046875, "l2_updates": 0.021415460854768753, "training_loss": 2.2224299907684326, "uptime": 37101.01109823998, "examples_seen": 104857600.0, "progress": 0.9185751320900275, "epoch": 82.67212255243997, "img/sec/core": 189.09665700964007, "core_hours_Tesla V100-SXM2-32GB": 153.61608857853753, "core_hours": 153.61608857853753}
{"step": 102450, "global_schedule": 0.01940256357192993, "l2_grads": 2.6444239616394043, "l2_params": 244.6186981201172, "l2_updates": 0.02111767791211605, "training_loss": 3.0624985694885254, "uptime": 37117.937358269, "examples_seen": 104908800.0, "progress": 0.9190236551037434, "epoch": 82.71248979978003, "img/sec/core": 189.0553491741744, "core_hours_Tesla V100-SXM2-32GB": 153.69131640088875, "core_hours": 153.69131640088875}
{"step": 102500, "global_schedule": 0.01918959617614746, "l2_grads": 2.850545644760132, "l2_params": 244.60702514648438, "l2_updates": 0.020984767004847527, "training_loss": 1.8014298677444458, "uptime": 37134.853395204, "examples_seen": 104960000.0, "progress": 0.9194721781174592, "epoch": 82.75285704712009, "img/sec/core": 189.1696035126998, "core_hours_Tesla V100-SXM2-32GB": 153.7664987872665, "core_hours": 153.7664987872665, "minival/prec@1": 0.7942553855760225, "minival/loss": 0.8193198593192051, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.924361692974344, "real/prec@1": 0.8275508679035805, "real/loss": 1.6236861797213609, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.166873526992276, "train/prec@1": 0.8481832728408071, "train/loss": 0.575846887130776, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.626326113997493, "v2/prec@1": 0.6358, "v2/loss": 1.5688860473632813, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.36203583504539, "val/prec@1": 0.761, "val/loss": 0.9477263134765626, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.292132911970839}
{"step": 102550, "global_schedule": 0.01897779107093811, "l2_grads": 2.8766214847564697, "l2_params": 244.5948028564453, "l2_updates": 0.020983636379241943, "training_loss": 3.8277385234832764, "uptime": 37188.19251369097, "examples_seen": 105011200.0, "progress": 0.9199207011311751, "epoch": 82.79322429446015, "img/sec/core": 188.61897174615098, "core_hours_Tesla V100-SXM2-32GB": 153.84190065215083, "core_hours": 153.84190065215083}
{"step": 102600, "global_schedule": 0.018767178058624268, "l2_grads": 2.6866226196289062, "l2_params": 244.58267211914062, "l2_updates": 0.020594725385308266, "training_loss": 1.9572417736053467, "uptime": 37205.09373722796, "examples_seen": 105062400.0, "progress": 0.9203692241448909, "epoch": 82.8335915418002, "img/sec/core": 189.33540480053495, "core_hours_Tesla V100-SXM2-32GB": 153.91701720120412, "core_hours": 153.91701720120412}
{"step": 102650, "global_schedule": 0.01855766773223877, "l2_grads": 2.738753318786621, "l2_params": 244.57095336914062, "l2_updates": 0.02021219953894615, "training_loss": 3.3503804206848145, "uptime": 37222.007467624964, "examples_seen": 105113600.0, "progress": 0.9208177471586068, "epoch": 82.87395878914026, "img/sec/core": 189.1954007122245, "core_hours_Tesla V100-SXM2-32GB": 153.99218933630192, "core_hours": 153.99218933630192}
{"step": 102700, "global_schedule": 0.018349379301071167, "l2_grads": 2.668562412261963, "l2_params": 244.55943298339844, "l2_updates": 0.02015538513660431, "training_loss": 1.7228323221206665, "uptime": 37238.92662051297, "examples_seen": 105164800.0, "progress": 0.9212662701723225, "epoch": 82.91432603648032, "img/sec/core": 189.13476467659976, "core_hours_Tesla V100-SXM2-32GB": 154.06738557135972, "core_hours": 154.06738557135972}
{"step": 102750, "global_schedule": 0.01814219355583191, "l2_grads": 2.6926279067993164, "l2_params": 244.54859924316406, "l2_updates": 0.019969383254647255, "training_loss": 1.8629131317138672, "uptime": 37255.834971338976, "examples_seen": 105216000.0, "progress": 0.9217147931860383, "epoch": 82.95469328382038, "img/sec/core": 189.25559523391212, "core_hours_Tesla V100-SXM2-32GB": 154.1425337972531, "core_hours": 154.1425337972531}
{"step": 102800, "global_schedule": 0.01793617010116577, "l2_grads": 2.738647699356079, "l2_params": 244.53688049316406, "l2_updates": 0.019859617576003075, "training_loss": 1.4627532958984375, "uptime": 37272.75477351097, "examples_seen": 105267200.0, "progress": 0.9221633161997542, "epoch": 82.99506053116043, "img/sec/core": 189.12750678000722, "core_hours_Tesla V100-SXM2-32GB": 154.2177329180175, "core_hours": 154.2177329180175}
{"step": 102851, "global_schedule": 0.017731308937072754, "l2_grads": 2.7194201946258545, "l2_params": 244.52606201171875, "l2_updates": 0.019442342221736908, "training_loss": 1.5392581224441528, "uptime": 37289.69842594699, "examples_seen": 105318400.0, "progress": 0.92261183921347, "epoch": 83.0354277785005, "img/sec/core": 188.86128667258708, "core_hours_Tesla V100-SXM2-32GB": 154.29303803995535, "core_hours": 154.29303803995535}
{"step": 102901, "global_schedule": 0.017527610063552856, "l2_grads": 2.657813310623169, "l2_params": 244.51539611816406, "l2_updates": 0.01900653727352619, "training_loss": 2.972170829772949, "uptime": 37306.60930879798, "examples_seen": 105369600.0, "progress": 0.9230603622271859, "epoch": 83.07579502584056, "img/sec/core": 189.22725845813503, "core_hours_Tesla V100-SXM2-32GB": 154.3681975192931, "core_hours": 154.3681975192931}
{"step": 102950, "global_schedule": 0.01732504367828369, "l2_grads": 2.5917701721191406, "l2_params": 244.5045623779297, "l2_updates": 0.018799850717186928, "training_loss": 3.3257460594177246, "uptime": 37323.50735127495, "examples_seen": 105420800.0, "progress": 0.9235088852409017, "epoch": 83.11616227318062, "img/sec/core": 189.37104722996375, "core_hours_Tesla V100-SXM2-32GB": 154.44329993030183, "core_hours": 154.44329993030183}
{"step": 103000, "global_schedule": 0.017123669385910034, "l2_grads": 2.576078414916992, "l2_params": 244.49391174316406, "l2_updates": 0.01849258691072464, "training_loss": 2.5009238719940186, "uptime": 37340.43951209495, "examples_seen": 105472000.0, "progress": 0.9239574082546176, "epoch": 83.15652952052068, "img/sec/core": 188.98946413388435, "core_hours_Tesla V100-SXM2-32GB": 154.5185539783907, "core_hours": 154.5185539783907}
{"step": 103050, "global_schedule": 0.01692339777946472, "l2_grads": 2.706345319747925, "l2_params": 244.48284912109375, "l2_updates": 0.01846158690750599, "training_loss": 1.5108107328414917, "uptime": 37357.834843938996, "examples_seen": 105523200.0, "progress": 0.9244059312683334, "epoch": 83.19689676786074, "img/sec/core": 189.57483802970245, "core_hours_Tesla V100-SXM2-32GB": 154.59357565515984, "core_hours": 154.59357565515984}
{"step": 103100, "global_schedule": 0.016724348068237305, "l2_grads": 2.626844882965088, "l2_params": 244.47201538085938, "l2_updates": 0.0182492695748806, "training_loss": 1.374861240386963, "uptime": 37374.71822789498, "examples_seen": 105574400.0, "progress": 0.9248544542820493, "epoch": 83.2372640152008, "img/sec/core": 189.53546329000983, "core_hours_Tesla V100-SXM2-32GB": 154.6686129171864, "core_hours": 154.6686129171864}
{"step": 103150, "global_schedule": 0.016526401042938232, "l2_grads": 2.609882116317749, "l2_params": 244.46121215820312, "l2_updates": 0.018119322136044502, "training_loss": 1.6576640605926514, "uptime": 37391.61782795796, "examples_seen": 105625600.0, "progress": 0.925302977295765, "epoch": 83.27763126254085, "img/sec/core": 189.3535934621866, "core_hours_Tesla V100-SXM2-32GB": 154.7437222507997, "core_hours": 154.7437222507997}
{"step": 103200, "global_schedule": 0.016329646110534668, "l2_grads": 2.5230813026428223, "l2_params": 244.4508056640625, "l2_updates": 0.018084188923239708, "training_loss": 2.465893268585205, "uptime": 37408.49524543696, "examples_seen": 105676800.0, "progress": 0.9257515003094808, "epoch": 83.31799850988091, "img/sec/core": 189.60246755650718, "core_hours_Tesla V100-SXM2-32GB": 154.8187329951508, "core_hours": 154.8187329951508}
{"step": 103251, "global_schedule": 0.016134023666381836, "l2_grads": 2.7860774993896484, "l2_params": 244.44027709960938, "l2_updates": 0.017478177323937416, "training_loss": 1.4884281158447266, "uptime": 37425.38982260297, "examples_seen": 105728000.0, "progress": 0.9262000233231967, "epoch": 83.35836575722097, "img/sec/core": 189.40988984551453, "core_hours_Tesla V100-SXM2-32GB": 154.8938200047775, "core_hours": 154.8938200047775}
{"step": 103300, "global_schedule": 0.01593959331512451, "l2_grads": 2.9266974925994873, "l2_params": 244.42971801757812, "l2_updates": 0.017446905374526978, "training_loss": 1.6141161918640137, "uptime": 37442.28696122195, "examples_seen": 105779200.0, "progress": 0.9266485463369125, "epoch": 83.39873300456102, "img/sec/core": 189.38117702398702, "core_hours_Tesla V100-SXM2-32GB": 154.96891839863966, "core_hours": 154.96891839863966}
{"step": 103350, "global_schedule": 0.01574629545211792, "l2_grads": 2.6848533153533936, "l2_params": 244.4200439453125, "l2_updates": 0.01718655228614807, "training_loss": 2.535027503967285, "uptime": 37459.165366716974, "examples_seen": 105830400.0, "progress": 0.9270970693506284, "epoch": 83.43910025190108, "img/sec/core": 189.59136874295484, "core_hours_Tesla V100-SXM2-32GB": 155.04393353417308, "core_hours": 155.04393353417308}
{"step": 103400, "global_schedule": 0.015554189682006836, "l2_grads": 2.730693817138672, "l2_params": 244.41049194335938, "l2_updates": 0.0169831495732069, "training_loss": 3.0745763778686523, "uptime": 37476.044679276994, "examples_seen": 105881600.0, "progress": 0.9275455923643442, "epoch": 83.47946749924114, "img/sec/core": 189.5811804314451, "core_hours_Tesla V100-SXM2-32GB": 155.1189527011065, "core_hours": 155.1189527011065}
{"step": 103450, "global_schedule": 0.015363216400146484, "l2_grads": 2.7347679138183594, "l2_params": 244.4006805419922, "l2_updates": 0.01673867739737034, "training_loss": 1.482768177986145, "uptime": 37492.94557372696, "examples_seen": 105932800.0, "progress": 0.9279941153780601, "epoch": 83.5198347465812, "img/sec/core": 189.33909145894467, "core_hours_Tesla V100-SXM2-32GB": 155.1940677875508, "core_hours": 155.1940677875508}
{"step": 103500, "global_schedule": 0.01517343521118164, "l2_grads": 2.5938050746917725, "l2_params": 244.39068603515625, "l2_updates": 0.016593603417277336, "training_loss": 1.4890472888946533, "uptime": 37509.83787899697, "examples_seen": 105984000.0, "progress": 0.9284426383917759, "epoch": 83.56020199392125, "img/sec/core": 189.43536414066511, "core_hours_Tesla V100-SXM2-32GB": 155.26914469986195, "core_hours": 155.26914469986195}
{"step": 103550, "global_schedule": 0.014984756708145142, "l2_grads": 2.8632659912109375, "l2_params": 244.38087463378906, "l2_updates": 0.016296276822686195, "training_loss": 3.644401788711548, "uptime": 37526.71895340795, "examples_seen": 106035200.0, "progress": 0.9288911614054917, "epoch": 83.60056924126133, "img/sec/core": 189.56139414436115, "core_hours_Tesla V100-SXM2-32GB": 155.34417169724412, "core_hours": 155.34417169724412}
{"step": 103600, "global_schedule": 0.014797300100326538, "l2_grads": 2.695024013519287, "l2_params": 244.37100219726562, "l2_updates": 0.016204752027988434, "training_loss": 2.1199827194213867, "uptime": 37543.60656466696, "examples_seen": 106086400.0, "progress": 0.9293396844192076, "epoch": 83.64093648860138, "img/sec/core": 189.48801881575315, "core_hours_Tesla V100-SXM2-32GB": 155.4192277472841, "core_hours": 155.4192277472841}
{"step": 103650, "global_schedule": 0.014610975980758667, "l2_grads": 2.5791635513305664, "l2_params": 244.36146545410156, "l2_updates": 0.015832355245947838, "training_loss": 2.5464138984680176, "uptime": 37560.498272622004, "examples_seen": 106137600.0, "progress": 0.9297882074329233, "epoch": 83.68130373594144, "img/sec/core": 189.4420628462454, "core_hours_Tesla V100-SXM2-32GB": 155.4943020048621, "core_hours": 155.4943020048621}
{"step": 103700, "global_schedule": 0.014425843954086304, "l2_grads": 2.7015349864959717, "l2_params": 244.3524932861328, "l2_updates": 0.015905598178505898, "training_loss": 1.4059784412384033, "uptime": 37577.398341269, "examples_seen": 106188800.0, "progress": 0.9302367304466392, "epoch": 83.7216709832815, "img/sec/core": 189.34834330208034, "core_hours_Tesla V100-SXM2-32GB": 155.569413421071, "core_hours": 155.569413421071}
{"step": 103750, "global_schedule": 0.014241814613342285, "l2_grads": 2.8231608867645264, "l2_params": 244.34371948242188, "l2_updates": 0.01568600907921791, "training_loss": 1.5055081844329834, "uptime": 37594.277714380994, "examples_seen": 106240000.0, "progress": 0.930685253460355, "epoch": 83.76203823062156, "img/sec/core": 189.58050034014556, "core_hours_Tesla V100-SXM2-32GB": 155.6444328571243, "core_hours": 155.6444328571243}
{"step": 103800, "global_schedule": 0.014059007167816162, "l2_grads": 2.8285973072052, "l2_params": 244.33529663085938, "l2_updates": 0.015459146350622177, "training_loss": 3.453461170196533, "uptime": 37611.13886533299, "examples_seen": 106291200.0, "progress": 0.9311337764740709, "epoch": 83.80240547796161, "img/sec/core": 189.78538351919795, "core_hours_Tesla V100-SXM2-32GB": 155.71937130579985, "core_hours": 155.71937130579985}
{"step": 103850, "global_schedule": 0.013877332210540771, "l2_grads": 2.5472922325134277, "l2_params": 244.32635498046875, "l2_updates": 0.01511597353965044, "training_loss": 2.411167621612549, "uptime": 37628.04141269595, "examples_seen": 106342400.0, "progress": 0.9315822994877867, "epoch": 83.84277272530167, "img/sec/core": 189.32057584483513, "core_hours_Tesla V100-SXM2-32GB": 155.7944937385241, "core_hours": 155.7944937385241}
{"step": 103900, "global_schedule": 0.013696849346160889, "l2_grads": 2.65439510345459, "l2_params": 244.3177490234375, "l2_updates": 0.015187609009444714, "training_loss": 2.0132033824920654, "uptime": 37644.91530061199, "examples_seen": 106393600.0, "progress": 0.9320308225015026, "epoch": 83.88313997264173, "img/sec/core": 189.64212728701625, "core_hours_Tesla V100-SXM2-32GB": 155.8694887959287, "core_hours": 155.8694887959287}
{"step": 103950, "global_schedule": 0.013517498970031738, "l2_grads": 2.6917340755462646, "l2_params": 244.3087921142578, "l2_updates": 0.014754042029380798, "training_loss": 1.5194172859191895, "uptime": 37661.80877952697, "examples_seen": 106444800.0, "progress": 0.9324793455152184, "epoch": 83.92350721998179, "img/sec/core": 189.42220344932394, "core_hours_Tesla V100-SXM2-32GB": 155.94457092443972, "core_hours": 155.94457092443972}
{"step": 104000, "global_schedule": 0.013339340686798096, "l2_grads": 2.657733917236328, "l2_params": 244.30030822753906, "l2_updates": 0.01454256847500801, "training_loss": 3.117251396179199, "uptime": 37678.69938621699, "examples_seen": 106496000.0, "progress": 0.9329278685289342, "epoch": 83.96387446732184, "img/sec/core": 189.45441444031022, "core_hours_Tesla V100-SXM2-32GB": 156.01964028750652, "core_hours": 156.01964028750652}
{"step": 104050, "global_schedule": 0.013162344694137573, "l2_grads": 2.644030809402466, "l2_params": 244.2914581298828, "l2_updates": 0.01438381988555193, "training_loss": 3.1168034076690674, "uptime": 37696.331200644956, "examples_seen": 106547200.0, "progress": 0.9333763915426501, "epoch": 84.0042417146619, "img/sec/core": 189.49695734716812, "core_hours_Tesla V100-SXM2-32GB": 156.09469279716853, "core_hours": 156.09469279716853}
{"step": 104100, "global_schedule": 0.012986510992050171, "l2_grads": 2.7331857681274414, "l2_params": 244.28306579589844, "l2_updates": 0.014195390045642853, "training_loss": 2.5856130123138428, "uptime": 37713.226872422965, "examples_seen": 106598400.0, "progress": 0.9338249145563658, "epoch": 84.04460896200196, "img/sec/core": 189.39761863538277, "core_hours_Tesla V100-SXM2-32GB": 156.16978467173746, "core_hours": 156.16978467173746}
{"step": 104150, "global_schedule": 0.012811839580535889, "l2_grads": 2.7903265953063965, "l2_params": 244.27508544921875, "l2_updates": 0.014007025398314, "training_loss": 1.60618257522583, "uptime": 37730.13300950895, "examples_seen": 106649600.0, "progress": 0.9342734375700817, "epoch": 84.08497620934202, "img/sec/core": 189.2803769261217, "core_hours_Tesla V100-SXM2-32GB": 156.24492305878627, "core_hours": 156.24492305878627}
{"step": 104200, "global_schedule": 0.012638360261917114, "l2_grads": 2.8418796062469482, "l2_params": 244.2666473388672, "l2_updates": 0.013856529258191586, "training_loss": 1.4139304161071777, "uptime": 37747.03708238795, "examples_seen": 106700800.0, "progress": 0.9347219605837975, "epoch": 84.12534345668207, "img/sec/core": 189.30349052006386, "core_hours_Tesla V100-SXM2-32GB": 156.32005227158183, "core_hours": 156.32005227158183}
{"step": 104250, "global_schedule": 0.012466013431549072, "l2_grads": 2.7171034812927246, "l2_params": 244.25802612304688, "l2_updates": 0.013812855817377567, "training_loss": 1.4740712642669678, "uptime": 37763.92446627095, "examples_seen": 106752000.0, "progress": 0.9351704835975134, "epoch": 84.16571070402213, "img/sec/core": 189.49057013031884, "core_hours_Tesla V100-SXM2-32GB": 156.39510731106185, "core_hours": 156.39510731106185}
{"step": 104300, "global_schedule": 0.012294858694076538, "l2_grads": 2.817594528198242, "l2_params": 244.24978637695312, "l2_updates": 0.01362563855946064, "training_loss": 1.6506904363632202, "uptime": 37780.810052393994, "examples_seen": 106803200.0, "progress": 0.9356190066112292, "epoch": 84.2060779513622, "img/sec/core": 189.51074464827693, "core_hours_Tesla V100-SXM2-32GB": 156.47015436049756, "core_hours": 156.47015436049756}
{"step": 104350, "global_schedule": 0.012124836444854736, "l2_grads": 2.7911217212677, "l2_params": 244.2421417236328, "l2_updates": 0.012969044968485832, "training_loss": 1.672433614730835, "uptime": 37797.70874713297, "examples_seen": 106854400.0, "progress": 0.9360675296249451, "epoch": 84.24644519870226, "img/sec/core": 189.36373781691444, "core_hours_Tesla V100-SXM2-32GB": 156.5452596704486, "core_hours": 156.5452596704486}
{"step": 104400, "global_schedule": 0.01195603609085083, "l2_grads": 2.884368658065796, "l2_params": 244.23477172851562, "l2_updates": 0.013152709230780602, "training_loss": 1.8725793361663818, "uptime": 37814.602625309955, "examples_seen": 106905600.0, "progress": 0.9365160526386609, "epoch": 84.28681244604232, "img/sec/core": 189.41772673368934, "core_hours_Tesla V100-SXM2-32GB": 156.6203435734574, "core_hours": 156.6203435734574}
{"step": 104450, "global_schedule": 0.011788368225097656, "l2_grads": 2.8476667404174805, "l2_params": 244.2271728515625, "l2_updates": 0.012880945578217506, "training_loss": 3.5605416297912598, "uptime": 37831.50329877995, "examples_seen": 106956800.0, "progress": 0.9369645756523767, "epoch": 84.32717969338238, "img/sec/core": 189.3415671086328, "core_hours_Tesla V100-SXM2-32GB": 156.6954576777685, "core_hours": 156.6954576777685}
{"step": 104500, "global_schedule": 0.01162189245223999, "l2_grads": 2.62949538230896, "l2_params": 244.21958923339844, "l2_updates": 0.012678834609687328, "training_loss": 1.7885215282440186, "uptime": 37848.39144097897, "examples_seen": 107008000.0, "progress": 0.9374130986660926, "epoch": 84.36754694072243, "img/sec/core": 189.48206157247904, "core_hours_Tesla V100-SXM2-32GB": 156.77051608754195, "core_hours": 156.77051608754195}
{"step": 104551, "global_schedule": 0.011456549167633057, "l2_grads": 2.8126375675201416, "l2_params": 244.21188354492188, "l2_updates": 0.012629392556846142, "training_loss": 1.4620931148529053, "uptime": 37865.301801936, "examples_seen": 107059200.0, "progress": 0.9378616216798084, "epoch": 84.40791418806249, "img/sec/core": 189.23309846142888, "core_hours_Tesla V100-SXM2-32GB": 156.84567324735096, "core_hours": 156.84567324735096}
{"step": 104600, "global_schedule": 0.011292427778244019, "l2_grads": 2.8799684047698975, "l2_params": 244.2047882080078, "l2_updates": 0.012406639754772186, "training_loss": 3.7515692710876465, "uptime": 37882.19729468896, "examples_seen": 107110400.0, "progress": 0.9383101446935243, "epoch": 84.44828143540255, "img/sec/core": 189.3996254971717, "core_hours_Tesla V100-SXM2-32GB": 156.92076432625296, "core_hours": 156.92076432625296}
{"step": 104650, "global_schedule": 0.011129438877105713, "l2_grads": 2.7607638835906982, "l2_params": 244.19735717773438, "l2_updates": 0.012198359705507755, "training_loss": 1.6284782886505127, "uptime": 37899.10037281597, "examples_seen": 107161600.0, "progress": 0.93875866770724, "epoch": 84.4886486827426, "img/sec/core": 189.31463109587182, "core_hours_Tesla V100-SXM2-32GB": 156.99588911792858, "core_hours": 156.99588911792858}
{"step": 104700, "global_schedule": 0.010967612266540527, "l2_grads": 2.6479580402374268, "l2_params": 244.18992614746094, "l2_updates": 0.011933487839996815, "training_loss": 2.2089850902557373, "uptime": 37915.996746639954, "examples_seen": 107212800.0, "progress": 0.9392071907209559, "epoch": 84.52901593008266, "img/sec/core": 189.38974914592342, "core_hours_Tesla V100-SXM2-32GB": 157.07098411270184, "core_hours": 157.07098411270184}
{"step": 104750, "global_schedule": 0.010807007551193237, "l2_grads": 2.6648969650268555, "l2_params": 244.18350219726562, "l2_updates": 0.011913870461285114, "training_loss": 1.5379300117492676, "uptime": 37932.91491139197, "examples_seen": 107264000.0, "progress": 0.9396557137346717, "epoch": 84.56938317742272, "img/sec/core": 189.1458114343415, "core_hours_Tesla V100-SXM2-32GB": 157.14617595604415, "core_hours": 157.14617595604415}
{"step": 104800, "global_schedule": 0.010647565126419067, "l2_grads": 2.7495477199554443, "l2_params": 244.1762237548828, "l2_updates": 0.011583013460040092, "training_loss": 2.3816092014312744, "uptime": 37949.802238654986, "examples_seen": 107315200.0, "progress": 0.9401042367483876, "epoch": 84.60975042476278, "img/sec/core": 189.49120545607423, "core_hours_Tesla V100-SXM2-32GB": 157.22123074387977, "core_hours": 157.22123074387977}
{"step": 104850, "global_schedule": 0.01048925518989563, "l2_grads": 2.6521756649017334, "l2_params": 244.16917419433594, "l2_updates": 0.011486382223665714, "training_loss": 2.9445157051086426, "uptime": 37966.70625936199, "examples_seen": 107366400.0, "progress": 0.9405527597621034, "epoch": 84.65011767210284, "img/sec/core": 189.30407477989118, "core_hours_Tesla V100-SXM2-32GB": 157.2963597247998, "core_hours": 157.2963597247998}
{"step": 104900, "global_schedule": 0.0103321373462677, "l2_grads": 2.7915256023406982, "l2_params": 244.16238403320312, "l2_updates": 0.0112903518602252, "training_loss": 1.5473085641860962, "uptime": 37983.61199759197, "examples_seen": 107417600.0, "progress": 0.9410012827758192, "epoch": 84.6904849194429, "img/sec/core": 189.2848426060026, "core_hours_Tesla V100-SXM2-32GB": 157.37149633915527, "core_hours": 157.37149633915527}
{"step": 104950, "global_schedule": 0.010176211595535278, "l2_grads": 2.5806024074554443, "l2_params": 244.1559600830078, "l2_updates": 0.01111371349543333, "training_loss": 3.004544973373413, "uptime": 38000.507900291006, "examples_seen": 107468800.0, "progress": 0.9414498057895351, "epoch": 84.73085216678295, "img/sec/core": 189.39503008518855, "core_hours_Tesla V100-SXM2-32GB": 157.44658924003986, "core_hours": 157.44658924003986}
{"step": 105000, "global_schedule": 0.010021448135375977, "l2_grads": 2.7094783782958984, "l2_params": 244.14926147460938, "l2_updates": 0.011026963591575623, "training_loss": 2.026003360748291, "uptime": 38017.40465700097, "examples_seen": 107520000.0, "progress": 0.9418983288032509, "epoch": 84.77121941412302, "img/sec/core": 189.38545751289524, "core_hours_Tesla V100-SXM2-32GB": 157.52168593652857, "core_hours": 157.52168593652857, "minival/prec@1": 0.793787074617546, "minival/loss": 0.8075874273828368, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.9091816029977053, "real/prec@1": 0.82934432179687, "real/loss": 1.6144338301916754, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.18713530502282, "train/prec@1": 0.8514615774889748, "train/loss": 0.5609786777796327, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.606925631000195, "v2/prec@1": 0.6402, "v2/loss": 1.5529363037109376, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3965466580120847, "val/prec@1": 0.76392, "val/loss": 0.9351817602539062, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.365942597039975}
{"step": 105050, "global_schedule": 0.009867846965789795, "l2_grads": 2.8466851711273193, "l2_params": 244.14312744140625, "l2_updates": 0.010726766660809517, "training_loss": 1.4910037517547607, "uptime": 38071.34518415498, "examples_seen": 107571200.0, "progress": 0.9423468518169668, "epoch": 84.81158666146308, "img/sec/core": 188.57555894628968, "core_hours_Tesla V100-SXM2-32GB": 157.59710516000425, "core_hours": 157.59710516000425}
{"step": 105100, "global_schedule": 0.009715437889099121, "l2_grads": 2.7184700965881348, "l2_params": 244.13702392578125, "l2_updates": 0.010597588494420052, "training_loss": 1.4889447689056396, "uptime": 38088.23796094797, "examples_seen": 107622400.0, "progress": 0.9427953748306825, "epoch": 84.85195390880314, "img/sec/core": 189.43007648859592, "core_hours_Tesla V100-SXM2-32GB": 157.67218416797309, "core_hours": 157.67218416797309}
{"step": 105150, "global_schedule": 0.00956416130065918, "l2_grads": 2.867337465286255, "l2_params": 244.13088989257812, "l2_updates": 0.010513360612094402, "training_loss": 1.5609513521194458, "uptime": 38105.14833035198, "examples_seen": 107673600.0, "progress": 0.9432438978443984, "epoch": 84.8923211561432, "img/sec/core": 189.23300393670064, "core_hours_Tesla V100-SXM2-32GB": 157.74734136532422, "core_hours": 157.74734136532422}
{"step": 105200, "global_schedule": 0.009414106607437134, "l2_grads": 2.5803701877593994, "l2_params": 244.12469482421875, "l2_updates": 0.010339654982089996, "training_loss": 1.8485584259033203, "uptime": 38122.08807707101, "examples_seen": 107724800.0, "progress": 0.9436924208581142, "epoch": 84.93268840348325, "img/sec/core": 188.90483152297995, "core_hours_Tesla V100-SXM2-32GB": 157.8226291285199, "core_hours": 157.8226291285199}
{"step": 105250, "global_schedule": 0.009265214204788208, "l2_grads": 2.7946648597717285, "l2_params": 244.11871337890625, "l2_updates": 0.010191741399466991, "training_loss": 1.5366135835647583, "uptime": 38139.00316936098, "examples_seen": 107776000.0, "progress": 0.9441409438718301, "epoch": 84.97305565082331, "img/sec/core": 189.1801679318749, "core_hours_Tesla V100-SXM2-32GB": 157.89780731647534, "core_hours": 157.89780731647534}
{"step": 105300, "global_schedule": 0.00911751389503479, "l2_grads": 2.8362324237823486, "l2_params": 244.11260986328125, "l2_updates": 0.00998771097511053, "training_loss": 1.6822795867919922, "uptime": 38155.924481072, "examples_seen": 107827200.0, "progress": 0.9445894668855459, "epoch": 85.01342289816337, "img/sec/core": 189.11063484021275, "core_hours_Tesla V100-SXM2-32GB": 157.9730131463021, "core_hours": 157.9730131463021}
{"step": 105350, "global_schedule": 0.008970946073532104, "l2_grads": 2.7209460735321045, "l2_params": 244.10682678222656, "l2_updates": 0.009979134425520897, "training_loss": 1.7543785572052002, "uptime": 38172.83604947699, "examples_seen": 107878400.0, "progress": 0.9450379898992617, "epoch": 85.05379014550343, "img/sec/core": 189.21958764367162, "core_hours_Tesla V100-SXM2-32GB": 158.0481756725465, "core_hours": 158.0481756725465}
{"step": 105400, "global_schedule": 0.008825600147247314, "l2_grads": 2.9110426902770996, "l2_params": 244.1009979248047, "l2_updates": 0.009649538435041904, "training_loss": 1.5942409038543701, "uptime": 38189.740508975985, "examples_seen": 107929600.0, "progress": 0.9454865129129776, "epoch": 85.09415739284348, "img/sec/core": 189.29916098114867, "core_hours_Tesla V100-SXM2-32GB": 158.12330660365313, "core_hours": 158.12330660365313}
{"step": 105450, "global_schedule": 0.008681386709213257, "l2_grads": 2.9545669555664062, "l2_params": 244.09580993652344, "l2_updates": 0.009372535161674023, "training_loss": 3.525244951248169, "uptime": 38206.62958849, "examples_seen": 107980800.0, "progress": 0.9459350359266934, "epoch": 85.13452464018354, "img/sec/core": 189.47154564249797, "core_hours_Tesla V100-SXM2-32GB": 158.19836917927103, "core_hours": 158.19836917927103}
{"step": 105500, "global_schedule": 0.008538395166397095, "l2_grads": 2.6348307132720947, "l2_params": 244.09010314941406, "l2_updates": 0.009298651479184628, "training_loss": 2.7956628799438477, "uptime": 38223.568392001966, "examples_seen": 108032000.0, "progress": 0.9463835589404093, "epoch": 85.1748918875236, "img/sec/core": 188.91535035163793, "core_hours_Tesla V100-SXM2-32GB": 158.27365275043528, "core_hours": 158.27365275043528}
{"step": 105550, "global_schedule": 0.008396565914154053, "l2_grads": 2.6303963661193848, "l2_params": 244.08465576171875, "l2_updates": 0.009164467453956604, "training_loss": 1.8537657260894775, "uptime": 38240.48577318399, "examples_seen": 108083200.0, "progress": 0.946832081954125, "epoch": 85.21525913486366, "img/sec/core": 189.15457218642297, "core_hours_Tesla V100-SXM2-32GB": 158.34884111124427, "core_hours": 158.34884111124427}
{"step": 105600, "global_schedule": 0.00825589895248413, "l2_grads": 2.6517395973205566, "l2_params": 244.0791473388672, "l2_updates": 0.009024018421769142, "training_loss": 1.9690849781036377, "uptime": 38257.40609072399, "examples_seen": 108134400.0, "progress": 0.947280604967841, "epoch": 85.25562638220372, "img/sec/core": 189.1217462340454, "core_hours_Tesla V100-SXM2-32GB": 158.42404252253317, "core_hours": 158.42404252253317}
{"step": 105650, "global_schedule": 0.008116424083709717, "l2_grads": 2.664952278137207, "l2_params": 244.0738983154297, "l2_updates": 0.008872644044458866, "training_loss": 2.4874935150146484, "uptime": 38274.31745284499, "examples_seen": 108185600.0, "progress": 0.9477291279815567, "epoch": 85.29599362954377, "img/sec/core": 189.22189573521706, "core_hours_Tesla V100-SXM2-32GB": 158.49920413195983, "core_hours": 158.49920413195983}
{"step": 105700, "global_schedule": 0.00797814130783081, "l2_grads": 2.751377582550049, "l2_params": 244.06849670410156, "l2_updates": 0.008707717061042786, "training_loss": 1.6442265510559082, "uptime": 38291.228606536984, "examples_seen": 108236800.0, "progress": 0.9481776509952725, "epoch": 85.33636087688384, "img/sec/core": 189.2242278842667, "core_hours_Tesla V100-SXM2-32GB": 158.57436481503538, "core_hours": 158.57436481503538}
{"step": 105750, "global_schedule": 0.007841020822525024, "l2_grads": 2.7968592643737793, "l2_params": 244.0631561279297, "l2_updates": 0.008605306036770344, "training_loss": 1.6596240997314453, "uptime": 38308.14826206496, "examples_seen": 108288000.0, "progress": 0.9486261740089884, "epoch": 85.3767281242239, "img/sec/core": 189.12914596332024, "core_hours_Tesla V100-SXM2-32GB": 158.6495632840486, "core_hours": 158.6495632840486}
{"step": 105800, "global_schedule": 0.007705062627792358, "l2_grads": 2.5199382305145264, "l2_params": 244.0580291748047, "l2_updates": 0.008410449139773846, "training_loss": 2.59806489944458, "uptime": 38325.06334988098, "examples_seen": 108339200.0, "progress": 0.9490746970227042, "epoch": 85.41709537156396, "img/sec/core": 189.18021796909554, "core_hours_Tesla V100-SXM2-32GB": 158.7247414521198, "core_hours": 158.7247414521198}
{"step": 105850, "global_schedule": 0.007570326328277588, "l2_grads": 2.680598020553589, "l2_params": 244.0533447265625, "l2_updates": 0.008279689587652683, "training_loss": 1.7078874111175537, "uptime": 38341.961517964955, "examples_seen": 108390400.0, "progress": 0.9495232200364201, "epoch": 85.45746261890402, "img/sec/core": 189.36963960217236, "core_hours_Tesla V100-SXM2-32GB": 158.7998444213819, "core_hours": 158.7998444213819}
{"step": 105900, "global_schedule": 0.00743672251701355, "l2_grads": 2.60316801071167, "l2_params": 244.0484161376953, "l2_updates": 0.008026777766644955, "training_loss": 1.7812409400939941, "uptime": 38358.880186808005, "examples_seen": 108441600.0, "progress": 0.9499717430501359, "epoch": 85.49782986624407, "img/sec/core": 189.14017584277596, "core_hours_Tesla V100-SXM2-32GB": 158.8750385051288, "core_hours": 158.8750385051288}
{"step": 105950, "global_schedule": 0.007304340600967407, "l2_grads": 2.7397162914276123, "l2_params": 244.04367065429688, "l2_updates": 0.008028867654502392, "training_loss": 1.4614953994750977, "uptime": 38375.800538223004, "examples_seen": 108492800.0, "progress": 0.9504202660638518, "epoch": 85.53819711358413, "img/sec/core": 189.12136760725204, "core_hours_Tesla V100-SXM2-32GB": 158.9502400669732, "core_hours": 158.9502400669732}
{"step": 106000, "global_schedule": 0.007173120975494385, "l2_grads": 2.7658605575561523, "l2_params": 244.03904724121094, "l2_updates": 0.00791155081242323, "training_loss": 1.656440019607544, "uptime": 38392.714028813, "examples_seen": 108544000.0, "progress": 0.9508687890775676, "epoch": 85.57856436092419, "img/sec/core": 189.19808320892352, "core_hours_Tesla V100-SXM2-32GB": 159.0254111362621, "core_hours": 159.0254111362621}
{"step": 106050, "global_schedule": 0.00704309344291687, "l2_grads": 2.753901243209839, "l2_params": 244.03431701660156, "l2_updates": 0.007804022636264563, "training_loss": 1.8248252868652344, "uptime": 38410.121816458006, "examples_seen": 108595200.0, "progress": 0.9513173120912835, "epoch": 85.61893160826425, "img/sec/core": 189.04081935580422, "core_hours_Tesla V100-SXM2-32GB": 159.10064474067988, "core_hours": 159.10064474067988}
{"step": 106100, "global_schedule": 0.006914198398590088, "l2_grads": 2.856447458267212, "l2_params": 244.02980041503906, "l2_updates": 0.007489529438316822, "training_loss": 1.7244415283203125, "uptime": 38427.03891028499, "examples_seen": 108646400.0, "progress": 0.9517658351049992, "epoch": 85.6592988556043, "img/sec/core": 189.15778518034796, "core_hours_Tesla V100-SXM2-32GB": 159.17583182435536, "core_hours": 159.17583182435536}
{"step": 106150, "global_schedule": 0.006786555051803589, "l2_grads": 2.907498598098755, "l2_params": 244.02529907226562, "l2_updates": 0.007404850795865059, "training_loss": 1.5427011251449585, "uptime": 38443.939678024966, "examples_seen": 108697600.0, "progress": 0.952214358118715, "epoch": 85.69966610294436, "img/sec/core": 189.34051098935748, "core_hours_Tesla V100-SXM2-32GB": 159.25094634764412, "core_hours": 159.25094634764412}
{"step": 106200, "global_schedule": 0.006660044193267822, "l2_grads": 2.6197874546051025, "l2_params": 244.02096557617188, "l2_updates": 0.007315530441701412, "training_loss": 2.5086147785186768, "uptime": 38460.856242360955, "examples_seen": 108748800.0, "progress": 0.9526628811324309, "epoch": 85.74003335028442, "img/sec/core": 189.16370584731007, "core_hours_Tesla V100-SXM2-32GB": 159.3261310780263, "core_hours": 159.3261310780263}
{"step": 106250, "global_schedule": 0.0065347254276275635, "l2_grads": 2.638556718826294, "l2_params": 244.01669311523438, "l2_updates": 0.007102258503437042, "training_loss": 2.133253574371338, "uptime": 38477.78390066099, "examples_seen": 108800000.0, "progress": 0.9531114041461467, "epoch": 85.78040059762448, "img/sec/core": 189.03973268375628, "core_hours_Tesla V100-SXM2-32GB": 159.40136511491534, "core_hours": 159.40136511491534}
{"step": 106300, "global_schedule": 0.0064105987548828125, "l2_grads": 2.6268837451934814, "l2_params": 244.0120086669922, "l2_updates": 0.007046521175652742, "training_loss": 2.6444621086120605, "uptime": 38494.67032123299, "examples_seen": 108851200.0, "progress": 0.9535599271598626, "epoch": 85.82076784496454, "img/sec/core": 189.5013799020065, "core_hours_Tesla V100-SXM2-32GB": 159.47641587301314, "core_hours": 159.47641587301314}
{"step": 106350, "global_schedule": 0.006287664175033569, "l2_grads": 2.668678045272827, "l2_params": 244.00827026367188, "l2_updates": 0.0068534971214830875, "training_loss": 1.9892446994781494, "uptime": 38511.57746491197, "examples_seen": 108902400.0, "progress": 0.9540084501735784, "epoch": 85.8611350923046, "img/sec/core": 189.26910782559293, "core_hours_Tesla V100-SXM2-32GB": 159.5515587338086, "core_hours": 159.5515587338086}
{"step": 106400, "global_schedule": 0.006165891885757446, "l2_grads": 2.8903956413269043, "l2_params": 244.00437927246094, "l2_updates": 0.006769627332687378, "training_loss": 3.7468316555023193, "uptime": 38528.49514949997, "examples_seen": 108953600.0, "progress": 0.9544569731872943, "epoch": 85.90150233964465, "img/sec/core": 189.1511798411206, "core_hours_Tesla V100-SXM2-32GB": 159.62674844308862, "core_hours": 159.62674844308862}
{"step": 106450, "global_schedule": 0.006045311689376831, "l2_grads": 2.530635356903076, "l2_params": 244.00045776367188, "l2_updates": 0.0066233063116669655, "training_loss": 2.7220230102539062, "uptime": 38545.405612514995, "examples_seen": 109004800.0, "progress": 0.9549054962010101, "epoch": 85.94186958698472, "img/sec/core": 189.23195640218643, "core_hours_Tesla V100-SXM2-32GB": 159.7019060564887, "core_hours": 159.7019060564887}
{"step": 106500, "global_schedule": 0.005925893783569336, "l2_grads": 2.8173820972442627, "l2_params": 243.9962158203125, "l2_updates": 0.006563775707036257, "training_loss": 3.4660754203796387, "uptime": 38562.31260615098, "examples_seen": 109056000.0, "progress": 0.955354019214726, "epoch": 85.98223683432478, "img/sec/core": 189.27078751531914, "core_hours_Tesla V100-SXM2-32GB": 159.77704825042645, "core_hours": 159.77704825042645}
{"step": 106550, "global_schedule": 0.005807697772979736, "l2_grads": 2.7366268634796143, "l2_params": 243.9925079345703, "l2_updates": 0.006376492325216532, "training_loss": 1.547080159187317, "uptime": 38579.214731774, "examples_seen": 109107200.0, "progress": 0.9558025422284417, "epoch": 86.02260408166484, "img/sec/core": 189.32529975057878, "core_hours_Tesla V100-SXM2-32GB": 159.85216880875095, "core_hours": 159.85216880875095}
{"step": 106600, "global_schedule": 0.005690664052963257, "l2_grads": 2.6300048828125, "l2_params": 243.98841857910156, "l2_updates": 0.0062337820418179035, "training_loss": 1.8234680891036987, "uptime": 38596.098624657956, "examples_seen": 109158400.0, "progress": 0.9562510652421575, "epoch": 86.0629713290049, "img/sec/core": 189.52975015857714, "core_hours_Tesla V100-SXM2-32GB": 159.92720833267964, "core_hours": 159.92720833267964}
{"step": 106650, "global_schedule": 0.005574822425842285, "l2_grads": 2.7870562076568604, "l2_params": 243.9847869873047, "l2_updates": 0.0060583618469536304, "training_loss": 2.0965187549591064, "uptime": 38613.02283520799, "examples_seen": 109209600.0, "progress": 0.9566995882558734, "epoch": 86.10333857634495, "img/sec/core": 189.07824329768792, "core_hours_Tesla V100-SXM2-32GB": 160.00242704623534, "core_hours": 160.00242704623534}
{"step": 106700, "global_schedule": 0.005460143089294434, "l2_grads": 2.8592002391815186, "l2_params": 243.98121643066406, "l2_updates": 0.0060347458347678185, "training_loss": 1.505194067955017, "uptime": 38629.918076276954, "examples_seen": 109260800.0, "progress": 0.9571481112695892, "epoch": 86.14370582368501, "img/sec/core": 189.40244693387046, "core_hours_Tesla V100-SXM2-32GB": 160.07751700654185, "core_hours": 160.07751700654185}
{"step": 106750, "global_schedule": 0.0053466856479644775, "l2_grads": 2.717975378036499, "l2_params": 243.9776153564453, "l2_updates": 0.005865970626473427, "training_loss": 2.971914529800415, "uptime": 38646.828062621, "examples_seen": 109312000.0, "progress": 0.9575966342833051, "epoch": 86.18407307102507, "img/sec/core": 189.23729060999636, "core_hours_Tesla V100-SXM2-32GB": 160.15267250140428, "core_hours": 160.15267250140428}
{"step": 106800, "global_schedule": 0.005234390497207642, "l2_grads": 2.8915016651153564, "l2_params": 243.97396850585938, "l2_updates": 0.00571189820766449, "training_loss": 1.4766771793365479, "uptime": 38663.73903267697, "examples_seen": 109363200.0, "progress": 0.9580451572970209, "epoch": 86.22444031836513, "img/sec/core": 189.22628266800604, "core_hours_Tesla V100-SXM2-32GB": 160.22783236831972, "core_hours": 160.22783236831972}
{"step": 106850, "global_schedule": 0.0051232874393463135, "l2_grads": 2.7492587566375732, "l2_params": 243.97068786621094, "l2_updates": 0.005623191595077515, "training_loss": 1.6453620195388794, "uptime": 38680.645590133965, "examples_seen": 109414400.0, "progress": 0.9584936803107368, "epoch": 86.26480756570518, "img/sec/core": 189.27567058753925, "core_hours_Tesla V100-SXM2-32GB": 160.30297262368413, "core_hours": 160.30297262368413}
{"step": 106900, "global_schedule": 0.005013376474380493, "l2_grads": 2.807274580001831, "l2_params": 243.96742248535156, "l2_updates": 0.005440862383693457, "training_loss": 1.4598195552825928, "uptime": 38697.552584566, "examples_seen": 109465600.0, "progress": 0.9589422033244526, "epoch": 86.30517481304524, "img/sec/core": 189.2707786037041, "core_hours_Tesla V100-SXM2-32GB": 160.37811482115984, "core_hours": 160.37811482115984}
{"step": 106950, "global_schedule": 0.004904627799987793, "l2_grads": 2.8113162517547607, "l2_params": 243.96372985839844, "l2_updates": 0.005410642363131046, "training_loss": 1.5690093040466309, "uptime": 38714.472678977996, "examples_seen": 109516800.0, "progress": 0.9593907263381685, "epoch": 86.3455420603853, "img/sec/core": 189.1242402129561, "core_hours_Tesla V100-SXM2-32GB": 160.45331524076872, "core_hours": 160.45331524076872}
{"step": 107000, "global_schedule": 0.004797071218490601, "l2_grads": 2.6205739974975586, "l2_params": 243.96041870117188, "l2_updates": 0.005263956263661385, "training_loss": 2.4677584171295166, "uptime": 38731.38275089895, "examples_seen": 109568000.0, "progress": 0.9598392493518842, "epoch": 86.38590930772536, "img/sec/core": 189.23633293569713, "core_hours_Tesla V100-SXM2-32GB": 160.52847111597296, "core_hours": 160.52847111597296}
{"step": 107050, "global_schedule": 0.004690706729888916, "l2_grads": 2.842806100845337, "l2_params": 243.95730590820312, "l2_updates": 0.0051312814466655254, "training_loss": 1.915490984916687, "uptime": 38749.09248689795, "examples_seen": 109619200.0, "progress": 0.9602877723656, "epoch": 86.42627655506541, "img/sec/core": 189.1060560351055, "core_hours_Tesla V100-SXM2-32GB": 160.60367876675056, "core_hours": 160.60367876675056}
{"step": 107100, "global_schedule": 0.004585534334182739, "l2_grads": 2.7876532077789307, "l2_params": 243.9542694091797, "l2_updates": 0.0051103271543979645, "training_loss": 1.4834495782852173, "uptime": 38765.99218727095, "examples_seen": 109670400.0, "progress": 0.9607362953793159, "epoch": 86.46664380240547, "img/sec/core": 189.3524695332357, "core_hours_Tesla V100-SXM2-32GB": 160.67878854618615, "core_hours": 160.67878854618615}
{"step": 107150, "global_schedule": 0.00448155403137207, "l2_grads": 2.8232102394104004, "l2_params": 243.95140075683594, "l2_updates": 0.004918121267110109, "training_loss": 1.4933085441589355, "uptime": 38782.879656706995, "examples_seen": 109721600.0, "progress": 0.9611848183930317, "epoch": 86.50701104974554, "img/sec/core": 189.4896101585483, "core_hours_Tesla V100-SXM2-32GB": 160.7538439659019, "core_hours": 160.7538439659019}
{"step": 107200, "global_schedule": 0.004378765821456909, "l2_grads": 2.6480679512023926, "l2_params": 243.94854736328125, "l2_updates": 0.004789050668478012, "training_loss": 2.7297356128692627, "uptime": 38799.78148744296, "examples_seen": 109772800.0, "progress": 0.9616333414067476, "epoch": 86.5473782970856, "img/sec/core": 189.32860291818432, "core_hours_Tesla V100-SXM2-32GB": 160.8289632136173, "core_hours": 160.8289632136173}
{"step": 107250, "global_schedule": 0.004277139902114868, "l2_grads": 2.7837398052215576, "l2_params": 243.94549560546875, "l2_updates": 0.004698164761066437, "training_loss": 3.3709685802459717, "uptime": 38816.69148119696, "examples_seen": 109824000.0, "progress": 0.9620818644204634, "epoch": 86.58774554442566, "img/sec/core": 189.23720768630082, "core_hours_Tesla V100-SXM2-32GB": 160.90411874141284, "core_hours": 160.90411874141284}
{"step": 107300, "global_schedule": 0.004176735877990723, "l2_grads": 2.890986204147339, "l2_params": 243.9427032470703, "l2_updates": 0.004620339721441269, "training_loss": 3.6549267768859863, "uptime": 38833.60572985897, "examples_seen": 109875200.0, "progress": 0.9625303874341793, "epoch": 86.62811279176572, "img/sec/core": 189.18960362614746, "core_hours_Tesla V100-SXM2-32GB": 160.97929317991068, "core_hours": 160.97929317991068}
{"step": 107350, "global_schedule": 0.004077494144439697, "l2_grads": 2.7266058921813965, "l2_params": 243.9399871826172, "l2_updates": 0.0044415961019694805, "training_loss": 3.3682010173797607, "uptime": 38850.51402643096, "examples_seen": 109926400.0, "progress": 0.9629789104478951, "epoch": 86.66848003910577, "img/sec/core": 189.25620250249037, "core_hours_Tesla V100-SXM2-32GB": 161.05444116467507, "core_hours": 161.05444116467507}
{"step": 107400, "global_schedule": 0.00397944450378418, "l2_grads": 2.820261240005493, "l2_params": 243.9373321533203, "l2_updates": 0.004433476831763983, "training_loss": 1.5166314840316772, "uptime": 38867.41446730099, "examples_seen": 109977600.0, "progress": 0.9634274334616109, "epoch": 86.70884728644583, "img/sec/core": 189.34417300764702, "core_hours_Tesla V100-SXM2-32GB": 161.12955423520853, "core_hours": 161.12955423520853}
{"step": 107450, "global_schedule": 0.00388258695602417, "l2_grads": 2.884124994277954, "l2_params": 243.93479919433594, "l2_updates": 0.00426512723788619, "training_loss": 1.4993959665298462, "uptime": 38884.31418444199, "examples_seen": 110028800.0, "progress": 0.9638759564753268, "epoch": 86.74921453378589, "img/sec/core": 189.352281656618, "core_hours_Tesla V100-SXM2-32GB": 161.20466408916852, "core_hours": 161.20466408916852}
{"step": 107500, "global_schedule": 0.003786921501159668, "l2_grads": 2.8866212368011475, "l2_params": 243.93231201171875, "l2_updates": 0.00416000559926033, "training_loss": 3.5842692852020264, "uptime": 38901.23500473896, "examples_seen": 110080000.0, "progress": 0.9643244794890425, "epoch": 86.78958178112595, "img/sec/core": 189.11612698659204, "core_hours_Tesla V100-SXM2-32GB": 161.27986773493285, "core_hours": 161.27986773493285, "minival/prec@1": 0.7949578520137371, "minival/loss": 0.8069018227883589, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.898503825010266, "real/prec@1": 0.8301342955355808, "real/loss": 1.6115917866583844, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.219769826973788, "train/prec@1": 0.8536080864847988, "train/loss": 0.558819469260894, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.595490683976095, "v2/prec@1": 0.6412, "v2/loss": 1.5503418334960937, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3370803790166974, "val/prec@1": 0.76482, "val/loss": 0.9345579052734375, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.35859270702349}
{"step": 107551, "global_schedule": 0.003692418336868286, "l2_grads": 2.742095708847046, "l2_params": 243.92991638183594, "l2_updates": 0.004052653908729553, "training_loss": 1.674927830696106, "uptime": 38954.598027976, "examples_seen": 110131200.0, "progress": 0.9647730025027584, "epoch": 86.829949028466, "img/sec/core": 188.7734453232975, "core_hours_Tesla V100-SXM2-32GB": 161.35520789836454, "core_hours": 161.35520789836454}
{"step": 107600, "global_schedule": 0.0035991370677948, "l2_grads": 2.801633834838867, "l2_params": 243.92752075195312, "l2_updates": 0.003968029282987118, "training_loss": 1.6554286479949951, "uptime": 38971.48368206195, "examples_seen": 110182400.0, "progress": 0.9652215255164742, "epoch": 86.87031627580606, "img/sec/core": 189.5099818882035, "core_hours_Tesla V100-SXM2-32GB": 161.43025524985768, "core_hours": 161.43025524985768}
{"step": 107650, "global_schedule": 0.0035070180892944336, "l2_grads": 2.8980255126953125, "l2_params": 243.9251708984375, "l2_updates": 0.0038089375011622906, "training_loss": 3.7038307189941406, "uptime": 38988.388465719996, "examples_seen": 110233600.0, "progress": 0.9656700485301901, "epoch": 86.91068352314612, "img/sec/core": 189.29553105978337, "core_hours_Tesla V100-SXM2-32GB": 161.50538762167122, "core_hours": 161.50538762167122}
{"step": 107700, "global_schedule": 0.003416121006011963, "l2_grads": 2.81033992767334, "l2_params": 243.92288208007812, "l2_updates": 0.0037803768645972013, "training_loss": 1.463752031326294, "uptime": 39005.299554861966, "examples_seen": 110284800.0, "progress": 0.9661185715439059, "epoch": 86.95105077048618, "img/sec/core": 189.2249501576046, "core_hours_Tesla V100-SXM2-32GB": 161.58054801785775, "core_hours": 161.58054801785775}
{"step": 107750, "global_schedule": 0.0033263862133026123, "l2_grads": 2.7582404613494873, "l2_params": 243.9204559326172, "l2_updates": 0.003666701028123498, "training_loss": 1.5837821960449219, "uptime": 39022.191338929, "examples_seen": 110336000.0, "progress": 0.9665670945576218, "epoch": 86.99141801782623, "img/sec/core": 189.4412092471236, "core_hours_Tesla V100-SXM2-32GB": 161.65562261371124, "core_hours": 161.65562261371124}
{"step": 107800, "global_schedule": 0.0032378733158111572, "l2_grads": 2.676743507385254, "l2_params": 243.91819763183594, "l2_updates": 0.0035390814300626516, "training_loss": 2.5412139892578125, "uptime": 39039.09523970599, "examples_seen": 110387200.0, "progress": 0.9670156175713376, "epoch": 87.03178526516629, "img/sec/core": 189.30541785692233, "core_hours_Tesla V100-SXM2-32GB": 161.73075106160894, "core_hours": 161.73075106160894}
{"step": 107850, "global_schedule": 0.0031505227088928223, "l2_grads": 2.7445566654205322, "l2_params": 243.91604614257812, "l2_updates": 0.0034765577875077724, "training_loss": 1.577879548072815, "uptime": 39056.01300353196, "examples_seen": 110438400.0, "progress": 0.9674641405850534, "epoch": 87.07215251250636, "img/sec/core": 189.1502939110344, "core_hours_Tesla V100-SXM2-32GB": 161.80594112305775, "core_hours": 161.80594112305775}
{"step": 107900, "global_schedule": 0.003064364194869995, "l2_grads": 2.740133762359619, "l2_params": 243.91397094726562, "l2_updates": 0.00343261007219553, "training_loss": 1.513871431350708, "uptime": 39072.92082087195, "examples_seen": 110489600.0, "progress": 0.9679126635987693, "epoch": 87.11251975984642, "img/sec/core": 189.26156674471372, "core_hours_Tesla V100-SXM2-32GB": 161.88108697790213, "core_hours": 161.88108697790213}
{"step": 107950, "global_schedule": 0.0029793977737426758, "l2_grads": 3.1230335235595703, "l2_params": 243.91209411621094, "l2_updates": 0.003267163410782814, "training_loss": 3.664947032928467, "uptime": 39089.83669897297, "examples_seen": 110540800.0, "progress": 0.968361186612485, "epoch": 87.15288700718648, "img/sec/core": 189.17137974688993, "core_hours_Tesla V100-SXM2-32GB": 161.95626865835112, "core_hours": 161.95626865835112}
{"step": 108000, "global_schedule": 0.0028956234455108643, "l2_grads": 2.837322473526001, "l2_params": 243.91015625, "l2_updates": 0.0031551795545965433, "training_loss": 1.4733004570007324, "uptime": 39106.74075825396, "examples_seen": 110592000.0, "progress": 0.9688097096262009, "epoch": 87.19325425452654, "img/sec/core": 189.30364280007845, "core_hours_Tesla V100-SXM2-32GB": 162.03139781071107, "core_hours": 162.03139781071107}
{"step": 108050, "global_schedule": 0.0028130412101745605, "l2_grads": 2.6325879096984863, "l2_params": 243.9083251953125, "l2_updates": 0.003079526126384735, "training_loss": 3.0015101432800293, "uptime": 39124.397090050974, "examples_seen": 110643200.0, "progress": 0.9692582326399167, "epoch": 87.2336215018666, "img/sec/core": 189.41237554296873, "core_hours_Tesla V100-SXM2-32GB": 162.10648383495555, "core_hours": 162.10648383495555}
{"step": 108100, "global_schedule": 0.0027316808700561523, "l2_grads": 2.6775364875793457, "l2_params": 243.9064483642578, "l2_updates": 0.0030327425338327885, "training_loss": 2.5346853733062744, "uptime": 39141.309363432985, "examples_seen": 110694400.0, "progress": 0.9697067556536326, "epoch": 87.27398874920665, "img/sec/core": 189.2117001492931, "core_hours_Tesla V100-SXM2-32GB": 162.18164949443113, "core_hours": 162.18164949443113}
{"step": 108150, "global_schedule": 0.0026514530181884766, "l2_grads": 2.7070200443267822, "l2_params": 243.90460205078125, "l2_updates": 0.002912526950240135, "training_loss": 2.8851242065429688, "uptime": 39158.22376819397, "examples_seen": 110745600.0, "progress": 0.9701552786673484, "epoch": 87.31435599654671, "img/sec/core": 189.18785764076094, "core_hours_Tesla V100-SXM2-32GB": 162.2568246267022, "core_hours": 162.2568246267022}
{"step": 108200, "global_schedule": 0.002572476863861084, "l2_grads": 2.7342617511749268, "l2_params": 243.9027862548828, "l2_updates": 0.0028580075595527887, "training_loss": 1.5594438314437866, "uptime": 39175.13157376496, "examples_seen": 110796800.0, "progress": 0.9706038016810643, "epoch": 87.35472324388677, "img/sec/core": 189.2616984839088, "core_hours_Tesla V100-SXM2-32GB": 162.3319704292399, "core_hours": 162.3319704292399}
{"step": 108250, "global_schedule": 0.0024946630001068115, "l2_grads": 2.73287034034729, "l2_params": 243.90103149414062, "l2_updates": 0.0027592419646680355, "training_loss": 1.4789636135101318, "uptime": 39192.04180747899, "examples_seen": 110848000.0, "progress": 0.9710523246947801, "epoch": 87.39509049122682, "img/sec/core": 189.23452236759795, "core_hours_Tesla V100-SXM2-32GB": 162.4071270235245, "core_hours": 162.4071270235245}
{"step": 108300, "global_schedule": 0.002418041229248047, "l2_grads": 2.8052332401275635, "l2_params": 243.89942932128906, "l2_updates": 0.0026858362834900618, "training_loss": 1.601626992225647, "uptime": 39208.95760854997, "examples_seen": 110899200.0, "progress": 0.9715008477084959, "epoch": 87.43545773856688, "img/sec/core": 189.1722411828203, "core_hours_Tesla V100-SXM2-32GB": 162.48230836161775, "core_hours": 162.48230836161775}
{"step": 108350, "global_schedule": 0.00234261155128479, "l2_grads": 2.6382148265838623, "l2_params": 243.89785766601562, "l2_updates": 0.0025502245407551527, "training_loss": 2.4068872928619385, "uptime": 39225.848268604954, "examples_seen": 110950400.0, "progress": 0.9719493707222118, "epoch": 87.47582498590694, "img/sec/core": 189.4538158712274, "core_hours_Tesla V100-SXM2-32GB": 162.5573779618621, "core_hours": 162.5573779618621}
{"step": 108400, "global_schedule": 0.002268373966217041, "l2_grads": 2.7672128677368164, "l2_params": 243.896240234375, "l2_updates": 0.0024712122976779938, "training_loss": 1.906866192817688, "uptime": 39242.74869470298, "examples_seen": 111001600.0, "progress": 0.9723978937359276, "epoch": 87.516192233247, "img/sec/core": 189.34433850594885, "core_hours_Tesla V100-SXM2-32GB": 162.63249096674224, "core_hours": 162.63249096674224}
{"step": 108450, "global_schedule": 0.0021953284740448, "l2_grads": 2.446239709854126, "l2_params": 243.89471435546875, "l2_updates": 0.0024084460455924273, "training_loss": 2.296177387237549, "uptime": 39259.64990261599, "examples_seen": 111052800.0, "progress": 0.9728464167496435, "epoch": 87.55655948058705, "img/sec/core": 189.3355798278665, "core_hours_Tesla V100-SXM2-32GB": 162.7076074463556, "core_hours": 162.7076074463556}
{"step": 108500, "global_schedule": 0.0021234750747680664, "l2_grads": 2.8929340839385986, "l2_params": 243.8932647705078, "l2_updates": 0.0023120627738535404, "training_loss": 1.7485249042510986, "uptime": 39276.56455058197, "examples_seen": 111104000.0, "progress": 0.9732949397633592, "epoch": 87.59692672792711, "img/sec/core": 189.18513742854753, "core_hours_Tesla V100-SXM2-32GB": 162.78278365953776, "core_hours": 162.78278365953776}
{"step": 108550, "global_schedule": 0.002052813768386841, "l2_grads": 2.6348438262939453, "l2_params": 243.8919219970703, "l2_updates": 0.002264876151457429, "training_loss": 2.475217580795288, "uptime": 39293.488011978974, "examples_seen": 111155200.0, "progress": 0.9737434627770751, "epoch": 87.63729397526717, "img/sec/core": 189.0866132484299, "core_hours_Tesla V100-SXM2-32GB": 162.85799904352444, "core_hours": 162.85799904352444}
{"step": 108600, "global_schedule": 0.001983344554901123, "l2_grads": 2.6169657707214355, "l2_params": 243.8906707763672, "l2_updates": 0.002188440877944231, "training_loss": 3.166376829147339, "uptime": 39310.39846118097, "examples_seen": 111206400.0, "progress": 0.9741919857907909, "epoch": 87.67766122260724, "img/sec/core": 189.2321109732523, "core_hours_Tesla V100-SXM2-32GB": 162.9331565955333, "core_hours": 162.9331565955333}
{"step": 108650, "global_schedule": 0.001915067434310913, "l2_grads": 2.875739336013794, "l2_params": 243.88934326171875, "l2_updates": 0.0021061934530735016, "training_loss": 1.8560962677001953, "uptime": 39327.28518941096, "examples_seen": 111257600.0, "progress": 0.9746405088045068, "epoch": 87.7180284699473, "img/sec/core": 189.4979273910991, "core_hours_Tesla V100-SXM2-32GB": 163.00820872099993, "core_hours": 163.00820872099993}
{"step": 108700, "global_schedule": 0.0018480122089385986, "l2_grads": 2.834068775177002, "l2_params": 243.88807678222656, "l2_updates": 0.0020195781253278255, "training_loss": 3.405881643295288, "uptime": 39344.213073602004, "examples_seen": 111308800.0, "progress": 0.9750890318182226, "epoch": 87.75839571728736, "img/sec/core": 189.0372100781166, "core_hours_Tesla V100-SXM2-32GB": 163.083443761849, "core_hours": 163.083443761849}
{"step": 108750, "global_schedule": 0.0017821192741394043, "l2_grads": 2.853199005126953, "l2_params": 243.88690185546875, "l2_updates": 0.002019770909100771, "training_loss": 1.562075138092041, "uptime": 39361.106300365995, "examples_seen": 111360000.0, "progress": 0.9755375548319384, "epoch": 87.79876296462741, "img/sec/core": 189.42503079525042, "core_hours_Tesla V100-SXM2-32GB": 163.15852476968897, "core_hours": 163.15852476968897}
{"step": 108800, "global_schedule": 0.0017174184322357178, "l2_grads": 2.8546464443206787, "l2_params": 243.8856964111328, "l2_updates": 0.0018858729163184762, "training_loss": 1.5746383666992188, "uptime": 39378.012906569, "examples_seen": 111411200.0, "progress": 0.9759860778456543, "epoch": 87.83913021196747, "img/sec/core": 189.27512485808927, "core_hours_Tesla V100-SXM2-32GB": 163.2336652417023, "core_hours": 163.2336652417023}
{"step": 108850, "global_schedule": 0.001653909683227539, "l2_grads": 2.616150379180908, "l2_params": 243.88458251953125, "l2_updates": 0.0018003100994974375, "training_loss": 1.947489857673645, "uptime": 39394.93385533296, "examples_seen": 111462400.0, "progress": 0.9764346008593701, "epoch": 87.87949745930753, "img/sec/core": 189.1146911818376, "core_hours_Tesla V100-SXM2-32GB": 163.30886945843102, "core_hours": 163.30886945843102}
{"step": 108900, "global_schedule": 0.0015916228294372559, "l2_grads": 2.8416528701782227, "l2_params": 243.88351440429688, "l2_updates": 0.0017502817790955305, "training_loss": 3.6129276752471924, "uptime": 39411.840953786974, "examples_seen": 111513600.0, "progress": 0.976883123873086, "epoch": 87.91986470664759, "img/sec/core": 189.26961410341417, "core_hours_Tesla V100-SXM2-32GB": 163.38401211822665, "core_hours": 163.38401211822665}
{"step": 108950, "global_schedule": 0.0015304982662200928, "l2_grads": 2.8483691215515137, "l2_params": 243.88243103027344, "l2_updates": 0.0016832267865538597, "training_loss": 1.5430585145950317, "uptime": 39428.74435609998, "examples_seen": 111564800.0, "progress": 0.9773316468868017, "epoch": 87.96023195398764, "img/sec/core": 189.31100027936077, "core_hours_Tesla V100-SXM2-32GB": 163.45913835072892, "core_hours": 163.45913835072892}
{"step": 109000, "global_schedule": 0.0014705955982208252, "l2_grads": 2.8274238109588623, "l2_params": 243.88143920898438, "l2_updates": 0.00161492801271379, "training_loss": 1.5286821126937866, "uptime": 39445.670882484, "examples_seen": 111616000.0, "progress": 0.9777801699005176, "epoch": 88.0005992013277, "img/sec/core": 189.0523742083861, "core_hours_Tesla V100-SXM2-32GB": 163.5343673568801, "core_hours": 163.5343673568801}
{"step": 109050, "global_schedule": 0.0014118850231170654, "l2_grads": 2.7992992401123047, "l2_params": 243.88052368164062, "l2_updates": 0.0015485236654058099, "training_loss": 1.5785572528839111, "uptime": 39463.090634236985, "examples_seen": 111667200.0, "progress": 0.9782286929142334, "epoch": 88.04096644866776, "img/sec/core": 189.3556671353673, "core_hours_Tesla V100-SXM2-32GB": 163.6094758679555, "core_hours": 163.6094758679555}
{"step": 109100, "global_schedule": 0.0013543367385864258, "l2_grads": 2.850963592529297, "l2_params": 243.87954711914062, "l2_updates": 0.00147506152279675, "training_loss": 1.8700902462005615, "uptime": 39480.00498249498, "examples_seen": 111718400.0, "progress": 0.9786772159279493, "epoch": 88.08133369600782, "img/sec/core": 189.18848962963347, "core_hours_Tesla V100-SXM2-32GB": 163.68465074910213, "core_hours": 163.68465074910213}
{"step": 109150, "global_schedule": 0.0012980103492736816, "l2_grads": 2.8118977546691895, "l2_params": 243.878662109375, "l2_updates": 0.0014311930863186717, "training_loss": 1.490175724029541, "uptime": 39496.90029703296, "examples_seen": 111769600.0, "progress": 0.9791257389416651, "epoch": 88.12170094334788, "img/sec/core": 189.40162332029124, "core_hours_Tesla V100-SXM2-32GB": 163.7597410359376, "core_hours": 163.7597410359376}
{"step": 109200, "global_schedule": 0.0012428760528564453, "l2_grads": 2.732422113418579, "l2_params": 243.87783813476562, "l2_updates": 0.0013466359814628959, "training_loss": 1.6524131298065186, "uptime": 39513.79781735799, "examples_seen": 111820800.0, "progress": 0.9795742619553809, "epoch": 88.16206819068793, "img/sec/core": 189.37689900333237, "core_hours_Tesla V100-SXM2-32GB": 163.83484112627104, "core_hours": 163.83484112627104}
{"step": 109250, "global_schedule": 0.0011889338493347168, "l2_grads": 2.9267542362213135, "l2_params": 243.87704467773438, "l2_updates": 0.0013055054005235434, "training_loss": 3.6319189071655273, "uptime": 39530.691549904004, "examples_seen": 111872000.0, "progress": 0.9800227849690968, "epoch": 88.20243543802799, "img/sec/core": 189.41935959292, "core_hours_Tesla V100-SXM2-32GB": 163.9099243820311, "core_hours": 163.9099243820311}
{"step": 109300, "global_schedule": 0.001136183738708496, "l2_grads": 2.661877393722534, "l2_params": 243.87632751464844, "l2_updates": 0.0012542007025331259, "training_loss": 2.6421542167663574, "uptime": 39547.61139420798, "examples_seen": 111923200.0, "progress": 0.9804713079828126, "epoch": 88.24280268536806, "img/sec/core": 189.1270358349301, "core_hours_Tesla V100-SXM2-32GB": 163.98512369004882, "core_hours": 163.98512369004882}
{"step": 109350, "global_schedule": 0.001084655523300171, "l2_grads": 2.886655569076538, "l2_params": 243.87559509277344, "l2_updates": 0.0011887496802955866, "training_loss": 2.4319729804992676, "uptime": 39564.50386165397, "examples_seen": 111974400.0, "progress": 0.9809198309965285, "epoch": 88.28316993270812, "img/sec/core": 189.43354546825458, "core_hours_Tesla V100-SXM2-32GB": 164.06020132314205, "core_hours": 164.06020132314205}
{"step": 109400, "global_schedule": 0.0010342895984649658, "l2_grads": 2.707549810409546, "l2_params": 243.8748321533203, "l2_updates": 0.0011357179610058665, "training_loss": 1.479651689529419, "uptime": 39581.39594655397, "examples_seen": 112025600.0, "progress": 0.9813683540102442, "epoch": 88.32353718004818, "img/sec/core": 189.4378354681511, "core_hours_Tesla V100-SXM2-32GB": 164.13527725603095, "core_hours": 164.13527725603095}
{"step": 109450, "global_schedule": 0.0009851455688476562, "l2_grads": 2.715697765350342, "l2_params": 243.87411499023438, "l2_updates": 0.0010793465189635754, "training_loss": 1.6125308275222778, "uptime": 39598.295146674966, "examples_seen": 112076800.0, "progress": 0.9818168770239601, "epoch": 88.36390442738823, "img/sec/core": 189.35807476613448, "core_hours_Tesla V100-SXM2-32GB": 164.21038481212426, "core_hours": 164.21038481212426}
{"step": 109500, "global_schedule": 0.0009371638298034668, "l2_grads": 2.7153215408325195, "l2_params": 243.87347412109375, "l2_updates": 0.0010250097839161754, "training_loss": 2.3075926303863525, "uptime": 39615.175085758965, "examples_seen": 112128000.0, "progress": 0.9822654000376759, "epoch": 88.40427167472829, "img/sec/core": 189.57414384470636, "core_hours_Tesla V100-SXM2-32GB": 164.2854067636087, "core_hours": 164.2854067636087}
{"step": 109550, "global_schedule": 0.0008904039859771729, "l2_grads": 2.8326218128204346, "l2_params": 243.87277221679688, "l2_updates": 0.0009680581279098988, "training_loss": 1.9700679779052734, "uptime": 39632.06366435398, "examples_seen": 112179200.0, "progress": 0.9827139230513917, "epoch": 88.44463892206835, "img/sec/core": 189.47716541078287, "core_hours_Tesla V100-SXM2-32GB": 164.3604671129199, "core_hours": 164.3604671129199}
{"step": 109600, "global_schedule": 0.0008448362350463867, "l2_grads": 2.679887056350708, "l2_params": 243.87216186523438, "l2_updates": 0.0009274440235458314, "training_loss": 2.7263829708099365, "uptime": 39648.95874359296, "examples_seen": 112230400.0, "progress": 0.9831624460651076, "epoch": 88.48500616940841, "img/sec/core": 189.4042611304787, "core_hours_Tesla V100-SXM2-32GB": 164.43555635398204, "core_hours": 164.43555635398204}
{"step": 109650, "global_schedule": 0.0008004605770111084, "l2_grads": 2.981973648071289, "l2_params": 243.87156677246094, "l2_updates": 0.0008741361671127379, "training_loss": 1.633277416229248, "uptime": 39665.86536529299, "examples_seen": 112281600.0, "progress": 0.9836109690788234, "epoch": 88.52537341674847, "img/sec/core": 189.27495136376783, "core_hours_Tesla V100-SXM2-32GB": 164.51069689487107, "core_hours": 164.51069689487107}
{"step": 109700, "global_schedule": 0.0007572770118713379, "l2_grads": 2.730219602584839, "l2_params": 243.87106323242188, "l2_updates": 0.0008253066916950047, "training_loss": 1.6887528896331787, "uptime": 39682.75843130896, "examples_seen": 112332800.0, "progress": 0.9840594920925393, "epoch": 88.56574066408852, "img/sec/core": 189.42683329215086, "core_hours_Tesla V100-SXM2-32GB": 164.58577718827536, "core_hours": 164.58577718827536}
{"step": 109750, "global_schedule": 0.0007152855396270752, "l2_grads": 2.869267463684082, "l2_params": 243.8705291748047, "l2_updates": 0.0007866970263421535, "training_loss": 1.8598830699920654, "uptime": 39699.65883017797, "examples_seen": 112384000.0, "progress": 0.9845080151062551, "epoch": 88.60610791142858, "img/sec/core": 189.34464356743305, "core_hours_Tesla V100-SXM2-32GB": 164.66089007213762, "core_hours": 164.66089007213762}
{"step": 109800, "global_schedule": 0.000674515962600708, "l2_grads": 2.7602791786193848, "l2_params": 243.8701934814453, "l2_updates": 0.0007414910942316055, "training_loss": 1.5818294286727905, "uptime": 39716.542153424, "examples_seen": 112435200.0, "progress": 0.984956538119971, "epoch": 88.64647515876864, "img/sec/core": 189.536144831691, "core_hours_Tesla V100-SXM2-32GB": 164.73592706434223, "core_hours": 164.73592706434223}
{"step": 109850, "global_schedule": 0.0006349086761474609, "l2_grads": 2.6315722465515137, "l2_params": 243.8697052001953, "l2_updates": 0.0006890564109198749, "training_loss": 2.1743147373199463, "uptime": 39733.43666486, "examples_seen": 112486400.0, "progress": 0.9854050611336868, "epoch": 88.6868424061087, "img/sec/core": 189.41062676615857, "core_hours_Tesla V100-SXM2-32GB": 164.81101378183556, "core_hours": 164.81101378183556}
{"step": 109900, "global_schedule": 0.0005965232849121094, "l2_grads": 2.8856191635131836, "l2_params": 243.86927795410156, "l2_updates": 0.000650832720566541, "training_loss": 1.7823423147201538, "uptime": 39750.357996834966, "examples_seen": 112537600.0, "progress": 0.9858535841474027, "epoch": 88.72720965344875, "img/sec/core": 189.1104083729144, "core_hours_Tesla V100-SXM2-32GB": 164.8862197017243, "core_hours": 164.8862197017243}
{"step": 109950, "global_schedule": 0.0005593299865722656, "l2_grads": 2.9438364505767822, "l2_params": 243.868896484375, "l2_updates": 0.0006158293690532446, "training_loss": 1.520992398262024, "uptime": 39767.250981926976, "examples_seen": 112588800.0, "progress": 0.9863021071611184, "epoch": 88.76757690078881, "img/sec/core": 189.4277407202272, "core_hours_Tesla V100-SXM2-32GB": 164.96129963546656, "core_hours": 164.96129963546656}
{"step": 110000, "global_schedule": 0.0005233287811279297, "l2_grads": 2.9136736392974854, "l2_params": 243.8685760498047, "l2_updates": 0.0005680317408405244, "training_loss": 1.621914267539978, "uptime": 39784.155036323995, "examples_seen": 112640000.0, "progress": 0.9867506301748342, "epoch": 88.80794414812888, "img/sec/core": 189.30369749427598, "core_hours_Tesla V100-SXM2-32GB": 165.03642876611997, "core_hours": 165.03642876611997, "minival/prec@1": 0.7961286294099282, "minival/loss": 0.8031696506563366, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.895921591029037, "real/prec@1": 0.8302837500266883, "real/loss": 1.6079780967437602, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.155113092041574, "train/prec@1": 0.8536471139210865, "train/loss": 0.5553716836822203, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.594566793995909, "v2/prec@1": 0.6425, "v2/loss": 1.5485549682617188, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.4025398470112123, "val/prec@1": 0.76534, "val/loss": 0.9308492114257813, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.305505837954115}
{"step": 110050, "global_schedule": 0.0004885196685791016, "l2_grads": 2.9466030597686768, "l2_params": 243.86825561523438, "l2_updates": 0.0005356204928830266, "training_loss": 3.6783571243286133, "uptime": 39838.08729874797, "examples_seen": 112691200.0, "progress": 0.9871991531885501, "epoch": 88.84831139546894, "img/sec/core": 188.90284726587885, "core_hours_Tesla V100-SXM2-32GB": 165.1117173201469, "core_hours": 165.1117173201469}
{"step": 110100, "global_schedule": 0.00045493245124816895, "l2_grads": 2.801126003265381, "l2_params": 243.86790466308594, "l2_updates": 0.0004959852667525411, "training_loss": 2.093449115753174, "uptime": 39854.96590964496, "examples_seen": 112742400.0, "progress": 0.9876476762022659, "epoch": 88.888678642809, "img/sec/core": 189.58906153644648, "core_hours_Tesla V100-SXM2-32GB": 165.18673336857802, "core_hours": 165.18673336857802}
{"step": 110150, "global_schedule": 0.00042250752449035645, "l2_grads": 3.08522629737854, "l2_params": 243.8675994873047, "l2_updates": 0.00046105252113193274, "training_loss": 3.7727367877960205, "uptime": 39871.87625397998, "examples_seen": 112793600.0, "progress": 0.9880961992159818, "epoch": 88.92904589014906, "img/sec/core": 189.23328446798573, "core_hours_Tesla V100-SXM2-32GB": 165.26189045451142, "core_hours": 165.26189045451142}
{"step": 110200, "global_schedule": 0.00039130449295043945, "l2_grads": 2.6685097217559814, "l2_params": 243.86734008789062, "l2_updates": 0.00043021253077313304, "training_loss": 1.496410608291626, "uptime": 39888.76489669195, "examples_seen": 112844800.0, "progress": 0.9885447222296976, "epoch": 88.96941313748911, "img/sec/core": 189.47644606937664, "core_hours_Tesla V100-SXM2-32GB": 165.33695108878686, "core_hours": 165.33695108878686}
{"step": 110250, "global_schedule": 0.0003612935543060303, "l2_grads": 2.8830978870391846, "l2_params": 243.86712646484375, "l2_updates": 0.0003980874898843467, "training_loss": 3.633723735809326, "uptime": 39905.671901619, "examples_seen": 112896000.0, "progress": 0.9889932452434135, "epoch": 89.00978038482917, "img/sec/core": 189.27066111395135, "core_hours_Tesla V100-SXM2-32GB": 165.4120933329071, "core_hours": 165.4120933329071}
{"step": 110300, "global_schedule": 0.0003324747085571289, "l2_grads": 2.7601306438446045, "l2_params": 243.86685180664062, "l2_updates": 0.0003652118903119117, "training_loss": 1.5357978343963623, "uptime": 39922.57977887499, "examples_seen": 112947200.0, "progress": 0.9894417682571293, "epoch": 89.05014763216923, "img/sec/core": 189.2608960635041, "core_hours_Tesla V100-SXM2-32GB": 165.4872394540448, "core_hours": 165.4872394540448}
{"step": 110350, "global_schedule": 0.00030484795570373535, "l2_grads": 2.768587827682495, "l2_params": 243.86666870117188, "l2_updates": 0.00033352471655234694, "training_loss": 1.9720475673675537, "uptime": 39939.46793747699, "examples_seen": 112998400.0, "progress": 0.9898902912708452, "epoch": 89.09051487950929, "img/sec/core": 189.48187753406603, "core_hours_Tesla V100-SXM2-32GB": 165.56229793672037, "core_hours": 165.56229793672037}
{"step": 110400, "global_schedule": 0.0002784132957458496, "l2_grads": 2.9293413162231445, "l2_params": 243.866455078125, "l2_updates": 0.0003054704866372049, "training_loss": 1.5505075454711914, "uptime": 39956.379047747, "examples_seen": 113049600.0, "progress": 0.9903388142845609, "epoch": 89.13088212684934, "img/sec/core": 189.22471374777365, "core_hours_Tesla V100-SXM2-32GB": 165.6374584268093, "core_hours": 165.6374584268093}
{"step": 110450, "global_schedule": 0.0002532005310058594, "l2_grads": 2.609743356704712, "l2_params": 243.86627197265625, "l2_updates": 0.0002780586655717343, "training_loss": 2.6787922382354736, "uptime": 39973.267827414966, "examples_seen": 113100800.0, "progress": 0.9907873372982767, "epoch": 89.1712493741894, "img/sec/core": 189.4749095501698, "core_hours_Tesla V100-SXM2-32GB": 165.71251966977803, "core_hours": 165.71251966977803}
{"step": 110500, "global_schedule": 0.00022915005683898926, "l2_grads": 2.8123695850372314, "l2_params": 243.86610412597656, "l2_updates": 0.00025274025392718613, "training_loss": 1.6488410234451294, "uptime": 39990.16997322498, "examples_seen": 113152000.0, "progress": 0.9912358603119926, "epoch": 89.21161662152946, "img/sec/core": 189.32507363079154, "core_hours_Tesla V100-SXM2-32GB": 165.78764031782254, "core_hours": 165.78764031782254}
{"step": 110550, "global_schedule": 0.00020632147789001465, "l2_grads": 2.4798734188079834, "l2_params": 243.865966796875, "l2_updates": 0.00022690879995934665, "training_loss": 2.9172961711883545, "uptime": 40007.079773237, "examples_seen": 113203200.0, "progress": 0.9916843833257084, "epoch": 89.25198386886952, "img/sec/core": 189.23937584870913, "core_hours_Tesla V100-SXM2-32GB": 165.8627949845426, "core_hours": 165.8627949845426}
{"step": 110600, "global_schedule": 0.00018468499183654785, "l2_grads": 3.012042284011841, "l2_params": 243.86582946777344, "l2_updates": 0.00020331252017058432, "training_loss": 3.6576507091522217, "uptime": 40023.98523245996, "examples_seen": 113254400.0, "progress": 0.9921329063394243, "epoch": 89.29235111620957, "img/sec/core": 189.2879665553738, "core_hours_Tesla V100-SXM2-32GB": 165.9379303588669, "core_hours": 165.9379303588669}
{"step": 110650, "global_schedule": 0.00016427040100097656, "l2_grads": 2.8263697624206543, "l2_params": 243.86572265625, "l2_updates": 0.00018018584523815662, "training_loss": 1.5230600833892822, "uptime": 40040.89763704897, "examples_seen": 113305600.0, "progress": 0.9925814293531401, "epoch": 89.33271836354963, "img/sec/core": 189.21023223866257, "core_hours_Tesla V100-SXM2-32GB": 166.0130966014847, "core_hours": 166.0130966014847}
{"step": 110700, "global_schedule": 0.0001450181007385254, "l2_grads": 2.598355293273926, "l2_params": 243.86563110351562, "l2_updates": 0.00015807706222403795, "training_loss": 2.8056373596191406, "uptime": 40057.79612381896, "examples_seen": 113356800.0, "progress": 0.993029952366856, "epoch": 89.37308561088969, "img/sec/core": 189.36606830871312, "core_hours_Tesla V100-SXM2-32GB": 166.0882009871291, "core_hours": 166.0882009871291}
{"step": 110750, "global_schedule": 0.00012698769569396973, "l2_grads": 2.851620674133301, "l2_params": 243.86550903320312, "l2_updates": 0.00013963195669930428, "training_loss": 1.6963903903961182, "uptime": 40074.72618263698, "examples_seen": 113408000.0, "progress": 0.9934784753805718, "epoch": 89.41345285822976, "img/sec/core": 189.0129286848129, "core_hours_Tesla V100-SXM2-32GB": 166.16344569298698, "core_hours": 166.16344569298698}
{"step": 110800, "global_schedule": 0.00011014938354492188, "l2_grads": 2.665313243865967, "l2_params": 243.8654327392578, "l2_updates": 0.00012080200394848362, "training_loss": 3.0235517024993896, "uptime": 40091.637347057986, "examples_seen": 113459200.0, "progress": 0.9939269983942877, "epoch": 89.45382010556982, "img/sec/core": 189.2241078340613, "core_hours_Tesla V100-SXM2-32GB": 166.238606423747, "core_hours": 166.238606423747}
{"step": 110850, "global_schedule": 9.450316429138184e-05, "l2_grads": 2.75223970413208, "l2_params": 243.86534118652344, "l2_updates": 0.00010387326619820669, "training_loss": 1.6330361366271973, "uptime": 40108.54906219599, "examples_seen": 113510400.0, "progress": 0.9943755214080034, "epoch": 89.49418735290988, "img/sec/core": 189.217945896496, "core_hours_Tesla V100-SXM2-32GB": 166.31376960213814, "core_hours": 166.31376960213814}
{"step": 110900, "global_schedule": 8.004903793334961e-05, "l2_grads": 2.702000379562378, "l2_params": 243.86526489257812, "l2_updates": 8.88040813151747e-05, "training_loss": 1.600416898727417, "uptime": 40125.46207473596, "examples_seen": 113561600.0, "progress": 0.9948240444217192, "epoch": 89.53455460024993, "img/sec/core": 189.20343093449125, "core_hours_Tesla V100-SXM2-32GB": 166.38893854676022, "core_hours": 166.38893854676022}
{"step": 110950, "global_schedule": 6.67870044708252e-05, "l2_grads": 2.66249942779541, "l2_params": 243.86521911621094, "l2_updates": 7.351725071202964e-05, "training_loss": 1.8863213062286377, "uptime": 40142.36723399698, "examples_seen": 113612800.0, "progress": 0.9952725674354351, "epoch": 89.57492184758999, "img/sec/core": 189.2913252452275, "core_hours_Tesla V100-SXM2-32GB": 166.4640725879203, "core_hours": 166.4640725879203}
{"step": 111000, "global_schedule": 5.474686622619629e-05, "l2_grads": 2.5724730491638184, "l2_params": 243.86517333984375, "l2_updates": 6.1022677982691675e-05, "training_loss": 2.3148579597473145, "uptime": 40159.26537689497, "examples_seen": 113664000.0, "progress": 0.9957210904491509, "epoch": 89.61528909493005, "img/sec/core": 189.3699218498566, "core_hours_Tesla V100-SXM2-32GB": 166.5391754452447, "core_hours": 166.5391754452447}
{"step": 111050, "global_schedule": 4.3898820877075195e-05, "l2_grads": 2.9394662380218506, "l2_params": 243.8651580810547, "l2_updates": 4.821263428311795e-05, "training_loss": 1.5502510070800781, "uptime": 40176.99565794197, "examples_seen": 113715200.0, "progress": 0.9961696134628668, "epoch": 89.6556563422701, "img/sec/core": 189.4450152094329, "core_hours_Tesla V100-SXM2-32GB": 166.6142485328448, "core_hours": 166.6142485328448}
{"step": 111100, "global_schedule": 3.4242868423461914e-05, "l2_grads": 2.869375467300415, "l2_params": 243.8651123046875, "l2_updates": 3.749760799109936e-05, "training_loss": 1.8067481517791748, "uptime": 40193.894948447996, "examples_seen": 113766400.0, "progress": 0.9966181364765826, "epoch": 89.69602358961016, "img/sec/core": 189.35706199371336, "core_hours_Tesla V100-SXM2-32GB": 166.6893564906494, "core_hours": 166.6893564906494}
{"step": 111150, "global_schedule": 2.5779008865356445e-05, "l2_grads": 2.6933584213256836, "l2_params": 243.86509704589844, "l2_updates": 2.8149268473498523e-05, "training_loss": 1.7351253032684326, "uptime": 40210.796415864956, "examples_seen": 113817600.0, "progress": 0.9970666594902985, "epoch": 89.73639083695022, "img/sec/core": 189.3326727825444, "core_hours_Tesla V100-SXM2-32GB": 166.76447412361364, "core_hours": 166.76447412361364}
{"step": 111200, "global_schedule": 1.850724220275879e-05, "l2_grads": 2.698089599609375, "l2_params": 243.8650665283203, "l2_updates": 2.0467410649871454e-05, "training_loss": 1.4647982120513916, "uptime": 40227.71487605595, "examples_seen": 113868800.0, "progress": 0.9975151825040143, "epoch": 89.77675808429028, "img/sec/core": 189.1425084715033, "core_hours_Tesla V100-SXM2-32GB": 166.83966728001806, "core_hours": 166.83966728001806}
{"step": 111250, "global_schedule": 1.245737075805664e-05, "l2_grads": 2.8530020713806152, "l2_params": 243.8650665283203, "l2_updates": 1.3635999493999407e-05, "training_loss": 3.2935218811035156, "uptime": 40244.616459021985, "examples_seen": 113920000.0, "progress": 0.9979637055177301, "epoch": 89.81712533163034, "img/sec/core": 189.33137839400513, "core_hours_Tesla V100-SXM2-32GB": 166.9147854265338, "core_hours": 166.9147854265338}
{"step": 111300, "global_schedule": 7.599592208862305e-06, "l2_grads": 2.5865957736968994, "l2_params": 243.8650665283203, "l2_updates": 8.269284990092274e-06, "training_loss": 2.3291730880737305, "uptime": 40261.499052712985, "examples_seen": 113971200.0, "progress": 0.998412228531446, "epoch": 89.8574925789704, "img/sec/core": 189.54433534143158, "core_hours_Tesla V100-SXM2-32GB": 166.98981917627154, "core_hours": 166.98981917627154}
{"step": 111350, "global_schedule": 3.933906555175781e-06, "l2_grads": 2.772751808166504, "l2_params": 243.8650665283203, "l2_updates": 4.337869540904649e-06, "training_loss": 1.7260043621063232, "uptime": 40278.42205399298, "examples_seen": 114022400.0, "progress": 0.9988607515451617, "epoch": 89.89785982631045, "img/sec/core": 189.09175429671245, "core_hours_Tesla V100-SXM2-32GB": 167.06503251529375, "core_hours": 167.06503251529375}
{"step": 111400, "global_schedule": 1.4603137969970703e-06, "l2_grads": 2.8552799224853516, "l2_params": 243.8650665283203, "l2_updates": 1.5939856439217692e-06, "training_loss": 1.484585165977478, "uptime": 40295.30502566899, "examples_seen": 114073600.0, "progress": 0.9993092745588776, "epoch": 89.93822707365051, "img/sec/core": 189.54009172137552, "core_hours_Tesla V100-SXM2-32GB": 167.1400679449649, "core_hours": 167.1400679449649}
{"step": 111450, "global_schedule": 1.7881393432617188e-07, "l2_grads": 2.8130269050598145, "l2_params": 243.8650665283203, "l2_updates": 1.9414073904044926e-07, "training_loss": 1.464487910270691, "uptime": 40312.210767543, "examples_seen": 114124800.0, "progress": 0.9997577975725934, "epoch": 89.97859432099058, "img/sec/core": 189.28480180565765, "core_hours_Tesla V100-SXM2-32GB": 167.21520457551608, "core_hours": 167.21520457551608}
{"step": 111477, "global_schedule": 0.0, "l2_grads": 2.7761971950531006, "l2_params": 243.8650665283203, "l2_updates": 0.0, "training_loss": 1.9388941526412964, "uptime": 40321.33443206595, "examples_seen": 114152448.0, "progress": 1.0, "epoch": 90.0003926345542, "img/sec/core": 189.39758204098095, "core_hours_Tesla V100-SXM2-32GB": 167.25575419561807, "core_hours": 167.25575419561807, "minival/prec@1": 0.796206681236341, "minival/loss": 0.8044125226152118, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.9191585459630005, "real/prec@1": 0.8305826590089033, "real/loss": 1.6087570511327849, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.247990734002087, "train/prec@1": 0.8532958669944971, "train/loss": 0.5569656727553409, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.5439004030195065, "v2/prec@1": 0.643, "v2/loss": 1.549887353515625, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3465950989630073, "val/prec@1": 0.76534, "val/loss": 0.9323522973632813, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.37488137499895}
{"step": 111477, "global_schedule": 0.0, "l2_grads": 2.7761971950531006, "l2_params": 243.8650665283203, "l2_updates": 0.0, "training_loss": 1.9388941526412964, "uptime": 40321.33443206595, "examples_seen": 114152448.0, "progress": 1.0, "epoch": 90.0003926345542, "img/sec/core": 189.39758204098095, "core_hours_Tesla V100-SXM2-32GB": 167.25575419561807, "core_hours": 167.25575419561807, "minival/prec@1": 0.796206681236341, "minival/loss": 0.8044125226152118, "minival/sample count": 12812.0, "minival/attn_weight_avg": [13312, 12, 281], "minival/attn_mag": [13312, 12, 281], "minival/before_mlp": [13312, 12, 281], "z/secs/eval/minival": 2.9191585459630005, "real/prec@1": 0.8305826590089033, "real/loss": 1.6087570511327849, "real/sample count": 46837.0, "real/attn_weight_avg": [50176, 12, 281], "real/attn_mag": [50176, 12, 281], "real/before_mlp": [50176, 12, 281], "z/secs/eval/real": 11.247990734002087, "train/prec@1": 0.8532958669944971, "train/loss": 0.5569656727553409, "train/sample count": 25623.0, "train/attn_weight_avg": [26624, 12, 281], "train/attn_mag": [26624, 12, 281], "train/before_mlp": [26624, 12, 281], "z/secs/eval/train": 6.5439004030195065, "v2/prec@1": 0.643, "v2/loss": 1.549887353515625, "v2/sample count": 10000.0, "v2/attn_weight_avg": [10240, 12, 281], "v2/attn_mag": [10240, 12, 281], "v2/before_mlp": [10240, 12, 281], "z/secs/eval/v2": 3.3465950989630073, "val/prec@1": 0.76534, "val/loss": 0.9323522973632813, "val/sample count": 50000.0, "val/attn_weight_avg": [50176, 12, 281], "val/attn_mag": [50176, 12, 281], "val/before_mlp": [50176, 12, 281], "z/secs/eval/val": 12.37488137499895}
