{"baseline": [{"Nstr": 30, "N": 30482560, "final_loss": 3.094648599624634, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.422644853591919, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.300395965576172, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2116122245788574, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.145786762237549, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.0576882362365723, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.141568899154663, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.9344751834869385, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0143134593963623, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.069868803024292, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.969404458999634, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.2368013858795166, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8753557205200195, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.9417505264282227, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.0295932292938232, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.7905032634735107, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.826296329498291, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.7641658782958984, "D": 79999795200, "D/N": 778.3757933226394, "bops": 8222207431095091200, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 200, "N": 203188480, "final_loss": 2.706197738647461, "D": 19999752192, "D/N": 98.4295575812172, "bops": 4063719248269148160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 200, "N": 203188480, "final_loss": 2.7603962421417236, "D": 9999745024, "D/N": 49.21413371466729, "bops": 2031832991814123520, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 200, "N": 203188480, "final_loss": 2.835095167160034, "D": 4999872512, "D/N": 24.607066857333646, "bops": 1015916495907061760, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}], "quartetv2": [{"Nstr": 30, "N": 30482560, "final_loss": 3.464682102203369, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.3560855388641357, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2760660648345947, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2775633335113525, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.358584403991699, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.4671096801757812, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.3558027744293213, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.277818441390991, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.4671852588653564, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.221118211746216, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2210140228271484, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.221705436706543, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1788344383239746, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.178684949874878, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1815905570983887, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.142542839050293, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.145017385482788, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.286261796951294, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1419498920440674, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.197173833847046, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.197732448577881, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.2868475914001465, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.2862613201141357, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.1980056762695312, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0823986530303955, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.045940637588501, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.043384552001953, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.133361339569092, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0860140323638916, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0434563159942627, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.1321561336517334, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.082204818725586, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.131696939468384, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.0776307582855225, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.079343557357788, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.076704740524292, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.9987685680389404, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.9972329139709473, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.936558246612549, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.9368081092834473, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.996840238571167, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": true, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.470503091812134, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.286280632019043, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.3579843044281006, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.1984336376190186, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.134171724319458, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1465883255004883, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2789955139160156, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.89430832862854, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1824800968170166, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.000063180923462, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.0792887210845947, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.939328908920288, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.046738624572754, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2232799530029297, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0853261947631836, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.465620517730713, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1325573921203613, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 50, "N": 49556736, "final_loss": 3.192169189453125, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2117860317230225, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 50, "N": 49556736, "final_loss": 3.27919602394104, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1692769527435303, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2707111835479736, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 30, "N": 30482560, "final_loss": 3.351400852203369, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 50, "N": 49556736, "final_loss": 3.12511682510376, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0765011310577393, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0360848903656006, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 100, "N": 102777856, "final_loss": 2.989828586578369, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 100, "N": 102777856, "final_loss": 2.928170919418335, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 100, "N": 102777856, "final_loss": 3.0715646743774414, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 50, "N": 49556736, "final_loss": 3.001070499420166, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8818650245666504, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 200, "N": 203188480, "final_loss": 2.882150411605835, "D": 4999872512, "D/N": 24.607066857333646, "bops": 1015916495907061760, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 200, "N": 203188480, "final_loss": 2.876581907272339, "D": 4999872512, "D/N": 24.607066857333646, "bops": 1015916495907061760, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 200, "N": 203188480, "final_loss": 2.811300754547119, "D": 9999745024, "D/N": 49.21413371466729, "bops": 2031832991814123520, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 200, "N": 203188480, "final_loss": 2.8044638633728027, "D": 9999745024, "D/N": 49.21413371466729, "bops": 2031832991814123520, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 200, "N": 203188480, "final_loss": 2.7574398517608643, "D": 19999752192, "D/N": 98.4295575812172, "bops": 4063719248269148160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 200, "N": 203188480, "final_loss": 2.75141978263855, "D": 19999752192, "D/N": 98.4295575812172, "bops": 4063719248269148160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 50, "N": 49556736, "final_loss": 3.007532119750977, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8906264305114746, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8452205657958984, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 100, "N": 102777856, "final_loss": 2.853060245513916, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.826075553894043, "D": 79999795200, "D/N": 778.3757933226394, "bops": 8222207431095091200, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8182222843170166, "D": 79999795200, "D/N": 778.3757933226394, "bops": 8222207431095091200, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "quartet_v2", "shadamard_dim": 128, "sdelayed_amax": false, "sfour_over_six": true}], "nvidia": [{"Nstr": 30, "N": 30482560, "final_loss": 3.290322542190552, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.197742462158203, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0641720294952393, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.162240743637085, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.4774208068847656, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.236245393753052, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.1489508152008057, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.1006648540496826, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.21018648147583, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.3688344955444336, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.294499158859253, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.948164701461792, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.0075933933258057, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.086474657058716, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.4791834354400635, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2865312099456787, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2330589294433594, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 30, "N": 30482560, "final_loss": 3.366539001464844, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 50, "N": 49556736, "final_loss": 3.2065553665161133, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 50, "N": 49556736, "final_loss": 3.2921717166900635, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0950376987457275, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 50, "N": 49556736, "final_loss": 3.1429572105407715, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0575411319732666, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 30, "N": 30482560, "final_loss": 3.192119836807251, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1577537059783936, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 100, "N": 102777856, "final_loss": 3.081406831741333, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 100, "N": 102777856, "final_loss": 2.9434187412261963, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 100, "N": 102777856, "final_loss": 3.0020065307617188, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 100, "N": 102777856, "final_loss": 2.900766372680664, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 50, "N": 49556736, "final_loss": 3.023688554763794, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 100, "N": 102777856, "final_loss": 2.900766372680664, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 100, "N": 102777856, "final_loss": 2.865172863006592, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 200, "N": 203188480, "final_loss": 2.82003116607666, "D": 9999745024, "D/N": 49.21413371466729, "bops": 2031832991814123520, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 200, "N": 203188480, "final_loss": 2.819159507751465, "D": 9999745024, "D/N": 49.21413371466729, "bops": 2031832991814123520, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 200, "N": 203188480, "final_loss": 2.8879354000091553, "D": 4999872512, "D/N": 24.607066857333646, "bops": 1015916495907061760, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 200, "N": 203188480, "final_loss": 2.889244079589844, "D": 4999872512, "D/N": 24.607066857333646, "bops": 1015916495907061760, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 200, "N": 203188480, "final_loss": 2.7657861709594727, "D": 19999752192, "D/N": 98.4295575812172, "bops": 4063719248269148160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 200, "N": 203188480, "final_loss": 2.7677061557769775, "D": 19999752192, "D/N": 98.4295575812172, "bops": 4063719248269148160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.029185056686402, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.870213031768799, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.9053211212158203, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8383898735046387, "D": 79999795200, "D/N": 778.3757933226394, "bops": 8222207431095091200, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": true}, {"Nstr": 100, "N": 102777856, "final_loss": 2.844137668609619, "D": 79999795200, "D/N": 778.3757933226394, "bops": 8222207431095091200, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "nvidia", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}], "tetrajetv2": [{"Nstr": 30, "N": 30482560, "final_loss": 3.476752281188965, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "tetrajetv2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2253119945526123, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "tetrajetv2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.364501953125, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "tetrajetv2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.182234048843384, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "tetrajetv2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2830967903137207, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "tetrajetv2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.2016170024871826, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "tetrajetv2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.293308973312378, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "tetrajetv2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.1366467475891113, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "tetrajetv2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.145180940628052, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "tetrajetv2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.086511611938477, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "tetrajetv2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.046967029571533, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "tetrajetv2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 200, "N": 203188480, "final_loss": 2.8168699741363525, "D": 9999745024, "D/N": 49.21413371466729, "bops": 2031832991814123520, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "tetrajetv2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 200, "N": 203188480, "final_loss": 2.887484073638916, "D": 4999872512, "D/N": 24.607066857333646, "bops": 1015916495907061760, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "tetrajetv2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.0849921703338623, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "tetrajetv2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8941829204559326, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "tetrajetv2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.940826177597046, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "tetrajetv2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.0034255981445312, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "tetrajetv2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.010661363601685, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "tetrajetv2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.855395793914795, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "tetrajetv2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 200, "N": 203188480, "final_loss": 2.760930061340332, "D": 19999752192, "D/N": 98.4295575812172, "bops": 4063719248269148160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "tetrajetv2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8272135257720947, "D": 79999795200, "D/N": 778.3757933226394, "bops": 8222207431095091200, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": "tetrajetv2", "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}], "backward_main": [{"Nstr": 30, "N": 30482560, "final_loss": 3.14717960357666, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.4236550331115723, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.0584535598754883, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.0957956314086914, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.3023085594177246, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.211033582687378, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.3039205074310303, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1514737606048584, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.30556058883667, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2161495685577393, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.149941682815552, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.429147481918335, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.4225423336029053, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.0626771450042725, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.062796115875244, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.100515842437744, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.214488983154297, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.099712371826172, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.9771223068237305, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.943992853164673, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.881844997406006, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8315422534942627, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.2378125190734863, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.9404962062835693, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.9484994411468506, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0155985355377197, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.143071413040161, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.035578966140747, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.1465868949890137, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8764898777008057, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.975815534591675, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.82816743850708, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8804004192352295, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0188562870025635, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.2405669689178467, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0711803436279297, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.971205234527588, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.2410964965820312, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.145210027694702, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8332557678222656, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.935039520263672, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.9405951499938965, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.021128416061402, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.075317621231079, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.07372784614563, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.034154176712036, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.031686544418335, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.946883201599121, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8871328830718994, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.9353601932525635, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.068239212036133, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.078404188156128, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.978870153427124, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.971548557281494, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.3089001178741455, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.024817705154419, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1055262088775635, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.4292991161346436, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.15277099609375, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.437592029571533, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.9450314044952393, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.220566987991333, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.3039159774780273, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.157106399536133, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.042901515960694, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1548361778259277, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8362395763397217, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.033780336380005, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.14848256111145, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.0969202518463135, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8340203762054443, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.03847599029541, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.066047430038452, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.884263753890991, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.82828950881958, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.222574472427368, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.144470453262329, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.31190824508667, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2128241062164307, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.2454993724823, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.9519028663635254, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.9412097930908203, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.2484734058380127, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.4290435314178467, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.240612030029297, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.072706699371338, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.1502904891967773, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1033663749694824, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.023191213607788, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.980637311935425, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.954716444015503, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.877833604812622, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.08113169670105, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.0588409900665283, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.9427192211151123, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.7994275093078613, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.799285411834717, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.7914083003997803, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.7918527126312256, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.772299289703369, "D": 79999795200, "D/N": 778.3757933226394, "bops": 8222207431095091200, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.795973300933838, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.798012971878052, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.766477584838867, "D": 79999795200, "D/N": 778.3757933226394, "bops": 8222207431095091200, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.7666401863098145, "D": 79999795200, "D/N": 778.3757933226394, "bops": 8222207431095091200, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "EW_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.7727742195129395, "D": 79999795200, "D/N": 778.3757933226394, "bops": 8222207431095091200, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.799295663833618, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.7723090648651123, "D": 79999795200, "D/N": 778.3757933226394, "bops": 8222207431095091200, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.799436569213867, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.7710025310516357, "D": 79999795200, "D/N": 778.3757933226394, "bops": 8222207431095091200, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.7707183361053467, "D": 79999795200, "D/N": 778.3757933226394, "bops": 8222207431095091200, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)Q(Wt)t_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}], "backward_quartet": [{"Nstr": 50, "N": 49556736, "final_loss": 3.2512474060058594, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 32, "bscale_dtype": "e8m0", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.982647180557251, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 32, "bscale_dtype": "e8m0", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.154787540435791, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 32, "bscale_dtype": "e8m0", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2181217670440674, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "no", "bgroup_dim": 32, "bscale_dtype": "e8m0", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.306372880935669, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "no", "bgroup_dim": 32, "bscale_dtype": "e8m0", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.4295248985290527, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "no", "bgroup_dim": 32, "bscale_dtype": "e8m0", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.978055000305176, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "no", "bgroup_dim": 32, "bscale_dtype": "e8m0", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.026157855987549, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 32, "bscale_dtype": "e8m0", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.147644281387329, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "no", "bgroup_dim": 32, "bscale_dtype": "e8m0", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.065319776535034, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "no", "bgroup_dim": 32, "bscale_dtype": "e8m0", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.067539691925049, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 32, "bscale_dtype": "e8m0", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.3154637813568115, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 32, "bscale_dtype": "e8m0", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.225132465362549, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 32, "bscale_dtype": "e8m0", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.4380767345428467, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 32, "bscale_dtype": "e8m0", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.077005624771118, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "no", "bgroup_dim": 32, "bscale_dtype": "e8m0", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.107239007949829, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 32, "bscale_dtype": "e8m0", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1530821323394775, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "no", "bgroup_dim": 32, "bscale_dtype": "e8m0", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1592681407928467, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 32, "bscale_dtype": "e8m0", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1011974811553955, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "no", "bgroup_dim": 32, "bscale_dtype": "e8m0", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.245579481124878, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "no", "bgroup_dim": 32, "bscale_dtype": "e8m0", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.083735704421997, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "sr", "bgroup_dim": 32, "bscale_dtype": "e8m0", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0208113193511963, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "EdenSRQuantizer", "bunbiased": "no", "bgroup_dim": 32, "bscale_dtype": "e8m0", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}], "forward_quartet": [{"Nstr": 30, "N": 30482560, "final_loss": 3.2953100204467773, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1843254566192627, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.478809356689453, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.374760627746582, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.244227170944214, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.17134690284729, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.206448554992676, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2174723148345947, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.3048572540283203, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.256196975708008, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.480828285217285, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.369927167892456, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.221442461013794, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0834429264068604, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.097179412841797, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.211829662322998, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.0233805179595947, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.084794282913208, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.304115056991577, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.1055798530578613, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.967468500137329, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.162126302719116, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.9516122341156006, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.926034450531006, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.897888422012329, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8780386447906494, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0384745597839355, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.910367012023926, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.070894241333008, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.2975001335144043, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.151287317276001, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.0081334114074707, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.1172194480895996, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0533621311187744, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8822717666625977, "D": 79999795200, "D/N": 778.3757933226394, "bops": 8222207431095091200, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8641602993011475, "D": 79999795200, "D/N": 778.3757933226394, "bops": 8222207431095091200, "fquant": null, "fsquare": null, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}], "orig_albert_tseng": [{"Nstr": 30, "N": 30482560, "final_loss": 3.3145620822906494, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": true, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1590945720672607, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": true, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.4293954372406006, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": false, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2253801822662354, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": true, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2197394371032715, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": false, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1078174114227295, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": true, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.3081583976745605, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": false, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.156450033187866, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": false, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.4344327449798584, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": true, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.1556155681610107, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": true, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.981428384780884, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": true, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0833544731140137, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": true, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0775649547576904, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": false, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.022575855255127, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": false, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1074328422546387, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": false, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.0703084468841553, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": true, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.070957660675049, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": false, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.1502087116241455, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": false, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.026327133178711, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": true, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.9452707767486572, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": true, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.9809160232543945, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": false, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.2535014152526855, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": true, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.245069980621338, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": false, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.948781728744507, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": false, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}], "fixed_albert_tseng": [{"Nstr": 30, "N": 30482560, "final_loss": 3.1083950996398926, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": true, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2176103591918945, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": false, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.43758773803711, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": true, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.0676815509796143, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": true, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.306640148162842, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": false, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.4292681217193604, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": false, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.0646913051605225, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": false, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1532251834869385, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": false, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2238283157348633, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": true, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.315854549407959, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": true, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.100947618484497, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": false, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1594414710998535, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "AlbertTsengQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": true, "bhadamard_dim": 32, "bbackward_scheme": "Q(E)Q(Wt)t_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}], "forward_main": [{"Nstr": 30, "N": 30482560, "final_loss": 3.359827756881714, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2725658416748047, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.4632062911987305, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.3512837886810303, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.466763496398926, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.281914472579956, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.226288318634033, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1770193576812744, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1854748725891113, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.150405168533325, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2175004482269287, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1400256156921387, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.371548652648926, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2355496883392334, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.4764294624328613, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1607940196990967, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.195631504058838, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2889280319213867, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.2014734745025635, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.2817375659942627, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.281924247741699, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.287883758544922, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.2890546321868896, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.2056779861450195, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.1280221939086914, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.1427135467529297, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0548388957977295, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0924575328826904, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0967886447906494, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.133340120315552, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.086756944656372, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0389442443847656, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.04927396774292, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0057973861694336, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.077190399169922, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.071728229522705, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0786561965942383, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.0039403438568115, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.992748737335205, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8490400314331055, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.077626943588257, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.997748613357544, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8860692977905273, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8585164546966553, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.869313955307007, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.896341562271118, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.9405031204223633, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.0833539962768555, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.893495559692383, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.937530040740967, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.9460713863372803, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8606362342834473, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0610599517822266, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.198115110397339, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.9977829456329346, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.281080961227417, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.228083372116089, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.3575477600097656, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1887030601501465, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1539175510406494, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.4716920852661133, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.931328296661377, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8490400314331055, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.020294666290283, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.140286445617676, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.869313955307007, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8342580795288086, "D": 79999795200, "D/N": 778.3757933226394, "bops": 8222207431095091200, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8235464096069336, "D": 79999795200, "D/N": 778.3757933226394, "bops": 8222207431095091200, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.833904266357422, "D": 79999795200, "D/N": 778.3757933226394, "bops": 8222207431095091200, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.844683885574341, "D": 79999795200, "D/N": 778.3757933226394, "bops": 8222207431095091200, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 16, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2718117237091064, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": false, "fscale_override": 0.92, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.140223264694214, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": false, "fscale_override": 0.92, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.216834306716919, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": false, "fscale_override": 0.92, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.468132495880127, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": false, "fscale_override": 0.92, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.35412073135376, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": false, "fscale_override": 0.92, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.174133539199829, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": false, "fscale_override": 0.92, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.194190263748169, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": false, "fscale_override": 0.92, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.0709452629089355, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": false, "fscale_override": 0.92, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.931570053100586, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": false, "fscale_override": 0.92, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.1292099952697754, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": false, "fscale_override": 0.92, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0404577255249023, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": false, "fscale_override": 0.92, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0806243419647217, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": false, "fscale_override": 0.92, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.991671085357666, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": false, "fscale_override": 0.92, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8867645263671875, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": false, "fscale_override": 0.92, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.281628370285034, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": false, "fscale_override": 0.92, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 200, "N": 203188480, "final_loss": 2.88187837600708, "D": 4999872512, "D/N": 24.607066857333646, "bops": 1015916495907061760, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 200, "N": 203188480, "final_loss": 2.812971353530884, "D": 9999745024, "D/N": 49.21413371466729, "bops": 2031832991814123520, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 200, "N": 203188480, "final_loss": 2.876657247543335, "D": 4999872512, "D/N": 24.607066857333646, "bops": 1015916495907061760, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 200, "N": 203188480, "final_loss": 2.8056671619415283, "D": 9999745024, "D/N": 49.21413371466729, "bops": 2031832991814123520, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 200, "N": 203188480, "final_loss": 2.759415864944458, "D": 19999752192, "D/N": 98.4295575812172, "bops": 4063719248269148160, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 200, "N": 203188480, "final_loss": 2.7555251121520996, "D": 19999752192, "D/N": 98.4295575812172, "bops": 4063719248269148160, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.19423508644104, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": false, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.148790121078491, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2237234115600586, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.4676053524017334, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.347118377685547, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.166105270385742, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.129774808883667, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.267388343811035, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.35609769821167, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.208700180053711, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1834096908569336, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2775824069976807, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.460808277130127, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.1983091831207275, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.2764177322387695, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.087726593017578, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.014953851699829, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.1219239234924316, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0720629692077637, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.99721097946167, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.1353907585144043, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.049926280975342, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.1878066062927246, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.2832565307617188, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.032531976699829, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.065337896347046, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.934708833694458, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.0733160972595215, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8771021366119385, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.992365598678589, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.923654556274414, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.9849345684051514, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8923535346984863, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 200, "N": 203188480, "final_loss": 2.7572834491729736, "D": 19999752192, "D/N": 98.4295575812172, "bops": 4063719248269148160, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 200, "N": 203188480, "final_loss": 2.8098878860473633, "D": 9999745024, "D/N": 49.21413371466729, "bops": 2031832991814123520, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 200, "N": 203188480, "final_loss": 2.870790719985962, "D": 4999872512, "D/N": 24.607066857333646, "bops": 1015916495907061760, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 200, "N": 203188480, "final_loss": 2.7993154525756836, "D": 9999745024, "D/N": 49.21413371466729, "bops": 2031832991814123520, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 200, "N": 203188480, "final_loss": 2.74516224861145, "D": 19999752192, "D/N": 98.4295575812172, "bops": 4063719248269148160, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 200, "N": 203188480, "final_loss": 2.8792433738708496, "D": 4999872512, "D/N": 24.607066857333646, "bops": 1015916495907061760, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8408844470977783, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.856022834777832, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8136942386627197, "D": 79999795200, "D/N": 778.3757933226394, "bops": 8222207431095091200, "fquant": null, "fsquare": false, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.828745603561402, "D": 79999795200, "D/N": 778.3757933226394, "bops": 8222207431095091200, "fquant": null, "fsquare": true, "fscale_override": 1, "fhadamard_dim": 1, "ffour_over_six": true, "bquant": "NoQuantizer", "bunbiased": null, "bgroup_dim": null, "bscale_dtype": null, "bscale_override": 1.0, "bstochastic": null, "bhadamard_dim": null, "bbackward_scheme": "EW_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}], "bnrq": [{"Nstr": 30, "N": 30482560, "final_loss": 3.096776247024536, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.424395799636841, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.4239675998687744, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 1, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.305964946746826, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 1, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.214934825897217, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 1, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.211680173873902, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.060066938400269, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.3014211654663086, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.147437572479248, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.1430656909942627, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.877295970916748, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.828089952468872, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.071665525436402, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.9714174270629883, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.031135320663452, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.9356863498687744, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.017094373703003, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.943655014038086, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.2383296489715576, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.018542766571045, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 1, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.9474246501922607, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 1, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.973848819732666, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 1, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.099496603012085, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 1, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1505684852600098, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 1, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.2418413162231445, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 1, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.830901622772217, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 1, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8796989917755127, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 1, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.937368392944336, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 1, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.0611441135406494, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 1, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.1454360485076904, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 1, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.0349643230438232, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 1, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0744242668151855, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 1, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.066758155822754, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.309453010559082, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.3038175106048584, "D": 1499987968, "D/N": 49.208070713220934, "bops": 45723473233838080, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.4265987873077393, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2153866291046143, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.153914451599121, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.432594537734986, "D": 749993984, "D/N": 24.604035356610467, "bops": 22861736616919040, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.103125810623169, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.2189149856567383, "D": 2999975936, "D/N": 98.41614142644187, "bops": 91446946467676160, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1529150009155273, "D": 5999951872, "D/N": 196.83228285288374, "bops": 182893892935352320, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.0643458366394043, "D": 23999807488, "D/N": 787.329131411535, "bops": 731575571741409280, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 30, "N": 30482560, "final_loss": 3.1039443016052246, "D": 11999903744, "D/N": 393.6645657057675, "bops": 365787785870704640, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0752663612365723, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.9776041507720947, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8812785148620605, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.834627628326416, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0777857303619385, "D": 4999872512, "D/N": 100.89188505070229, "bops": 247777362110840832, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0226476192474365, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.246126651763916, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8842933177948, "D": 9999745024, "D/N": 97.294742400542, "bops": 1027752354113388544, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.146023750305176, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.951734781265259, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.836305618286133, "D": 19999752192, "D/N": 194.59203538941307, "bops": 2055531650825060352, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.03517746925354, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 3.0399060249328613, "D": 2499805184, "D/N": 24.322410305970966, "bops": 256924617229205504, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.9789178371429443, "D": 19999752192, "D/N": 403.57282997814866, "bops": 991122439444365312, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.939396858215332, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.946449041366577, "D": 4999872512, "D/N": 48.647371200271, "bops": 513876177056694272, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.0214602947235107, "D": 9999745024, "D/N": 201.78377010140457, "bops": 495554724221681664, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.1501221656799316, "D": 2499805184, "D/N": 50.44329763768138, "bops": 123882185554919424, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 3.240478992462158, "D": 1249902592, "D/N": 25.22164881884069, "bops": 61941092777459712, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "eden", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 0.93, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.7943856716156006, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 1, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 50, "N": 49556736, "final_loss": 2.9415249824523926, "D": 39999766528, "D/N": 807.1509497316368, "bops": 1982257869889732608, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.8001198768615723, "D": 39999766528, "D/N": 389.18662136715517, "bops": 4111090244248403968, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 128, "bbackward_scheme": "Q(E)W_Q(Et)Q(Xt)t", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}, {"Nstr": 100, "N": 102777856, "final_loss": 2.768491744995117, "D": 79999795200, "D/N": 778.3757933226394, "bops": 8222207431095091200, "fquant": null, "fsquare": null, "fscale_override": 1.0, "fhadamard_dim": null, "ffour_over_six": false, "bquant": "IsolatedEdenQuantizer", "bunbiased": "sr", "bgroup_dim": 16, "bscale_dtype": "e4m3", "bscale_override": 1, "bstochastic": null, "bhadamard_dim": 1, "bbackward_scheme": "Q(E)W_EtX", "bfour_over_six": false, "sscheme": null, "shadamard_dim": 32, "sdelayed_amax": false, "sfour_over_six": false}]}