{"val": {"loss": 0.0, "accuracy": 1.0, "attn_entropy": 0.39023988228291273, "param_norm": 534.5306808533325}, "train": {"loss": 4.889437299482324e-09, "accuracy": 1.0, "attn_entropy": 0.27094303350895643, "param_norm": 534.5305925744348}, "step": 1000000, "lr": 0.001, "wd_logits_norm": 1.8364888429641724, "wd_probs_nonorm": 0.4649021327495575, "mse_logits_norm": 0.0005738960462622344, "mse_probs_nonorm": 1.7231550373253413e-05, "sharp_base_loss": 0.01295624952763319, "sharp_pert_loss": 2.8428248697309755e-05, "sharpness": -0.012927820906043053, "asharp_base_loss": 2.2118822329275645e-08, "asharp_pert_loss": 2.3283062977608182e-10, "adaptive_sharpness": -2.1885991685621775e-08, "_runtime": 45121, "_timestamp": 1768415085, "_step": 99999}