{"val": {"loss": 0.0007045516222766706, "accuracy": 0.999755859375, "attn_entropy": 0.38824325799942017, "param_norm": 553.1123676094625}, "train": {"loss": 1.3271334253772693e-08, "accuracy": 1.0, "attn_entropy": 0.2726950440555811, "param_norm": 553.1122489447353}, "step": 1000000, "lr": 0.001, "wd_logits_norm": 1.8041890859603882, "wd_probs_nonorm": 0.5363960266113281, "_runtime": 32539, "_timestamp": 1768315928, "_step": 99999}