{"val": {"loss": 9.739031328948045e-06, "accuracy": 1.0, "attn_entropy": 0.40715221501886845, "param_norm": 236.91243083319654}, "train": {"loss": 0.00016196214710362256, "accuracy": 1.0, "attn_entropy": 0.3122505098581314, "param_norm": 236.91133239298912}, "step": 115460, "lr": 0.001, "wd_logits_norm": 1.552003264427185, "wd_probs_nonorm": 0.4028107523918152, "_runtime": 3708, "_timestamp": 1768287048, "_step": 11545}