{"val": {"loss": 7.987583041191101, "accuracy": 0.078369140625, "attn_entropy": 0.1984279165044427, "param_norm": 150.17725720711596}, "train": {"loss": 0.08729967474937439, "accuracy": 0.98046875, "attn_entropy": 0.1015399694442749, "param_norm": 150.176345248434}, "step": 8910, "lr": 0.001, "wd_logits_norm": 8.080695152282715, "wd_probs_nonorm": 3.1078529357910156, "mse_logits_norm": 4.964450454281177e-06, "mse_probs_nonorm": 2.1440313503262587e-05, "_runtime": 309, "_timestamp": 1768291514, "_step": 890}