{"val": {"loss": 0.00036674769152966746, "accuracy": 0.999755859375, "attn_entropy": 0.3981069028377533, "param_norm": 235.51893659429953}, "train": {"loss": 0.0027433261275291443, "accuracy": 0.998046875, "attn_entropy": 0.3016260266304016, "param_norm": 235.5181532775788}, "step": 113050, "lr": 0.001, "wd_logits_norm": 9.356204986572266, "wd_probs_nonorm": 4.844634532928467, "_runtime": 3942, "_timestamp": 1768293962, "_step": 11304}