{"val": {"loss": 7.86424320936203, "accuracy": 0.01513671875, "attn_entropy": 0.17728931177407503, "param_norm": 134.71565524544937}, "train": {"loss": 1.179461121559143, "accuracy": 0.6328125, "attn_entropy": 0.07697425223886967, "param_norm": 134.70934723266225}, "step": 1370, "lr": 0.001, "wd_logits_norm": 1.8110212087631226, "wd_probs_nonorm": 0.18155476450920105, "wd_mse_logits": 2.3626192557912873e-07, "wd_mse_probs": 4.425772193172861e-09, "_runtime": 57, "_timestamp": 1768282406, "_step": 136}