{"val": {"loss": 0.44339820370078087, "accuracy": 0.900146484375, "attn_entropy": 0.3766599502414465, "param_norm": 139.74908301711778}, "train": {"loss": 0.0011605136096477509, "accuracy": 1.0, "attn_entropy": 0.2858882248401642, "param_norm": 139.7493560416632}, "step": 26250, "lr": 0.001, "_runtime": 806, "_timestamp": 1768224128, "_step": 2624}