{"val": {"loss": 6.869445860385895, "accuracy": 0.014892578125, "attn_entropy": 0.18435228522866964, "param_norm": 129.49712856165272}, "train": {"loss": 2.8557140827178955, "accuracy": 0.259765625, "attn_entropy": 0.08549594506621361, "param_norm": 129.48712824249128}, "step": 740, "lr": 0.001, "_runtime": 29, "_timestamp": 1768222729, "_step": 73}