{"val": {"loss": 8.789530396461487, "accuracy": 0.01611328125, "attn_entropy": 0.1776451924815774, "param_norm": 137.780514235867}, "train": {"loss": 0.5489798188209534, "accuracy": 0.84375, "attn_entropy": 0.07568081095814705, "param_norm": 137.77730333103182}, "step": 2060, "lr": 0.001, "wd_logits_norm": 2.5295088291168213, "wd_probs_nonorm": 0.302566796541214, "wd_mse_logits": 2.429990672681015e-06, "wd_mse_probs": 1.1341542176523944e-06, "_runtime": 71, "_timestamp": 1768282568, "_step": 205}