{"val": {"loss": 7.559394299983978, "accuracy": 0.003173828125, "attn_entropy": 0.18352288007736206, "param_norm": 130.59298062702638}, "train": {"loss": 2.3372137546539307, "accuracy": 0.337890625, "attn_entropy": 0.09084290638566017, "param_norm": 130.58364973400643}, "step": 870, "lr": 0.001, "_runtime": 86, "_timestamp": 1768206493, "_step": 86}