{"val": {"loss": 5.760124504566193, "accuracy": 0.00927734375, "attn_entropy": 0.22605826705694199, "param_norm": 125.03891259998976}, "train": {"loss": 3.9578676223754883, "accuracy": 0.099609375, "attn_entropy": 0.13624094426631927, "param_norm": 125.02807780437756}, "step": 300, "lr": 0.001, "_runtime": 18, "_timestamp": 1768222416, "_step": 29}