{"val": {"loss": 8.833534717559814, "accuracy": 0.02978515625, "attn_entropy": 0.22954047285020351, "param_norm": 140.96513990104253}, "train": {"loss": 0.15339849889278412, "accuracy": 0.962890625, "attn_entropy": 0.13352176547050476, "param_norm": 140.96314438757972}, "step": 4000, "lr": 0.001, "_runtime": 132, "_timestamp": 1768206824, "_step": 399}