# Flat key/value settings; the names suggest hyperparameters for a model
# training run. The code that consumes these keys is not visible here, so the
# per-key notes below are inferred from the key names and should be confirmed
# against the loader.

# Plain (unquoted) scalar; YAML resolves it to the string "gpt".
# NOTE(review): presumably a run name or model-family selector -- confirm.
run: gpt
# Integer.
# NOTE(review): presumably the number of stacked layers/blocks -- confirm.
depth: 12
# Integer.
# NOTE(review): presumably the model's hidden (embedding) width -- confirm.
model_dim: 768
# Float (decimal notation, so it is not read as a string by YAML loaders).
# NOTE(review): presumably the learning rate applied to the unembedding
# (output projection) parameters -- confirm how the optimizer uses it.
unembedding_lr: 0.002