# Flat run configuration: seven top-level keys, no nesting.
# NOTE(review): the loader/schema that consumes this file is not visible here,
# so every remark on meaning below is an assumption to confirm against it.

# Plain string value; presumably the run / experiment name — TODO confirm.
run: gla
# One-element list holding -1; presumably a negative index selecting the last
# block — verify how the consumer interprets negative entries.
gla_blocks: [-1]
# Integer; presumably the number of stacked blocks/layers — TODO confirm.
depth: 12
# Integer; presumably the model's hidden width — TODO confirm.
model_dim: 928
# Integer; presumably a per-block state size — TODO confirm.
d_state: 32
# Float; by its name a learning rate specific to the unembedding (output)
# parameters — confirm which parameter group reads it.
unembedding_lr: 0.002
# Integer; by its name a per-device batch size — units (sequences vs. tokens)
# are not shown here, confirm with the consumer.
device_batch_size: 32