# Flat configuration mapping: one string, one single-element list, four
# integers and one float. The code that consumes this file is not visible
# here, so the per-key notes below are inferred from key names only and
# should be confirmed against the loader.

# String identifier for this configuration.
# NOTE(review): presumably the run/experiment name — confirm.
run: kla
# List containing the single integer -1.
# NOTE(review): presumably indices of the blocks that use "kla", with -1
# meaning the last block (negative indexing) — confirm against the consumer.
kla_blocks: [-1]
# NOTE(review): presumably the number of blocks/layers in the model — confirm.
depth: 6
# NOTE(review): presumably the model's hidden/embedding width — confirm.
model_dim: 576
# Written as a float (5.0), unlike the integer settings in this file.
# NOTE(review): presumably a gradient-clipping threshold; whether it applies
# to the gradient norm or to individual values is not shown here — confirm.
grad_clip: 5.0
# NOTE(review): presumably the batch size per device, not the global batch
# size — confirm.
device_batch_size: 8
# NOTE(review): presumably the size of an internal state dimension; which
# component it applies to is not shown here — confirm.
d_state: 32