# Flat run configuration: a single top-level mapping of scalar settings plus
# one single-element list. The meaning of each key is defined by the code that
# loads this file, which is not visible here; notes marked "presumably" are
# assumptions that should be confirmed against that loader.

# Run identifier (presumably selects or labels the "kla" experiment).
run: kla
# Single-element list holding -1.
# NOTE(review): presumably block indices, with -1 meaning "last" -- confirm.
kla_blocks: [-1]
# Presumably the number of layers/blocks in the model -- confirm.
depth: 6
# Presumably the model's hidden width -- confirm.
model_dim: 288
# Presumably the gradient-clipping threshold -- confirm norm vs. value.
grad_clip: 5.0
# Presumably the per-device batch size -- confirm.
device_batch_size: 16
# Presumably a state-size setting for the blocks listed above -- confirm.
d_state: 32