# Hyperparameter set identified by `name: gtrxl`.
# NOTE(review): presumably a Gated Transformer-XL model config; confirm
# against the code that loads this file.
name: gtrxl

# Size settings.
# NOTE(review): head_num * head_dim = 512, which differs from
# embedding_dim = 256; presumably intentional, verify with the consumer.
head_dim: 64
embedding_dim: 256
head_num: 8
mlp_num: 2
layer_num: 8

# Regularisation and gating; both values are floats.
dropout_ratio: 0.0
gru_bias: 2.0

# Memory settings.
# NOTE(review): the unit of memory_len is not stated in this file; confirm.
memory_len: 256
reset_hidden_on_terminate: true