---
# Flat mapping of settings identified by `name: gtrxl`.
# NOTE(review): the meaning of each key is defined by whatever code loads
# this file, which is not visible here — confirm semantics against that
# consumer before changing any value.

name: gtrxl

# Integer size/count settings.
# NOTE(review): head_dim * head_num = 256, whereas embedding_dim = 128.
# Confirm the consumer does not require these to be equal.
head_dim: 64
embedding_dim: 128
head_num: 4
mlp_num: 2
layer_num: 4

# Float-valued settings (written with an explicit fractional part so the
# type is obvious to readers and to every YAML parser).
dropout_ratio: 0.0
gru_bias: 2.0

# Integer length and boolean flag.
# NOTE(review): presumably these control memory size and state reset at
# episode end — verify against the consumer.
memory_len: 128
reset_hidden_on_terminate: true