# Model hyperparameters: a flat mapping of scalar settings.
# NOTE(review): the code that consumes this file is not visible here; the
# per-key notes below are inferred from the key names and should be confirmed.

# Presumably the width of the hidden representation -- TODO confirm.
hidden_dim: 16
# Presumably the number of stacked layers -- TODO confirm.
num_layers: 3
# Boolean flag, written in canonical lowercase form.
use_attention: false
# Presumably the attention head count; likely only relevant when
# use_attention is true -- verify against the consumer.
heads: 1
# Boolean flag; presumably toggles bias terms in the layers -- TODO confirm.
bias: true
# Kept as a float literal (0.0, not 0) so the parsed type stays float.
# Presumably a dropout probability -- TODO confirm.
dropout: 0.0