---
# Flat mapping of scalar settings. The key names suggest model
# hyperparameters -- NOTE(review): confirm against the code that loads this.
#
# Booleans use the canonical lowercase spelling (true/false) so that they
# resolve to real booleans regardless of the YAML schema the loader applies.

# Integer settings; presumably hidden feature width and layer count.
hidden_dim: 16
num_layers: 3

# Float coefficients; their exact meaning is defined by the consuming code.
alpha: 0.4
beta: 0.0

# Boolean switches.
symmetric_norm: false
bias: true

# Presumably a dropout probability, with 0.0 disabling it -- TODO confirm.
dropout: 0.0

# Boolean switches.
len_readout: false
softmax_and_scale: false