---
# Numeric hyperparameters, one flat mapping.
# NOTE(review): the per-group descriptions below are inferred from key names
# only; confirm against the code that loads this file.

# Size settings (presumably input, recurrent, and hidden widths).
d_input: 16
d_rnn: 16
d_hidden: 64

# Layer / attention settings (presumably layer count, head count, and the
# query-key and value widths).
n_layers: 3
n_head: 3
d_qk: 8
d_v: 8

# Written as 0.0 so it loads as a float rather than an int.
# Presumably a value of zero disables dropout — TODO confirm.
dropout: 0.0

# Sampling / step settings; their exact semantics are not visible here.
sample_rate: 2
mae_step: 2
mae_e_step: 2