# Hyperparameter configuration: a flat mapping of scalar values.
# NOTE(review): the per-key meanings noted below are inferred from the key
# names only - confirm against the code that consumes this file.
#
# Floats in exponent form are written with an explicit decimal point
# (1.0e-3, not 1e-3). YAML 1.1 loaders such as PyYAML resolve a dotless
# "1e-3" as a string, while the dotted form is a float under both
# YAML 1.1 and YAML 1.2.
epochs: 2000
lr: 1.0e-3  # presumably the learning rate - TODO confirm
wd: 1.0e-6  # presumably weight decay - TODO confirm
hid_dim: 1024  # presumably the hidden dimension - TODO confirm
num_layer: 2
dropout: 0.1
order: 5
alpha: 0.002
beta: 1.0e-6
use_bn: false  # presumably toggles batch normalization - TODO confirm
