---
# Configuration values.
# NOTE(review): the code that reads these keys is not part of this file, so
# the comments below record only what the values themselves show.

# Options: linear, cosine, exponential.
scaling_type: cosine
# Integer value. NOTE(review): unit (epochs? steps?) is not stated here —
# confirm against the consumer.
scaling_length: 40
# Float value.
base_scaling: 0.5
# NOTE(review): the other accepted values for `mode` are not listed in this
# file — confirm against the consumer.
mode: post_decay
# Options: default, mem.
opt_mode: default
# Float value, written with an explicit fractional digit so that it reads
# unambiguously as a float.
drop_weight: 1.0