# Optimizer configuration. `type` names the optimizer to use; the remaining
# keys look like its hyperparameters (presumably forwarded as constructor
# keyword arguments -- confirm against the code that loads this file).
type: AdamWScale

lr: 0.0005
# Two-element coefficient pair, kept as a sequence.
betas:
  - 0.9
  - 0.98
# Keep the explicit mantissa dot: YAML 1.1 loaders such as PyYAML resolve a
# bare `1e-12` as the string "1e-12" rather than a float.
eps: 1.0e-12
weight_decay: 0.01
correct_bias: true  # adamw fix
