# Optimizer settings. `_target_` names the class that the remaining keys are
# presumably passed to as keyword arguments (Hydra-style instantiation —
# TODO confirm against the code that consumes this file).
# NOTE(review): upstream DeepSpeed documents OnebitAdam under
# deepspeed.runtime.fp16.onebit.adam; confirm this import path resolves for
# the DeepSpeed version in use.
_target_: deepspeed.ops.adam.OnebitAdam
# Interpolated from the `training.lr` key, which is defined outside this file.
lr: ${training.lr}
betas: [0.8, 0.999]
# Exponent floats carry an explicit mantissa dot so that YAML 1.1 loaders
# (e.g. PyYAML) resolve them as floats rather than as strings.
eps: 1.0e-8
weight_decay: 3.0e-7
# Presumably the number of warm-up steps before compressed communication
# starts, per the DeepSpeed 1-bit Adam docs — confirm.
freeze_step: 400
# NOTE(review): presumably requires a CUDA-aware MPI build — confirm for the
# target cluster.
cuda_aware: true
