---
# Run configuration.
# NOTE(review): the code that loads this file is not visible from here, so the
# per-key notes below are inferred from key names only -- confirm them against
# the consumer before relying on them.

# Batching and run length.
batch_size: 128
num_workers: 8  # presumably the number of data-loading workers -- TODO confirm
epochs: 50

# Optimizer settings.
lr: 0.0003
weight_decay: 0.0  # float zero; presumably means "no weight decay" -- confirm

# Learning-rate schedule.
warmup: 5  # unit (epochs vs. steps) is not stated in this file -- TODO confirm
schedule: inv_sqrt  # presumably an inverse-square-root schedule -- TODO confirm