# Learning-rate scheduler config. `_target_` names the callable to build
# (Hydra-style instantiation); the remaining keys are its keyword arguments.
_target_: transformers.get_polynomial_decay_schedule_with_warmup
# Total number of training steps; -1 specifies to infer the number of
# training steps.
num_training_steps: 50000
# Number of warmup steps; a float value is interpreted as the fraction of
# training steps to use as warmup.
# NOTE(review): presumably the consuming code converts this float into an
# integer step count before calling the target -- confirm.
num_warmup_steps: 0.1
# Final learning rate reached at the end of the decay. Written with an
# explicit mantissa dot so YAML 1.1 loaders (e.g. PyYAML) parse it as a float
# rather than as the string "1e-7".
lr_end: 1.0e-7
# Exponent of the polynomial decay.
power: 1.0
