# training loop settings
# NOTE(review): 5001 (not a round 5000) looks deliberate, e.g. so that a
# periodic action also fires at epoch 5000 - confirm against the training loop.
num_epochs: 5001
# presumably the number of samples per batch - verify against the data loader
batch_size: 500

# optimizer settings
# Learning rates are written with an explicit decimal point (1.0e-7, not 1e-7):
# YAML 1.1 loaders such as PyYAML only resolve a float when the mantissa
# contains a ".", and would otherwise load these values as strings.
# NOTE(review): the names suggest a schedule that warms up from initial_lr to
# peak_lr over warmup_steps and then decays to end_lr over decay_steps -
# confirm against the scheduler code.
initial_lr: 1.0e-7
peak_lr: 1.0e-3
end_lr: 1.0e-4
warmup_steps: 5
# decay_steps depends on the number of batches per epoch
# (epochs * num_batches_per_epoch); re-check it whenever num_epochs,
# batch_size or the dataset size changes.
decay_steps: 10000
clip_grad_norm: 1.0

# model saving settings
# Directory path built from two ${...} placeholders: config.base_path and
# config.wandb.experiment_name. Presumably these are resolved by the config
# loader's interpolation at load time - TODO confirm which loader is used.
model_save_dir: "${config.base_path}/.checkpoints/${config.wandb.experiment_name}"
