# Optimizer: SGD with momentum and weight decay.
optimizer = {
    'type': 'SGD',
    'lr': 0.01,  # base learning rate that the schedule below scales
    'momentum': 0.9,
    'weight_decay': 1e-4,
}

# Gradient clipping applied around the optimizer step.
# NOTE(review): max_norm / norm_type are presumably forwarded to
# torch.nn.utils.clip_grad_norm_ by the framework's optimizer hook — confirm
# against the framework version in use.
optimizer_config = {
    'grad_clip': {
        'max_norm': 35,
        'norm_type': 2,
    },
}

# Learning-rate policy: cosine annealing preceded by an exponential warmup.
# NOTE(review): the per-key remarks below assume mmcv-style LR updater hook
# semantics — confirm against the framework version in use.
# NOTE(review): the original trailing comment listed
# "0.01 0.005 0.0025 0.00125 0.000625"; presumably learning rates from an
# earlier halving schedule — confirm whether it is still relevant.
lr_config = {
    'policy': 'CosineAnnealing',
    'warmup': 'exp',
    'warmup_by_epoch': True,  # presumably makes warmup_iters count epochs
    'warmup_iters': 1,
    'warmup_ratio': 1e-3,
    'min_lr_ratio': 4e-5,  # presumably final lr as a fraction of the base lr
}
# Training loop driver: epoch-based runner with an 18-epoch limit.
runner = {
    'type': 'EpochBasedRunner',
    'max_epochs': 18,
}
