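# Source: "ResNet strikes back: An improved training procedure in timm"
# https://arxiv.org/pdf/2110.00476.pdf
# Training procedure A2 from that paper.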
# Hyperparameters, one flat mapping of option name -> value.
# Floats written in scientific notation carry an explicit decimal point
# (5.0e-3 rather than 5e-3): YAML 1.1 loaders such as PyYAML only resolve
# exponent notation as a float when the mantissa contains a '.', otherwise the
# value is loaded as a string.

# Optimizer and learning-rate schedule.
batch_size: 256
epochs: 300
opt: 'lamb'
weight_decay: 0.02
lr: 5.0e-3  # total batch size 2048
min_lr: 1.0e-5
sched: 'cosine'
warmup_epochs: 5
warmup_lr: 1.0e-6
cooldown_epochs: 0

# Regularization and numerics.
drop_path: 0.05
# clip_grad: 1.0  (left disabled)
amp: true

# Data augmentation and loss.
aa: 'rand-m7-mstd0.5-inc1'
aug_repeats: 3
bce_loss: true
# bce_target_thresh: 0.2  (left disabled)
color_jitter: 0.0
smoothing: 0.0
mixup: 0.1
cutmix: 1.0
mixup_prob: 1.0
mixup_switch_prob: 0.5
mixup_mode: 'batch'

# NOTE(review): presumably controls batch-norm statistics handling across
# distributed workers; confirm against the consuming training script.
dist_bn: 'reduce'

