# Training settings, kept in alphabetical key order.
# Booleans are written as lowercase true/false and small floats with a
# two-digit exponent so every entry follows the same convention.
# NOTE(review): the meaning of each key is defined by the code that loads
# this file, which is not visible here — confirm semantics there.
aa: null
batch_size: 32
color_jitter: 0.0
decay_by_epoch: true
decay_epochs: 30
decay_rate: 0.1
drop: 0.0
epochs: 100
log_interval: 50
lr: 0.1
min_lr: 1.0e-05
model_ema: false
# NOTE(review): model_ema is false above, so this value is presumably unused
# — confirm against the consumer.
model_ema_decay: 0.9998
momentum: 0.9
opt: sgd
opt_betas: null
opt_eps: 1.0e-08
remode: const
reprob: 0.0
sched: step
seed: 42
smoothing: 0.0
warmup_epochs: 0
# NOTE(review): warmup_epochs is 0 above, so this value presumably has no
# effect — confirm against the consumer.
warmup_lr: 0.2
weight_decay: 1.0e-04
workers: 8
# Knowledge-distillation (kd) settings.
# NOTE(review): 'dist' is presumably the name of a distillation loss selected
# by the training code — confirm against the consumer.
kd: 'dist'
# Loss weights; presumably ori_loss_weight scales the original (task) loss
# and kd_loss_weight scales the distillation loss — TODO confirm.
ori_loss_weight: 1.0
kd_loss_weight: 2.0
teacher_model: 'tv_resnet34'
teacher_pretrained: true
