# Training configuration: experiment "voc_experiment_guide" / "voc_dino_paper",
# tag "voc_dino_paper_baseline_test", dataset "voc".
# NOTE(review): the per-section notes below are inferred from key names and
# values only; confirm them against the code that consumes this file.

# Run setup.
seed: 1222
gpus: 3
workers: 10

# Optimizer and learning-rate schedule.
opt: adamw
sched: cosine_timm
# Scientific-notation values are written with an explicit decimal point
# ("1.0e-5", not "1e-5"). YAML 1.1 loaders such as PyYAML only resolve the
# dotted form as a float; the dot-less form is loaded as a string.
lr: 1.0e-5
min_lr: 1.0e-6
warmup_lr: 1.0e-6
weight_decay: 0.05
momentum: 0.9

# Schedule length.
# NOTE(review): presumably all three values are counted in epochs -- confirm.
end_epoch: 400
cooldown_epochs: 10
warmup_epochs: 5

# NOTE(review): unclear from this file whether batch_size is per GPU or global.
batch_size: 256

# Model and initial weights.
# NOTE(review): is_pretrained_imagenet is false while initial_checkpoint names
# a checkpoint file; presumably weights come from that file -- verify.
classifier_type: deit_small_patch16_224_return_total_attn
is_pretrained_imagenet: false
initial_checkpoint: dino_deitsmall16_pretrain.pth
patch_size: 16
num_classes: 20

# Experiment bookkeeping and dataset selection.
tag: voc_dino_paper_baseline_test
experiments_name: voc_experiment_guide
experiments_subname: voc_dino_paper
dataset_name: voc

# Data augmentation.
# NOTE(review): mixup and cutmix are both 0.0; presumably this disables both,
# making mixup_prob / mixup_switch_prob irrelevant for this run -- verify.
aug: 'timm_rand'
repeated_aug: true
transmix: false
mixup: 0.0
cutmix: 0.0
mixup_prob: 1.0
mixup_switch_prob: 0.5

# Checkpointing.
# NOTE(review): 1200 is larger than end_epoch (400); if the unit is epochs,
# periodic checkpoints presumably never trigger -- confirm this is intended.
saveckp_freq: 1200

baseline: true