# Model section: selects the `vit` model type under the `pretrain` name.
MODEL:
  TYPE: vit
  NAME: pretrain
  # Drop-path rate of 0.0 — presumably disables stochastic depth; confirm
  # against the model builder.
  DROP_PATH_RATE: 0.0
  RECOVER_TARGET_TYPE: normal
  # Backbone hyper-parameters for the `vit` model type.
  VIT:
    EMBED_DIM: 384
    DEPTH: 12
    # 384 / 6 = 64 — presumably the per-head width, if EMBED_DIM is split
    # evenly across heads; confirm.
    NUM_HEADS: 6
    # NOTE(review): a plain YAML parser reads `None` as the string "None",
    # not as null. Presumably the config loader converts it to a real None —
    # confirm before changing the spelling.
    INIT_VALUES: None
    # Position-encoding switches: only USE_APE is enabled here; both RPB
    # variants are off.
    USE_APE: True
    USE_RPB: False
    USE_SHARED_RPB: False
    USE_MEAN_POOLING: False
# Data section: input size and the filter applied to the input images.
DATA:
  IMG_SIZE: 224
  # Selects the filter family; the WAVE sub-section below holds its settings.
  FILTER_TYPE: wavelet
  WAVE:
    LEVEL: 4
    # Four thresholds, matching LEVEL: 4 — presumably one per level;
    # confirm the ordering against the data pipeline.
    THRESHOLDS: [.05, .01, .005, .003]
    KEEP_HIGH: True
    RANDOM_MASK: False
# Training schedule and optimizer settings.
TRAIN:
  EPOCHS: 300
  WARMUP_EPOCHS: 20
  # Learning rates satisfy WARMUP_LR < MIN_LR < BASE_LR.
  # BASE_LR is written with an explicit decimal point: YAML 1.1 parsers
  # (e.g. PyYAML) resolve a bare `3e-4` as a string, whereas `3.0e-4` is a
  # float under both YAML 1.1 and 1.2. The numeric value is unchanged.
  BASE_LR: 3.0e-4
  WARMUP_LR: 2.5e-7
  MIN_LR: 2.5e-6
  WEIGHT_DECAY: 0.05
  CLIP_GRAD: 3.0
  OPTIMIZER:
    # NOTE(review): `(0.9, 0.95)` is not YAML sequence syntax; a YAML parser
    # yields the plain string "(0.9, 0.95)". Presumably the config loader
    # evaluates it into a tuple — confirm before rewriting as a YAML list.
    BETAS: (0.9, 0.95)
# Logging / checkpoint cadence. Units are not visible in this file —
# presumably iterations for PRINT_FREQ and epochs for SAVE_FREQ; confirm.
PRINT_FREQ: 100
SAVE_FREQ: 3
# Run tag. It repeats IMG_SIZE (img224) and EPOCHS (300ep) from the sections
# above — NOTE(review): keep it in sync if those values are changed.
TAG: wavelet_compression__pretrain__vit_small_img224__300ep