# Run-level settings.
# NOTE(review): the per-key notes below are inferred from the key names;
# confirm them against the code that consumes this config.
OUTPUT_DIR: 'OUTPUT/'  # relative path; presumably where run artifacts go
WORKERS: 6  # presumably the data-loader worker count
PRINT_FREQ: 100  # presumably the logging interval
AMP:
  # Presumably toggles automatic mixed precision -- TODO confirm.
  ENABLED: true

# Augmentation settings.
AUG:
  # NOTE(review): presumably a mixup hyper-parameter; confirm whether the
  # consumer reads 0.1 as a mixing strength or an application probability.
  MIXUP: 0.1

# Model definition plus the checkpoint used to initialise it.
MODEL:
  NAME: cls_vit
  NUM_CLASSES: 1000
  SPEC:
    PATCH_SIZE: 16
    # 768 / 8 = 96; presumably the per-head width if EMBED_DIM is split
    # evenly across NUM_HEADS -- TODO confirm.
    EMBED_DIM: 768
    NUM_HEADS: 8
    DEPTH: 8
    MLP_RATIO: 3.0
    # ATTN_DROP_RATE and DROP_PATH_RATE are both 0.0; DROP_RATE is the only
    # non-zero drop setting in this spec.
    ATTN_DROP_RATE: 0.0
    DROP_RATE: 0.1
    DROP_PATH_RATE: 0.0
    QKV_BIAS: false
    USE_CLS_TOKEN: true
  # NOTE(review): the checkpoint directory name contains "IN-22k" and "224",
  # while TRAIN/TEST IMAGE_SIZE in this file is 384x384. Confirm that the
  # loader adapts `pos_embed` to the larger input.
  PRETRAINED: 'DATASET/models/IN-22k/s16_224_aug4_w5c300_adamW0.003wd0.05bnwd0/model_best.pth'
  # No classifier/head entry is listed here; presumably the head is not
  # restored from the checkpoint -- TODO confirm.
  PRETRAINED_LAYERS:
    - patch_embed
    - pos_embed
    - cls_token
    - blocks
# Dataset location and split names.
DATASET:
  DATASET: 'imagenet'
  # NOTE(review): presumably selects a TSV-backed reader; ROOT below ends in
  # "imagenet-tsv/" -- confirm against the data-loading code.
  DATA_FORMAT: 'tsv'
  ROOT: 'DATASET/imagenet-tsv/'
  # Split names; presumably resolved relative to ROOT -- TODO confirm.
  TRAIN_SET: 'train'
  TEST_SET: 'val'
# Evaluation settings.
TEST:
  BATCH_SIZE_PER_GPU: 32
  # Two-element list; the same 384x384 value appears under TRAIN.IMAGE_SIZE.
  IMAGE_SIZE: [384, 384]
  CENTER_CROP: false
  # Explicit empty string (not null).
  # NOTE(review): presumably means "no separate evaluation checkpoint".
  MODEL_FILE: ''
# Training settings, grouped as: data, optimizer, LR schedule.
TRAIN:
  # --- data ---
  BATCH_SIZE_PER_GPU: 32
  IMAGE_SIZE: [384, 384]
  SHUFFLE: true
  # --- optimizer ---
  OPTIMIZER: sgd
  MOMENTUM: 0.9
  NESTEROV: true
  # WD is 0.0 in this config.
  # NOTE(review): WITHOUT_WD_LIST presumably names parameter groups exempt
  # from weight decay; with WD at 0.0 it likely has no practical effect.
  WD: 0.0
  WITHOUT_WD_LIST: ['bn']
  # --- LR schedule ---
  LR_SCHEDULER:
    # NOTE(review): schedule name is resolved by the consumer; its step
    # and decay behaviour is not visible in this file.
    METHOD: 'BitHyperRule'
# Fine-tuning settings.
FINETUNE:
  FINETUNE: true
  # NOTE(review): presumably an evaluation interval; the unit (iterations
  # vs. samples) is not visible in this file -- confirm.
  EVAL_EVERY: 2000
  # NOTE(review): presumably the base learning rate used with the
  # TRAIN.LR_SCHEDULER method -- confirm how it is scaled.
  BASE_LR: 0.03
# Debug switch; disabled in this config.
DEBUG:
  DEBUG: false
