# Run-level settings.
# NOTE(review): the meanings below are inferred from the key names; confirm
# against the code that consumes this config.
# presumably the directory where run outputs are written (relative path)
OUTPUT_DIR: 'OUTPUT/'
# presumably the number of data-loading worker processes — TODO confirm
WORKERS: 6
# presumably the logging interval, in iterations — TODO confirm
PRINT_FREQ: 100
# Mixed-precision switch (presumably automatic mixed precision — confirm
# against the trainer).
AMP:
  # Canonical lowercase boolean, matching the TRAIN, FINETUNE and DEBUG
  # sections of this file; parses to the same value as `True`.
  ENABLED: true

# Data-augmentation settings.
AUG:
  # NOTE(review): could be a mixup probability or a mixup alpha — the key
  # name alone does not say which; confirm against the augmentation code.
  MIXUP: 0.1

# Model definition.
# NOTE(review): per-key meanings are inferred from the key names; confirm
# against the model builder that consumes this section.
MODEL:
  NAME: cls_vit
  NUM_CLASSES: 1000
  SPEC:
    # NOTE(review): TRAIN/TEST IMAGE_SIZE in this file is 384, which is not
    # a multiple of 14 (384 = 27 * 14 + 6) — confirm the patch embedding
    # handles the remainder as intended.
    PATCH_SIZE: 14
    # 1024 / 16 = 64 dimensions per head, assuming heads split EMBED_DIM
    # evenly — TODO confirm.
    EMBED_DIM: 1024
    NUM_HEADS: 16
    DEPTH: 24
    MLP_RATIO: 4.0
    ATTN_DROP_RATE: 0.0
    DROP_RATE: 0.0
    DROP_PATH_RATE: 0.1
    # Booleans use canonical lowercase, matching the TRAIN, FINETUNE and
    # DEBUG sections of this file; they parse to the same values as `True`.
    QKV_BIAS: true
    USE_CLS_TOKEN: true
    NORM_EMBED: true
  # Empty string: no checkpoint path is set in this file; presumably one is
  # supplied by an override at launch time — verify.
  PRETRAINED: ''
  # presumably the parameter-name prefixes loaded from the PRETRAINED
  # checkpoint — TODO confirm against the loading code.
  PRETRAINED_LAYERS:
    - patch_embed
    - pos_embed
    - cls_token
    - blocks
# Loss settings.
LOSS:
  # presumably the label-smoothing factor applied to the classification
  # targets — TODO confirm against the loss construction code.
  LABEL_SMOOTHING: 0.1
# Dataset selection and on-disk location.
DATASET:
  DATASET: 'imagenet'
  # Relative path; the storage format is declared separately below.
  ROOT: 'DATASET/imagenet-tsv/'
  DATA_FORMAT: 'tsv'
  # Split names; presumably resolved relative to ROOT — verify against the
  # data loader.
  TRAIN_SET: 'train'
  TEST_SET: 'val'
# Evaluation-time settings.
TEST:
  BATCH_SIZE_PER_GPU: 32
  # Same size as TRAIN.IMAGE_SIZE in this file.
  IMAGE_SIZE: [384, 384]
  # Canonical lowercase boolean, matching the TRAIN, FINETUNE and DEBUG
  # sections of this file; parses to the same value as `False`.
  CENTER_CROP: false
  # Empty string: no evaluation checkpoint is set in this file; presumably
  # supplied by an override when running evaluation only — verify.
  MODEL_FILE: ''
# Training-time settings, grouped by concern.
TRAIN:
  # Input pipeline: same per-GPU batch size and image size as the TEST
  # section of this file.
  IMAGE_SIZE: [384, 384]
  BATCH_SIZE_PER_GPU: 32
  SHUFFLE: true
  # Optimizer.
  OPTIMIZER: 'sgd'
  MOMENTUM: 0.9
  NESTEROV: true
  # Weight decay is 0.0 here, so the exclusion list below has no numeric
  # effect unless WD is overridden.
  # NOTE(review): presumably name patterns for parameters exempt from weight
  # decay — confirm against the optimizer builder.
  WD: 0.0
  WITHOUT_WD_LIST:
    - 'bn'
  # Learning-rate schedule, selected by name.
  LR_SCHEDULER:
    METHOD: 'BitHyperRule'
# Fine-tuning settings.
FINETUNE:
  # Enables the fine-tuning path (presumably starting from MODEL.PRETRAINED
  # — verify against the training entry point).
  FINETUNE: true
  # presumably the evaluation interval in iterations — TODO confirm the unit
  EVAL_EVERY: 2000
  # NOTE(review): presumably the base learning rate before any batch-size
  # scaling or schedule is applied — confirm against the scheduler code.
  BASE_LR: 0.03
# Debug switch; disabled in this configuration.
DEBUG:
  DEBUG: false
