# Experiment config for the "DenseCap" task (see MODEL.TRAIN_TASK/TEST_TASK).
# NOTE(review): `_BASE_` looks like the detectron2-style inheritance key, in
# which case Base.yaml is loaded first and the keys in this file override it.
# Confirm against the config loader.
_BASE_: "Base.yaml"
# Model settings for this experiment.
MODEL:
  # The same single task is used for training and testing. Note the differing
  # shapes: TRAIN_TASK is a list, TEST_TASK is a single string.
  TRAIN_TASK: ["DenseCap"]
  TEST_TASK: "DenseCap"
  # Flag is disabled here.
  # NOTE(review): presumably turns off the mask prediction branch - confirm.
  MASK_ON: False
  ROI_HEADS:
    # Soft-NMS flag is disabled here.
    SOFT_NMS_ENABLED: False
  # NOTE(review): presumably the beam width for text decoding, where 1 would
  # mean greedy decoding - verify against the code that reads it.
  BEAM_SIZE: 1
  # Initial weights. The file name points to an MAE-pretrained ViT-Base
  # checkpoint.
  # NOTE(review): the `detectron2://` scheme is presumably resolved by
  # detectron2's path handling to its model-zoo download location - confirm.
  WEIGHTS: "detectron2://ImageNetPretrained/MAE/mae_pretrain_vit_base.pth"
  BACKBONE:
    # Name of the backbone builder.
    # NOTE(review): presumably looked up by name in a registry - confirm.
    NAME: build_vit_fpn_backbone
  # NOTE(review): presumably the number of transformer layers in the ViT and
  # expected to match the checkpoint in WEIGHTS; keep the two in sync - confirm.
  VIT_LAYERS: 12
# Optimizer-related settings.
SOLVER:
  # NOTE(review): presumably the layer-wise learning-rate decay factor applied
  # across the ViT layers - confirm against the optimizer builder.
  VIT_LAYER_DECAY_RATE: 0.7
# Dataset names used for training and testing.
DATASETS:
  # These values are written as Python tuple literals (note the trailing comma
  # that makes a one-element tuple). To a YAML parser they are plain strings.
  # NOTE(review): presumably the config loader evaluates them into tuples, so
  # keep this exact form rather than converting to a YAML list - confirm.
  # NOTE(review): "vg" presumably stands for Visual Genome - confirm.
  TRAIN: ("vg_train",)
  TEST: ("vg_test",)
# Data loading settings.
DATALOADER:
  # NOTE(review): presumably the batch size drawn from each dataset; whether
  # this is per GPU or global is not visible from this file - confirm.
  DATASET_BS: 2
# Output directory for this experiment. The leading "./" makes it a relative
# path, so its location depends on the directory the job is launched from.
OUTPUT_DIR: "./output/GRiT_B_DenseCap"