# Parent config file; the keys below are presumably applied on top of it
# (confirm against the config loader).
_BASE_: 'Base-C2_L_R5021k_640b64_4x.yaml'
# Model settings: initial weights, box-head classifier, and the classifier(s)
# swapped in at test time.
MODEL:
  # Weights file to load (a model_final.pth from another run's output folder).
  WEIGHTS: 'output/Detic/Detic_LI_CLIP_R5021k_640b64_4x_ft4x_max-size_gpt/model_final.pth'
  ROI_BOX_HEAD:
    IMAGE_LABEL_LOSS: "max_size"
    USE_ZEROSHOT_CLS: true
    # Classifier weights stored as .npy; the file name indicates LVIS v1.
    ZEROSHOT_WEIGHT_PATH: "datasets/metadata/lvis_v1_clip_gpt_tutorial_sampled_softmax_vit_b16_ep20_randaug2_unc1000_16shots_nctx4_cscFalse_ctpend+cname.npy"
  RESET_CLS_TESTS: true
  # One classifier file and one class count are listed here, matching the
  # single entry in DATASETS.TEST. Presumably the three are paired by
  # position -- TODO confirm against the evaluation code.
  TEST_CLASSIFIERS: ("datasets/metadata/coco_clip_gpt_tutorial_sampled_softmax_vit_b16_ep20_randaug2_unc1000_16shots_nctx4_cscFalse_ctpend+cname.npy", )
  TEST_NUM_CLASSES: [80]
  # Two-dataset variant (COCO + O365 classifier files), kept for reference:
  # TEST_CLASSIFIERS: ("datasets/metadata/coco_clip_gpt_tutorial_sampled_softmax_vit_b16_ep20_randaug2_unc1000_16shots_nctx4_cscFalse_ctpend+cname.npy", "datasets/metadata/o365_clip_gpt_tutorial_sampled_softmax_vit_b16_ep20_randaug2_unc1000_16shots_nctx4_cscFalse_ctpend+cname.npy")
  # TEST_NUM_CLASSES: [80, 365]
# Solver settings: batch size, learning rate, iteration budget, and warmup.
SOLVER:
  IMS_PER_BATCH: 64
  BASE_LR: 0.0002
  MAX_ITER: 90000
  WARMUP_FACTOR: 0.001
  WARMUP_ITERS: 1000
# Dataset names for training and evaluation. The values are Python-style
# tuple literals written as plain scalars; keep their text unchanged.
DATASETS:
  TEST: ('coco_generalized_zeroshot_val', )
  # Two-dataset evaluation variant, kept for reference:
  # TEST: ('coco_generalized_zeroshot_val', 'objects365_v2_val')
  TRAIN: ("lvis_v1_train","imagenet_lvis_v1")
# Directory for this run's outputs (path is relative).
OUTPUT_DIR: './output/Detic/Detic_LI_CLIP_R5021k_640b64_4x_ft4x_max-size_gpt_coco'
# Data-loading settings. Each two-element list below has one entry per name in
# DATASETS.TRAIN -- presumably in the same order; TODO confirm against the
# data loader.
DATALOADER:
  NUM_WORKERS: 8
  FILTER_EMPTY_ANNOTATIONS: false
  SAMPLER_TRAIN: 'MultiDatasetSampler'
  MULTI_DATASET_GROUPING: true
  USE_DIFF_BS_SIZE: true
  # Per-dataset lists.
  DATASET_ANN: ["box", "image"]
  DATASET_RATIO: [1, 4]
  DATASET_BS: [8, 32]
  USE_RFS: [true, false]
  DATASET_INPUT_SIZE: [640, 320]
  DATASET_INPUT_SCALE:
    - [0.1, 2.0]
    - [0.5, 1.5]
# Top-level switch; presumably enables training with image-level labels
# (DATALOADER.DATASET_ANN lists an 'image' entry) -- TODO confirm.
WITH_IMAGE_LABELS: true