# Experiment configuration that names base_clip_teacher_image_R50.yaml as its
# base file.
# NOTE(review): presumably a detectron2/yacs-style config in which the keys set
# in this file override the values loaded from _BASE_ — confirm with the loader.
_BASE_: "base_clip_teacher_image_R50.yaml"
# Model settings: initial checkpoint plus the visual-prompt, hierarchy and LoRA
# switches.
MODEL:
  # Absolute, machine-specific checkpoint path; adjust it when running on
  # another host.
  WEIGHTS: "/data/weight/GLEE/GLEE_Lite_scaleup.pth"
  VISUAL_PROMPT: True
  # HIER_TRAINING is on while HIER_POS and HIER_NEG are both off.
  # NOTE(review): confirm this combination is intended; the code that reads
  # these flags is not visible from this file.
  HIER_TRAINING: True
  HIER_POS: False
  HIER_NEG: False
  # LoRA is enabled with rank 16 and alpha 16.
  # NOTE(review): if the consumer scales updates by alpha / rank, equal values
  # give a factor of 1.0 — verify against the LoRA implementation.
  LORA: True
  LORA_RANK: 16
  LORA_ALPHA: 16
  # NOTE(review): presumably the weight of a hierarchy-related loss term —
  # confirm against the model code.
  HIER_ELOSS_WEIGHT: 1.0
# Dataset names used for training and for evaluation.
# NOTE(review): presumably each name must match a dataset registered by the
# project — confirm against the dataset registration code.
DATASETS:
  # One training dataset, written as a one-element tuple literal.
  TRAIN: ("vg_syn",)
  # Two evaluation datasets.
  TEST: ("refcoco-unc-val", "d3_intra_scenario")
# Optimisation schedule: batch size, learning rate, warm-up and checkpointing.
SOLVER:
  IMS_PER_BATCH: 4
  BASE_LR: 0.00005
  # NOTE(review): both STEPS milestones (300000 and 380000) are greater than
  # MAX_ITER (100000), so neither is reached within this run. If the scheduler
  # inherited from the base config is step-based, the learning rate would
  # never decay — confirm that a constant post-warm-up rate is intended.
  STEPS: (300000,380000 )
  MAX_ITER: 100000
  WARMUP_FACTOR: 0.005
  WARMUP_ITERS: 200
  # NOTE(review): presumably a checkpoint is written every 1000 iterations,
  # i.e. up to 100 checkpoints over MAX_ITER — check the disk budget.
  CHECKPOINT_PERIOD: 1000
  # NOTE(review): presumably a learning-rate multiplier applied to the text
  # encoder parameters — confirm against the optimizer builder.
  TEXTENCODER_MULTIPLIER: 0.1
# Evaluation settings.
TEST:
  # 10000 divides MAX_ITER (100000) evenly and is ten times
  # SOLVER.CHECKPOINT_PERIOD (1000).
  # NOTE(review): presumably evaluation on DATASETS.TEST runs every
  # EVAL_PERIOD iterations — confirm against the trainer.
  EVAL_PERIOD: 10000
# Data-loading settings for the multi-dataset sampler.
# NOTE(review): DATASET_RATIO, DATASET_BS, USE_RFS and DATASET_ANN each have
# four entries, while DATASETS.TRAIN in this file names a single dataset
# ("vg_syn"). Presumably these lists are indexed per training dataset — verify
# that the sampler tolerates the three extra entries, or trim them to one.
DATALOADER:
  SAMPLER_TRAIN: "MultiDatasetSampler"
  DATASET_RATIO: [1.0, 1.0, 1.0, 1.0]
  USE_DIFF_BS_SIZE: True
  # Every entry equals SOLVER.IMS_PER_BATCH (4).
  DATASET_BS: [4, 4, 4, 4]
  USE_RFS: [True, True, True, True]
  DATASET_ANN: ['box', 'box', 'box', 'box']
  FILTER_EMPTY_ANNOTATIONS: False
  NUM_WORKERS: 4
# Output location and experiment-tracking labels.
# Absolute, user-specific directory; adjust it when running under another
# account or on another host.
OUTPUT_DIR: "/data/sojungan/exp/lora_enc"
# NOTE(review): presumably the Weights & Biases project and run name. "test" is
# a generic run name — consider a descriptive one so runs stay distinguishable.
WANDB_PROJECT: "vg"
WANDB_NAME: "test"