# Experiment overrides layered on top of the config named in _BASE_.
# NOTE(review): the relative path is presumably resolved against this file's
# directory by the project's config loader -- confirm.
_BASE_: ../maskformer_dups_bs32_80k.yaml
MODEL:
  META_ARCHITECTURE: "DUPSMaskFormer"
  BACKBONE:
    NAME: "DUPSEncoder"
  DUPS:
    # Every list below except OUT_FEATURES has exactly seven entries. They
    # look index-aligned (entry i of each list describing the same stage as
    # NAME[i]) -- TODO confirm against the DUPSEncoder implementation. Keep
    # all seven-entry lists the same length when editing.
    NAME:
      - "MixResViT"
      - "MixResNeighbour"
      - "MixResNeighbour"
      - "MixResNeighbour"
      - "MixResNeighbour"
      - "MixResNeighbour"
      - "MixResViT"
    # EMBED_DIM[i] / NUM_HEADS[i] is 32 at every index; change the two
    # lists together if that ratio is meant to be preserved.
    EMBED_DIM: [768, 384, 192, 96, 192, 384, 768]
    DEPTHS: [2, 2, 2, 8, 6, 18, 4]
    NUM_HEADS: [24, 12, 6, 3, 6, 12, 24]
    # Mirrored around the middle entry: 32 -> 4 -> 32.
    PATCH_SIZES: [32, 16, 8, 4, 8, 16, 32]
    DROP_RATE: [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]
    # Scalar, unlike the per-index DROP_RATE / ATTN_DROP_RATE lists.
    DROP_PATH_RATE: 0.3
    ATTN_DROP_RATE: [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]
    # Non-zero only at indices 1-3, the same indices that carry non-zero
    # values in DYNAMIC_UPSAMPLING_THRESHOLD below.
    UPSCALE_RATIO: [0.0, 0.85, 0.7, 0.6, 0.0, 0.0, 0.0]
    SPLIT_RATIO: [4, 4, 4, 4, 4, 4, 4]
    MLP_RATIO: [4.0, 4.0, 4.0, 4.0, 4.0, 4.0, 4.0]
    CLUSTER_SIZE: [8, 8, 8, 8, 8, 8, 8]
    NBHD_SIZE: [48, 48, 48, 48, 48, 48, 48]
    # Four named outputs, versus seven entries in the lists above.
    # NOTE(review): how these names map onto the seven stages is not
    # visible in this file -- confirm before changing either side.
    OUT_FEATURES: ["res2", "res3", "res4", "res5"]
    KEEP_OLD_SCALE: True
    ADD_IMAGE_DATA_TO_ALL: False
    # Written with an explicit decimal point on purpose: YAML 1.1 resolvers
    # (PyYAML among them) only treat exponent notation as a float when the
    # mantissa contains a '.', so a bare "1e-5" would load as a string.
    LAYER_SCALE: 1.0e-5
    DYNAMIC_UPSAMPLING_RATIOS: True
    DYNAMIC_UPSAMPLING_THRESHOLD: [0.0, 0.01, 0.02, 0.04, 0.0, 0.0, 0.0]
  # NOTE(review): these look like the widely used ImageNet per-channel
  # mean/std on a 0-255 scale -- confirm channel order with the data loader.
  PIXEL_MEAN: [123.675, 116.280, 103.530]
  PIXEL_STD: [58.395, 57.120, 57.375]