# Model configuration override. Keys not set here are presumably taken from
# the file named in _BASE_ (yacs/detectron2-style inheritance) - confirm
# against the config loader.
_BASE_: ../maskformer_dups_bs16_90k.yaml
MODEL:
  META_ARCHITECTURE: "DUPSMaskFormerSW"
  BACKBONE:
    NAME: "DUPSEncoder"
  DUPS:
    # Unless noted otherwise, every list in this section has seven entries;
    # presumably one entry per backbone stage, in order - confirm against
    # the code that consumes MODEL.DUPS.
    #
    # Block type per entry: "MixResViT" at both ends, "MixResNeighbour" for
    # the five entries in between.
    NAME:
      [
        "MixResViT",
        "MixResNeighbour",
        "MixResNeighbour",
        "MixResNeighbour",
        "MixResNeighbour",
        "MixResNeighbour",
        "MixResViT",
      ]
    # EMBED_DIM, NUM_HEADS and PATCH_SIZES are all symmetric around the
    # fourth entry (values halve down to the middle, then double back up).
    EMBED_DIM: [512, 256, 128, 64, 128, 256, 512]
    DEPTHS: [1, 1, 1, 4, 4, 16, 4]
    NUM_HEADS: [16, 8, 4, 2, 4, 8, 16]
    PATCH_SIZES: [32, 16, 8, 4, 8, 16, 32]
    # Dropout settings: the two list-valued rates are zero for every entry;
    # DROP_PATH_RATE is a single scalar, not a list.
    DROP_RATE: [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]
    DROP_PATH_RATE: 0.3
    ATTN_DROP_RATE: [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]
    # Non-zero only for entries 2-4; the first entry and the last three
    # are 0.0.
    UPSCALE_RATIO: [0.0, 0.5, 0.7, 0.65, 0.0, 0.0, 0.0]
    SPLIT_RATIO: [4, 4, 4, 4, 4, 4, 4]
    MLP_RATIO: [3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0]
    CLUSTER_SIZE: [8, 8, 8, 8, 8, 8, 8]
    NBHD_SIZE: [48, 48, 48, 48, 48, 48, 48]
    # Four named outputs, unlike the seven-entry lists above.
    OUT_FEATURES: ["res2", "res3", "res4", "res5"]
    KEEP_OLD_SCALE: True
    ADD_IMAGE_DATA_TO_ALL: False
    LAYER_SCALE: 0.0
    DYNAMIC_UPSAMPLING_RATIOS: True
    # Non-zero at the same positions (entries 2-4) as UPSCALE_RATIO.
    # NOTE(review): how these thresholds interact with UPSCALE_RATIO when
    # DYNAMIC_UPSAMPLING_RATIOS is True is not visible here - confirm.
    DYNAMIC_UPSAMPLING_THRESHOLD: [0.0, 0.005, 0.01, 0.02, 0.0, 0.0, 0.0]
  # Three-value normalisation constants. NOTE(review): these look like the
  # widely used ImageNet statistics on a 0-255 scale; channel order is
  # presumably RGB - confirm against the data loader.
  PIXEL_MEAN: [123.675, 116.280, 103.530]
  PIXEL_STD: [58.395, 57.120, 57.375]