# Model configuration for the variant named "vssm1_tiny_0217" (MODEL.TYPE: vssm).
# NOTE(review): the loader/schema that consumes these keys is not part of this
# file; any key meaning noted below is inferred from the key name only and
# should be confirmed against the model builder.
MODEL:
  TYPE: vssm
  NAME: vssm1_tiny_0217
  DROP_PATH_RATE: 0.2
  # Nested settings for the VSSM model (presumably selected by TYPE: vssm — confirm).
  VSSM:
    EMBED_DIM: 96
    # Four entries; presumably one block count per stage — TODO confirm.
    DEPTHS: [ 2, 2, 4, 2 ]
    SSM_D_STATE: 1
    SSM_DT_RANK: "auto"
    # Active value is 1.6; 2.0 is kept below as a commented-out alternative.
    SSM_RATIO: 1.6
    # SSM_RATIO: 2.0
    # SSM_RANK_RATIO is left commented out: per the original author's note,
    # adding it introduces an extra nn.Linear, which costs 1.5+ GFLOPs.
    # SSM_RANK_RATIO: 1.6
    # NOTE(review): -1 looks like a sentinel value (possibly "disabled") — confirm.
    SSM_CONV: -1
    SSM_FORWARDTYPE: "v2"
    MLP_RATIO: 4.0
    DOWNSAMPLE: "v3"
    PATCHEMBED: "v2"
