# Parent config this file inherits from; the assignments below override it.
# Kept as a literal list so config loaders can read it without other names.
_base_ = ['./upernet_swin_4xb4-160k_ade20k-896x896_small.py']
# Model overrides applied on top of the config listed in `_base_`:
# an MM_VSSM backbone plus matching decode-head input channels.
model = dict(
    backbone=dict(
        type='MM_VSSM',
        out_indices=(0, 1, 2, 3),
        # Relative path to the classification checkpoint.
        # NOTE(review): what this path is resolved against is not visible
        # here -- confirm before launching from a different directory.
        pretrained=(
            '../../ckpts/classification/outs/vssm/vssmsmall/'
            'vssmsmall_dp03_ckpt_epoch_238.pth'
        ),
        # The hyper-parameters below were copied from
        # classification/configs/vssm/vssm_small_224.yaml
        dims=96,
        depths=(2, 4, 10, 2),
        ssm_d_state=16,
        ssm_dt_rank='auto',
        ssm_ratio=2.0,
        mlp_ratio=4.0,
        downsample_version='v3',
        patchembed_version='v2',
        ssm_conv_bias=False,
        ssm_conv=3,
        # Original author's note: keep this value "if you want exactly the
        # same" -- presumably the same behavior as the pretrained
        # classification model; TODO confirm.
        forward_type='v05_noz',
    ),
    # Presumably the per-stage backbone output widths (dims=96 doubled at
    # each of the four stages) -- confirm against the backbone.
    decode_head=dict(in_channels=[96, 192, 384, 768]),
)
# Training batch size override. Original note: "as gpus=4".
# NOTE(review): presumably a per-GPU batch size for a 4-GPU run, matching the
# "4xb4" in the base config's file name -- confirm.
train_dataloader = dict(
    batch_size=4,
)

