_base_ = [ '../swin/mask-rcnn_swin-t-p4-w7_fpn_1x_coco.py' ] model = dict( backbone=dict( type='MM_VSSM', out_indices=(0, 1, 2, 3), pretrained="", # copied from classification/configs/vssm/vssm_tiny_224.yaml dims=96, # depths=(2, 2, 5, 2), depths=(2, 2, 8, 2), ssm_d_state=1, ssm_dt_rank="auto", # ssm_ratio=2.0, ssm_ratio=1.0, ssm_conv=3, ssm_conv_bias=False, forward_type="v05_noz", # v3_noz mlp_ratio=4.0, downsample_version="v3", patchembed_version="v2", drop_path_rate=0.2, norm_layer="ln2d", ), ) # train_dataloader = dict(batch_size=2) # as gpus=8