{
    "dino_cfg": {
        "d_model": 1024,
        "decoder_cfg": {
            "num_cross_attn": 4,
            "init_values": 1.0,
            "prev_values": 0.5,
            "nhead": 8,
            "attention_type": "FLASH2",
            "ffn_type": "ffn",
            "softmax_scale": "entropy_invariance",
            "train_avg_length": 1024,
            "self_cross_types": null,
            "post_norm": false,
            "pre_norm_query": true,
            "no_combine_norm": false
        }
    },
    "encoder_cfg": {
        "feat_chs": [64, 32, 16, 8]
    },
    "matcher": {
        "num_grid": [32, 32, 64, 128, 256],
        "radius": [7, 6, 4, 2, 0],
        "displacement_dim": [64, 64, 32, 16, 8],
        "num_itr": [4, 4, 4, 4, 4]
    }
}