{
    "dino-vit-small-p16_cls": {
        "model_name": "dino-vit-small-p16",
        "source": "ssl",
        "model_parameters": {
            "token_extraction": "cls_token"
        },
        "module_names": [
            "blocks.0.norm2",
            "blocks.1.norm1",
            "blocks.1.norm2",
            "blocks.2.norm1",
            "blocks.2.norm2",
            "blocks.3.norm1",
            "blocks.3.norm2",
            "blocks.4.norm1",
            "blocks.4.norm2",
            "blocks.5.norm1",
            "blocks.5.norm2",
            "blocks.6.norm1",
            "blocks.6.norm2",
            "blocks.7.norm1",
            "blocks.7.norm2",
            "blocks.8.norm1",
            "blocks.8.norm2",
            "blocks.9.norm1",
            "blocks.9.norm2",
            "blocks.10.norm1",
            "blocks.10.norm2",
            "blocks.11.norm1",
            "blocks.11.norm2",
            "norm"
        ],
        "objective": "Self-Supervised",
        "dataset": "ImageNet1k",
        "architecture_class": "Transformer",
        "architecture": "ViT",
        "alignment": null,
        "dataset_class": "ImageNet1k",
        "embedding_dim": 384,
        "size": 21665664,
        "size_fmt": "21.7M",
        "size_class": "small"
    },
    "dino-vit-small-p16_ap": {
        "model_name": "dino-vit-small-p16",
        "source": "ssl",
        "model_parameters": {
            "token_extraction": "avg_pool"
        },
        "module_names": [
            "blocks.0.norm2",
            "blocks.1.norm1",
            "blocks.1.norm2",
            "blocks.2.norm1",
            "blocks.2.norm2",
            "blocks.3.norm1",
            "blocks.3.norm2",
            "blocks.4.norm1",
            "blocks.4.norm2",
            "blocks.5.norm1",
            "blocks.5.norm2",
            "blocks.6.norm1",
            "blocks.6.norm2",
            "blocks.7.norm1",
            "blocks.7.norm2",
            "blocks.8.norm1",
            "blocks.8.norm2",
            "blocks.9.norm1",
            "blocks.9.norm2",
            "blocks.10.norm1",
            "blocks.10.norm2",
            "blocks.11.norm1",
            "blocks.11.norm2",
            "norm"
        ],
        "objective": "Self-Supervised",
        "dataset": "ImageNet1k",
        "architecture_class": "Transformer",
        "architecture": "ViT",
        "alignment": null,
        "dataset_class": "ImageNet1k",
        "embedding_dim": 384,
        "size": 21665664,
        "size_fmt": "21.7M",
        "size_class": "small"
    }
}