{
    "model_id": {
        "value": "S2MAE",
        "confidence": 0.8116
    },
    "model_name": {
        "value": "S2MAE",
        "confidence": 0.9953
    },
    "version": {
        "value": null,
        "confidence": 0.0
    },
    "release_date": {
        "value": null,
        "confidence": 0.0
    },
    "last_updated": {
        "value": null,
        "confidence": 0.0
    },
    "short_description": {
        "value": "S2MAE is a spatial-spectral masked autoencoder foundation model for spectral remote sensing data, employing a 3D transformer with a 90% masking ratio and learnable spectral-spatial embeddings. It is pretrained progressively on large-scale Sentinel-2 datasets and evaluated on classification and change detection tasks.",
        "confidence": 0.8094
    },
    "paper_link": {
        "value": null,
        "confidence": 0.0
    },
    "citations": {
        "value": null,
        "confidence": 0.0
    },
    "repository": {
        "value": null,
        "confidence": 0.0
    },
    "weights": {
        "value": null,
        "confidence": 0.0
    },
    "backbone": {
        "value": "ViT (Vision Transformer)",
        "confidence": 0.8914
    },
    "num_layers": {
        "value": null,
        "confidence": 0.0
    },
    "num_parameters": {
        "value": null,
        "confidence": 0.0
    },
    "pretext_training_type": {
        "value": "Masked Image Modeling (MIM)",
        "confidence": 0.8334
    },
    "masking_strategy": {
        "value": "3D random masking with 90% masking ratio",
        "confidence": 0.8185
    },
    "pretraining": {
        "value": "Progressive pretraining on fMoW-S2 and BigEarthNet Sentinel-2 datasets using 3D masked autoencoding with learnable spatial-spectral embeddings.",
        "confidence": 0.7584
    },
    "domain_knowledge": {
        "value": [],
        "confidence": 0.0
    },
    "backbone_modifications": {
        "value": [
            {
                "value": "3D patchification (spatial and spectral)",
                "confidence": 0.3736
            },
            {
                "value": "Learnable spatial-spectral positional embeddings",
                "confidence": 0.7965
            }
        ]
    },
    "supported_sensors": {
        "value": [
            {
                "value": "Sentinel-2",
                "confidence": 1.0
            }
        ]
    },
    "modality_integration_type": {
        "value": "Unimodal",
        "confidence": 1.0
    },
    "modalities": {
        "value": [
            {
                "value": "Multispectral",
                "confidence": 1.0
            }
        ]
    },
    "spectral_alignment": {
        "value": "full",
        "confidence": 0.9989
    },
    "temporal_alignment": {
        "value": "none",
        "confidence": 0.9987
    },
    "spatial_resolution": {
        "value": "10m, 20m, 60m",
        "confidence": 0.8922
    },
    "temporal_resolution": {
        "value": null,
        "confidence": 0.0
    },
    "bands": {
        "value": [
            {
                "value": "B1",
                "confidence": 0.9829
            },
            {
                "value": "B2",
                "confidence": 1.0
            },
            {
                "value": "B3",
                "confidence": 1.0
            },
            {
                "value": "B4",
                "confidence": 1.0
            },
            {
                "value": "B5",
                "confidence": 1.0
            },
            {
                "value": "B6",
                "confidence": 1.0
            },
            {
                "value": "B7",
                "confidence": 1.0
            },
            {
                "value": "B8",
                "confidence": 1.0
            },
            {
                "value": "B8A",
                "confidence": 0.9997
            },
            {
                "value": "B9",
                "confidence": 1.0
            },
            {
                "value": "B11",
                "confidence": 0.9978
            },
            {
                "value": "B12",
                "confidence": 1.0
            }
        ]
    },
    "pretraining_phases": [
        {
            "dataset": {
                "value": "fMoW-S2",
                "confidence": 0.9579
            },
            "regions_coverage": {
                "value": [
                    {
                        "value": "Global",
                        "confidence": 0.5268
                    }
                ]
            },
            "time_range": {
                "value": null,
                "confidence": 0.0
            },
            "num_images": {
                "value": 712874,
                "confidence": 1.0
            },
            "token_size": {
                "value": "8x8x3",
                "confidence": 0.9783
            },
            "image_resolution": {
                "value": "96x96x12",
                "confidence": 1.0
            },
            "epochs": {
                "value": 200,
                "confidence": 1.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": "2e-4",
                "confidence": 0.9945
            },
            "augmentations": {
                "value": []
            },
            "processing": {
                "value": []
            },
            "sampling": {
                "value": null,
                "confidence": 0.0
            },
            "processing_level": {
                "value": null,
                "confidence": 0.0
            },
            "cloud_cover": {
                "value": null,
                "confidence": 0.0
            },
            "missing_data": {
                "value": null,
                "confidence": 0.0
            },
            "masking_ratio": {
                "value": 0.9,
                "confidence": 0.9969
            }
        },
        {
            "dataset": {
                "value": "BigEarthNet",
                "confidence": 1.0
            },
            "regions_coverage": {
                "value": [
                    {
                        "value": "Europe (10 countries)",
                        "confidence": 0.525
                    }
                ]
            },
            "time_range": {
                "value": "June 2017 to May 2018",
                "confidence": 0.6842
            },
            "num_images": {
                "value": 354196,
                "confidence": 1.0
            },
            "token_size": {
                "value": "8x8x3",
                "confidence": 1.0
            },
            "image_resolution": {
                "value": "128x128x12",
                "confidence": 1.0
            },
            "epochs": {
                "value": 100,
                "confidence": 1.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": "2e-4",
                "confidence": 0.9972
            },
            "augmentations": {
                "value": []
            },
            "processing": {
                "value": []
            },
            "sampling": {
                "value": null,
                "confidence": 0.0
            },
            "processing_level": {
                "value": null,
                "confidence": 0.0
            },
            "cloud_cover": {
                "value": null,
                "confidence": 0.0
            },
            "missing_data": {
                "value": null,
                "confidence": 0.0
            },
            "masking_ratio": {
                "value": 0.9,
                "confidence": 1.0
            }
        }
    ],
    "benchmarks": [
        {
            "task": {
                "value": "Single-label classification",
                "confidence": 0.7599
            },
            "application": {
                "value": "Land use/land cover classification",
                "confidence": 0.5432
            },
            "dataset": {
                "value": "EuroSAT",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "Top1 Accuracy",
                        "confidence": 0.5716
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 99.19,
                        "confidence": 0.6935
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Sentinel-2",
                        "confidence": 1.0
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": "Europe (34 countries)",
                        "confidence": 0.8215
                    }
                ]
            },
            "original_samples": {
                "value": 27000,
                "confidence": 1.0
            },
            "num_samples": {
                "value": 27000,
                "confidence": 0.9995
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": 10,
                "confidence": 1.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": "64x64",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "B1",
                        "confidence": 0.8792
                    },
                    {
                        "value": "B2",
                        "confidence": 1.0
                    },
                    {
                        "value": "B3",
                        "confidence": 1.0
                    },
                    {
                        "value": "B4",
                        "confidence": 1.0
                    },
                    {
                        "value": "B5",
                        "confidence": 1.0
                    },
                    {
                        "value": "B6",
                        "confidence": 1.0
                    },
                    {
                        "value": "B7",
                        "confidence": 1.0
                    },
                    {
                        "value": "B8",
                        "confidence": 1.0
                    },
                    {
                        "value": "B8A",
                        "confidence": 1.0
                    },
                    {
                        "value": "B9",
                        "confidence": 1.0
                    },
                    {
                        "value": "B11",
                        "confidence": 1.0
                    },
                    {
                        "value": "B12",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": "weight decay (0.05)",
                        "confidence": 0.924
                    },
                    {
                        "value": "drop path (0.1)",
                        "confidence": 0.9999
                    },
                    {
                        "value": "reprob (0.25)",
                        "confidence": 0.9959
                    },
                    {
                        "value": "mixup (0.8)",
                        "confidence": 1.0
                    },
                    {
                        "value": "cutmix (1.0)",
                        "confidence": 1.0
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": 512,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0002,
                "confidence": 0.9998
            },
            "epochs": {
                "value": 150,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Cross-entropy",
                "confidence": 0.782
            },
            "split_ratio": {
                "value": "train/validation as in [29]",
                "confidence": 0.3324
            }
        },
        {
            "task": {
                "value": "Multi-label classification",
                "confidence": 0.9999
            },
            "application": {
                "value": "Scene classification",
                "confidence": 0.5782
            },
            "dataset": {
                "value": "BigEarthNet",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "mAP",
                        "confidence": 0.7252
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 87.41,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Sentinel-2",
                        "confidence": 1.0
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": "Europe (10 countries)",
                        "confidence": 0.9888
                    }
                ]
            },
            "original_samples": {
                "value": 354196,
                "confidence": 0.9623
            },
            "num_samples": {
                "value": 35419,
                "confidence": 0.9817
            },
            "sampling_percentage": {
                "value": 10,
                "confidence": 1.0
            },
            "num_classes": {
                "value": 19,
                "confidence": 1.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "spatial_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "B1",
                        "confidence": 0.9973
                    },
                    {
                        "value": "B2",
                        "confidence": 1.0
                    },
                    {
                        "value": "B3",
                        "confidence": 1.0
                    },
                    {
                        "value": "B4",
                        "confidence": 1.0
                    },
                    {
                        "value": "B5",
                        "confidence": 1.0
                    },
                    {
                        "value": "B6",
                        "confidence": 1.0
                    },
                    {
                        "value": "B7",
                        "confidence": 1.0
                    },
                    {
                        "value": "B8",
                        "confidence": 1.0
                    },
                    {
                        "value": "B8A",
                        "confidence": 1.0
                    },
                    {
                        "value": "B9",
                        "confidence": 1.0
                    },
                    {
                        "value": "B11",
                        "confidence": 1.0
                    },
                    {
                        "value": "B12",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": null,
                "confidence": 0.0
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 0.9818
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 0.0002,
                "confidence": 1.0
            },
            "epochs": {
                "value": 40,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Multi-label soft margin loss",
                "confidence": 0.8593
            },
            "split_ratio": {
                "value": "train/validation as in [29]",
                "confidence": 0.935
            }
        },
        {
            "task": {
                "value": "Change detection",
                "confidence": 0.9093
            },
            "application": {
                "value": "Urban change detection",
                "confidence": 0.9497
            },
            "dataset": {
                "value": "OSCD",
                "confidence": 0.9165
            },
            "metrics": {
                "value": [
                    {
                        "value": "Precision",
                        "confidence": 0.9995
                    },
                    {
                        "value": "Recall",
                        "confidence": 1.0
                    },
                    {
                        "value": "F1",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 54.9,
                        "confidence": 0.65
                    },
                    {
                        "value": 56.81,
                        "confidence": 1.0
                    },
                    {
                        "value": 54.26,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Sentinel-2",
                        "confidence": 1.0
                    }
                ]
            },
            "regions": {
                "value": null,
                "confidence": 0.0
            },
            "original_samples": {
                "value": 24,
                "confidence": 0.9984
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": 2,
                "confidence": 1.0
            },
            "classes": {
                "value": [
                    {
                        "value": "change",
                        "confidence": 0.5157
                    },
                    {
                        "value": "no change",
                        "confidence": 0.9208
                    }
                ]
            },
            "image_resolution": {
                "value": "128x128",
                "confidence": 0.9665
            },
            "spatial_resolution": {
                "value": "10m, 20m, 60m",
                "confidence": 0.7966
            },
            "bands_used": {
                "value": [
                    {
                        "value": "B1",
                        "confidence": 0.9475
                    },
                    {
                        "value": "B2",
                        "confidence": 1.0
                    },
                    {
                        "value": "B3",
                        "confidence": 1.0
                    },
                    {
                        "value": "B4",
                        "confidence": 1.0
                    },
                    {
                        "value": "B5",
                        "confidence": 1.0
                    },
                    {
                        "value": "B6",
                        "confidence": 1.0
                    },
                    {
                        "value": "B7",
                        "confidence": 1.0
                    },
                    {
                        "value": "B8",
                        "confidence": 1.0
                    },
                    {
                        "value": "B8A",
                        "confidence": 1.0
                    },
                    {
                        "value": "B9",
                        "confidence": 1.0
                    },
                    {
                        "value": "B11",
                        "confidence": 0.9469
                    },
                    {
                        "value": "B12",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": "random flips",
                        "confidence": 0.8071
                    },
                    {
                        "value": "rotations",
                        "confidence": 0.8085
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 0.9968
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 0.0002,
                "confidence": 1.0
            },
            "epochs": {
                "value": 50,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Cross-entropy",
                "confidence": 0.9698
            },
            "split_ratio": {
                "value": "14 train / 10 test",
                "confidence": 0.4349
            }
        }
    ]
}