{
    "model_id": {
        "value": "Omnisat-2024",
        "confidence": 0.6208
    },
    "model_name": {
        "value": "OmniSat",
        "confidence": 0.9999
    },
    "version": {
        "value": "v1",
        "confidence": 0.6656
    },
    "release_date": {
        "value": "2024-07-17",
        "confidence": 0.9636
    },
    "last_updated": {
        "value": "2024-07-17",
        "confidence": 0.9993
    },
    "short_description": {
        "value": "OmniSat is a self-supervised multimodal fusion model for Earth Observation, capable of combining diverse EO modalities (very high resolution images, optical and SAR time series) into expressive features without labels, achieving state-of-the-art results on forestry, land cover, and crop mapping tasks.",
        "confidence": 0.7815
    },
    "paper_link": {
        "value": "https://arxiv.org/abs/2404.08351",
        "confidence": 0.9999
    },
    "citations": {
        "value": null,
        "confidence": 0.0
    },
    "repository": {
        "value": "https://github.com/gastruc/OmniSat",
        "confidence": 1.0
    },
    "weights": {
        "value": null,
        "confidence": 0.0
    },
    "backbone": {
        "value": "Custom multimodal transformer with modality-specific encoders (CNN for images, LTAE for time series) and a modality-combining transformer",
        "confidence": 0.7669
    },
    "num_layers": {
        "value": null,
        "confidence": 0.0
    },
    "num_parameters": {
        "value": 10000000,
        "confidence": 0.9947
    },
    "pretext_training_type": {
        "value": "Cross-modal contrastive learning and multimodal masked autoencoding",
        "confidence": 0.8235
    },
    "masking_strategy": {
        "value": "Random patch masking per modality",
        "confidence": 0.7258
    },
    "pretraining": {
        "value": "Cross-modal contrastive learning and multimodal masked autoencoding leveraging spatial alignment of EO data",
        "confidence": 0.7282
    },
    "domain_knowledge": {
        "value": [
            {
                "value": "Georeferencing-based spatial alignment",
                "confidence": 0.5375
            },
            {
                "value": "Cloud-aware temporal filtering",
                "confidence": 0.5716
            },
            {
                "value": "Relative positional encoding for EO",
                "confidence": 0.6779
            }
        ]
    },
    "backbone_modifications": {
        "value": [
            {
                "value": "Maxpool index bypass from encoder to decoder (SegNet-style)",
                "confidence": 0.7381
            },
            {
                "value": "Lightweight Temporal Attention Encoder (LTAE) for time series",
                "confidence": 0.8325
            },
            {
                "value": "Relative positional encoding",
                "confidence": 0.7405
            }
        ]
    },
    "supported_sensors": {
        "value": [
            {
                "value": "Sentinel-1",
                "confidence": 0.683
            },
            {
                "value": "Sentinel-2",
                "confidence": 1.0
            },
            {
                "value": "SPOT 6-7",
                "confidence": 0.9294
            },
            {
                "value": "VHR aerial imagery",
                "confidence": 0.5217
            }
        ]
    },
    "modality_integration_type": {
        "value": "Heterogeneous Multimodal",
        "confidence": 0.9988
    },
    "modalities": {
        "value": [
            {
                "value": "Multispectral",
                "confidence": 0.8925
            },
            {
                "value": "SAR",
                "confidence": 0.9674
            },
            {
                "value": "RGB",
                "confidence": 0.5486
            },
            {
                "value": "Near-infrared",
                "confidence": 0.6839
            },
            {
                "value": "Time series",
                "confidence": 0.7569
            }
        ]
    },
    "spectral_alignment": {
        "value": "partial",
        "confidence": 0.9327
    },
    "temporal_alignment": {
        "value": "partial",
        "confidence": 0.9332
    },
    "spatial_resolution": {
        "value": "variable (0.2m, 1m, 10m)",
        "confidence": 0.7745
    },
    "temporal_resolution": {
        "value": "variable (10-140 obs/year)",
        "confidence": 0.8372
    },
    "bands": {
        "value": [
            {
                "value": "RGB",
                "confidence": 0.9787
            },
            {
                "value": "NIR",
                "confidence": 0.8088
            },
            {
                "value": "Sentinel-2 10 bands",
                "confidence": 0.8214
            },
            {
                "value": "Sentinel-1 3 bands",
                "confidence": 0.8347
            }
        ]
    },
    "pretraining_phases": [
        {
            "dataset": {
                "value": "TreeSatAI-TS",
                "confidence": 0.9699
            },
            "regions_coverage": {
                "value": [
                    {
                        "value": "Germany",
                        "confidence": 1.0
                    }
                ]
            },
            "time_range": {
                "value": "closest available year to VHR observation",
                "confidence": 0.4596
            },
            "num_images": {
                "value": 50381,
                "confidence": 1.0
            },
            "token_size": {
                "value": "256",
                "confidence": 0.9586
            },
            "image_resolution": {
                "value": "0.2m (VHR), 10m (Sentinel)",
                "confidence": 0.459
            },
            "epochs": {
                "value": 250,
                "confidence": 1.0
            },
            "batch_size": {
                "value": 128,
                "confidence": 0.9668
            },
            "learning_rate": {
                "value": "1e-4",
                "confidence": 0.8957
            },
            "augmentations": {
                "value": []
            },
            "processing": {
                "value": [
                    {
                        "value": "No pre-processing for time series",
                        "confidence": 0.3246
                    },
                    {
                        "value": "Manual selection for single-date images",
                        "confidence": 0.4935
                    }
                ]
            },
            "sampling": {
                "value": "All available tiles",
                "confidence": 0.3644
            },
            "processing_level": {
                "value": null,
                "confidence": 0.0
            },
            "cloud_cover": {
                "value": "No filtering; raw observations included",
                "confidence": 0.3194
            },
            "missing_data": {
                "value": "Cloudy observations present; handled by attention-based date filtering",
                "confidence": 0.3001
            },
            "masking_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "dataset": {
                "value": "PASTIS-HD",
                "confidence": 0.9996
            },
            "regions_coverage": {
                "value": [
                    {
                        "value": "France",
                        "confidence": 0.9456
                    }
                ]
            },
            "time_range": {
                "value": null,
                "confidence": 0.0
            },
            "num_images": {
                "value": 2433,
                "confidence": 0.9998
            },
            "token_size": {
                "value": "256",
                "confidence": 1.0
            },
            "image_resolution": {
                "value": "1m (SPOT 6-7), 10m (Sentinel)",
                "confidence": 0.5417
            },
            "epochs": {
                "value": 250,
                "confidence": 1.0
            },
            "batch_size": {
                "value": 128,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": "1e-4",
                "confidence": 1.0
            },
            "augmentations": {
                "value": []
            },
            "processing": {
                "value": [
                    {
                        "value": "Orthorectification",
                        "confidence": 0.9955
                    },
                    {
                        "value": "Pansharpening",
                        "confidence": 0.9886
                    },
                    {
                        "value": "Resampling to 1m",
                        "confidence": 0.5454
                    },
                    {
                        "value": "8-bit conversion",
                        "confidence": 0.5969
                    }
                ]
            },
            "sampling": {
                "value": "All available tiles",
                "confidence": 0.5527
            },
            "processing_level": {
                "value": null,
                "confidence": 0.0
            },
            "cloud_cover": {
                "value": null,
                "confidence": 0.0
            },
            "missing_data": {
                "value": null,
                "confidence": 0.0
            },
            "masking_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "dataset": {
                "value": "FLAIR",
                "confidence": 1.0
            },
            "regions_coverage": {
                "value": [
                    {
                        "value": "France",
                        "confidence": 1.0
                    }
                ]
            },
            "time_range": {
                "value": null,
                "confidence": 0.0
            },
            "num_images": {
                "value": 77762,
                "confidence": 1.0
            },
            "token_size": {
                "value": "256",
                "confidence": 1.0
            },
            "image_resolution": {
                "value": "0.2m (aerial), 10m (Sentinel-2)",
                "confidence": 0.6602
            },
            "epochs": {
                "value": 250,
                "confidence": 1.0
            },
            "batch_size": {
                "value": 128,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": "1e-4",
                "confidence": 1.0
            },
            "augmentations": {
                "value": []
            },
            "processing": {
                "value": []
            },
            "sampling": {
                "value": "All available tiles",
                "confidence": 0.9827
            },
            "processing_level": {
                "value": null,
                "confidence": 0.0
            },
            "cloud_cover": {
                "value": null,
                "confidence": 0.0
            },
            "missing_data": {
                "value": null,
                "confidence": 0.0
            },
            "masking_ratio": {
                "value": null,
                "confidence": 0.0
            }
        }
    ],
    "benchmarks": [
        {
            "task": {
                "value": "Multi-label classification",
                "confidence": 0.8079
            },
            "application": {
                "value": "Tree species identification",
                "confidence": 0.7133
            },
            "dataset": {
                "value": "TreeSatAI-TS",
                "confidence": 0.9959
            },
            "metrics": {
                "value": [
                    {
                        "value": "Weighted F1",
                        "confidence": 0.7618
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 74.2,
                        "confidence": 0.9952
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "VHR aerial",
                        "confidence": 0.922
                    },
                    {
                        "value": "Sentinel-1",
                        "confidence": 0.8848
                    },
                    {
                        "value": "Sentinel-2",
                        "confidence": 1.0
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": "Germany",
                        "confidence": 1.0
                    }
                ]
            },
            "original_samples": {
                "value": 50381,
                "confidence": 1.0
            },
            "num_samples": {
                "value": 50381,
                "confidence": 0.9986
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": 20,
                "confidence": 0.9983
            },
            "classes": {
                "value": [
                    {
                        "value": "Abies/tree",
                        "confidence": 0.8963
                    },
                    {
                        "value": "Acer/leaf",
                        "confidence": 0.6002
                    },
                    {
                        "value": "Alnus/leaf",
                        "confidence": 1.0
                    },
                    {
                        "value": "Betula/leaf",
                        "confidence": 1.0
                    },
                    {
                        "value": "Cleared",
                        "confidence": 1.0
                    },
                    {
                        "value": "Fagus/leaf",
                        "confidence": 1.0
                    },
                    {
                        "value": "Fraxinus/leaf",
                        "confidence": 1.0
                    },
                    {
                        "value": "Larix/tree",
                        "confidence": 1.0
                    },
                    {
                        "value": "Picea/tree",
                        "confidence": 1.0
                    },
                    {
                        "value": "Pinus/tree",
                        "confidence": 1.0
                    },
                    {
                        "value": "Populus/leaf",
                        "confidence": 1.0
                    },
                    {
                        "value": "Prunus/leaf",
                        "confidence": 1.0
                    },
                    {
                        "value": "Pseudotsuga/tree",
                        "confidence": 1.0
                    },
                    {
                        "value": "Quercus/leaf",
                        "confidence": 1.0
                    },
                    {
                        "value": "Tilia/leaf",
                        "confidence": 1.0
                    },
                    {
                        "value": null,
                        "confidence": 0.0
                    },
                    {
                        "value": null,
                        "confidence": 0.0
                    },
                    {
                        "value": null,
                        "confidence": 0.0
                    },
                    {
                        "value": null,
                        "confidence": 0.0
                    },
                    {
                        "value": null,
                        "confidence": 0.0
                    }
                ]
            },
            "image_resolution": {
                "value": "0.2m (VHR), 10m (Sentinel)",
                "confidence": 0.7881
            },
            "spatial_resolution": {
                "value": "0.2m, 10m",
                "confidence": 0.7124
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 0.9977
                    },
                    {
                        "value": "NIR",
                        "confidence": 0.9887
                    },
                    {
                        "value": "Sentinel-2 10 bands",
                        "confidence": 0.8701
                    },
                    {
                        "value": "Sentinel-1 3 bands",
                        "confidence": 0.9995
                    }
                ]
            },
            "augmentations": {
                "value": []
            },
            "optimizer": {
                "value": "ADAM",
                "confidence": 0.7754
            },
            "batch_size": {
                "value": 128,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0001,
                "confidence": 0.9982
            },
            "epochs": {
                "value": 250,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Sum of cross-modal contrastive and multimodal reconstruction loss",
                "confidence": 0.33
            },
            "split_ratio": {
                "value": "train/val/test not specified",
                "confidence": 0.3321
            }
        },
        {
            "task": {
                "value": "Multi-class classification",
                "confidence": 0.9693
            },
            "application": {
                "value": "Crop type mapping",
                "confidence": 0.6928
            },
            "dataset": {
                "value": "PASTIS-HD",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "Macro F1",
                        "confidence": 0.8865
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 69.9,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "SPOT 6-7",
                        "confidence": 0.9907
                    },
                    {
                        "value": "Sentinel-1",
                        "confidence": 0.9985
                    },
                    {
                        "value": "Sentinel-2",
                        "confidence": 1.0
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": "France",
                        "confidence": 1.0
                    }
                ]
            },
            "original_samples": {
                "value": 2433,
                "confidence": 1.0
            },
            "num_samples": {
                "value": 2433,
                "confidence": 1.0
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": 18,
                "confidence": 1.0
            },
            "classes": {
                "value": [
                    {
                        "value": "Meadow",
                        "confidence": 1.0
                    },
                    {
                        "value": "Soft winter wheat",
                        "confidence": 0.9988
                    },
                    {
                        "value": "Corn",
                        "confidence": 1.0
                    },
                    {
                        "value": "Winter barley",
                        "confidence": 1.0
                    },
                    {
                        "value": "Winter rapeseed",
                        "confidence": 0.9998
                    },
                    {
                        "value": "Spring barley",
                        "confidence": 1.0
                    },
                    {
                        "value": "Sunflower",
                        "confidence": 1.0
                    },
                    {
                        "value": "Grapevine",
                        "confidence": 1.0
                    },
                    {
                        "value": "Beet",
                        "confidence": 1.0
                    },
                    {
                        "value": "Winter triticale",
                        "confidence": 1.0
                    },
                    {
                        "value": "Winter durum wheat",
                        "confidence": 0.9992
                    },
                    {
                        "value": "Fruits, vegetables, flowers",
                        "confidence": 0.9556
                    },
                    {
                        "value": "Potatoes",
                        "confidence": 1.0
                    },
                    {
                        "value": "Leguminous fodder",
                        "confidence": 0.9999
                    },
                    {
                        "value": "Soybeans",
                        "confidence": 1.0
                    },
                    {
                        "value": "Orchard",
                        "confidence": 1.0
                    },
                    {
                        "value": "Mixed cereal",
                        "confidence": 1.0
                    },
                    {
                        "value": "Sorghum",
                        "confidence": 1.0
                    }
                ]
            },
            "image_resolution": {
                "value": "1m (SPOT 6-7), 10m (Sentinel)",
                "confidence": 0.887
            },
            "spatial_resolution": {
                "value": "1m, 10m",
                "confidence": 0.9989
            },
            "bands_used": {
                "value": [
                    {
                        "value": "SPOT 6-7 bands",
                        "confidence": 0.4107
                    },
                    {
                        "value": "Sentinel-2 10 bands",
                        "confidence": 0.9058
                    },
                    {
                        "value": "Sentinel-1 3 bands",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": []
            },
            "optimizer": {
                "value": "ADAM",
                "confidence": 1.0
            },
            "batch_size": {
                "value": 128,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0001,
                "confidence": 1.0
            },
            "epochs": {
                "value": 250,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Sum of cross-modal contrastive and multimodal reconstruction loss",
                "confidence": 0.9966
            },
            "split_ratio": {
                "value": "train/val/test not specified",
                "confidence": 0.9369
            }
        },
        {
            "task": {
                "value": "Multi-class classification",
                "confidence": 0.9787
            },
            "application": {
                "value": "Land cover classification",
                "confidence": 0.8983
            },
            "dataset": {
                "value": "FLAIR",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "Macro F1",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 73.4,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "VHR aerial",
                        "confidence": 0.7347
                    },
                    {
                        "value": "Sentinel-2",
                        "confidence": 1.0
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": "France",
                        "confidence": 1.0
                    }
                ]
            },
            "original_samples": {
                "value": 77762,
                "confidence": 1.0
            },
            "num_samples": {
                "value": 77762,
                "confidence": 1.0
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": 13,
                "confidence": 1.0
            },
            "classes": {
                "value": [
                    {
                        "value": "building",
                        "confidence": 0.9923
                    },
                    {
                        "value": "perv. surface",
                        "confidence": 0.6499
                    },
                    {
                        "value": "imperv. surface",
                        "confidence": 1.0
                    },
                    {
                        "value": "bare soil",
                        "confidence": 1.0
                    },
                    {
                        "value": "water",
                        "confidence": 1.0
                    },
                    {
                        "value": "coniferous",
                        "confidence": 1.0
                    },
                    {
                        "value": "deciduous",
                        "confidence": 1.0
                    },
                    {
                        "value": "brushwood",
                        "confidence": 1.0
                    },
                    {
                        "value": "vineyard",
                        "confidence": 1.0
                    },
                    {
                        "value": "herbaceous",
                        "confidence": 1.0
                    },
                    {
                        "value": "agri. land",
                        "confidence": 0.9463
                    },
                    {
                        "value": "plowed land",
                        "confidence": 1.0
                    },
                    {
                        "value": "other",
                        "confidence": 1.0
                    }
                ]
            },
            "image_resolution": {
                "value": "0.2m (aerial), 10m (Sentinel-2)",
                "confidence": 0.9843
            },
            "spatial_resolution": {
                "value": "0.2m, 10m",
                "confidence": 0.9999
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 0.9786
                    },
                    {
                        "value": "NIR",
                        "confidence": 0.9967
                    },
                    {
                        "value": "DSM",
                        "confidence": 0.604
                    },
                    {
                        "value": "Sentinel-2 10 bands",
                        "confidence": 0.9991
                    }
                ]
            },
            "augmentations": {
                "value": []
            },
            "optimizer": {
                "value": "ADAM",
                "confidence": 1.0
            },
            "batch_size": {
                "value": 128,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0001,
                "confidence": 1.0
            },
            "epochs": {
                "value": 250,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Sum of cross-modal contrastive and multimodal reconstruction loss",
                "confidence": 0.9993
            },
            "split_ratio": {
                "value": "train/val/test not specified",
                "confidence": 0.9999
            }
        }
    ]
}