{
    "model_id": {
        "value": "ViT-G12x4-MAE-MillionAID",
        "confidence": 0.7553
    },
    "model_name": {
        "value": "ViT-G12x4",
        "confidence": 0.9889
    },
    "version": {
        "value": "1.0",
        "confidence": 0.9518
    },
    "release_date": {
        "value": null,
        "confidence": 0.0
    },
    "last_updated": {
        "value": null,
        "confidence": 0.0
    },
    "short_description": {
        "value": "First billion-scale vision transformer foundation model for remote sensing, pretrained with MAE on MillionAID and evaluated on rotated object detection and semantic segmentation tasks.",
        "confidence": 0.8099
    },
    "paper_link": {
        "value": "https://arxiv.org/abs/2304.05215",
        "confidence": 0.9994
    },
    "citations": {
        "value": null,
        "confidence": 0.0
    },
    "repository": {
        "value": null,
        "confidence": 0.0
    },
    "weights": {
        "value": null,
        "confidence": 0.0
    },
    "backbone": {
        "value": "Vision Transformer (ViT-G12x4)",
        "confidence": 0.8667
    },
    "num_layers": {
        "value": 12,
        "confidence": 1.0
    },
    "num_parameters": {
        "value": 2420000000,
        "confidence": 0.9828
    },
    "pretext_training_type": {
        "value": "Masked Image Modeling (MAE)",
        "confidence": 0.8216
    },
    "masking_strategy": {
        "value": "Random masking of 75% of patches",
        "confidence": 0.8177
    },
    "pretraining": {
        "value": "Self-supervised pretraining with MAE on MillionAID dataset, using random masking and reconstruction of masked patches.",
        "confidence": 0.6708
    },
    "domain_knowledge": {
        "value": [],
        "confidence": 0.0
    },
    "backbone_modifications": {
        "value": [
            {
                "value": "Parallelism in transformer layers (4-way parallel)",
                "confidence": 0.4204
            },
            {
                "value": "Increased hidden size (2048)",
                "confidence": 0.6096
            },
            {
                "value": "Increased MLP size (8192)",
                "confidence": 0.7747
            },
            {
                "value": "Increased number of heads (32)",
                "confidence": 0.5804
            }
        ]
    },
    "supported_sensors": {
        "value": [
            {
                "value": "Google Earth imagery",
                "confidence": 0.8526
            }
        ]
    },
    "modality_integration_type": {
        "value": "Unimodal",
        "confidence": 1.0
    },
    "modalities": {
        "value": [
            {
                "value": "RGB",
                "confidence": 0.7654
            }
        ]
    },
    "spectral_alignment": {
        "value": "none",
        "confidence": 0.9974
    },
    "temporal_alignment": {
        "value": "none",
        "confidence": 1.0
    },
    "spatial_resolution": {
        "value": "0.5m to 153m",
        "confidence": 0.8462
    },
    "temporal_resolution": {
        "value": null,
        "confidence": 0.0
    },
    "bands": {
        "value": [
            {
                "value": "R",
                "confidence": 0.933
            },
            {
                "value": "G",
                "confidence": 1.0
            },
            {
                "value": "B",
                "confidence": 1.0
            }
        ]
    },
    "pretraining_phases": [
        {
            "dataset": {
                "value": "MillionAID",
                "confidence": 1.0
            },
            "regions_coverage": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "time_range": {
                "value": null,
                "confidence": 0.0
            },
            "num_images": {
                "value": 1000848,
                "confidence": 1.0
            },
            "token_size": {
                "value": "16x16",
                "confidence": 0.9992
            },
            "image_resolution": {
                "value": "224x224",
                "confidence": 0.9997
            },
            "epochs": {
                "value": 400,
                "confidence": 1.0
            },
            "batch_size": {
                "value": 2048,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": "0.0001 (base LR, effective LR = batch_size * base LR / 256)",
                "confidence": 0.3075
            },
            "augmentations": {
                "value": [
                    {
                        "value": "RandomResizedCrop",
                        "confidence": 0.7242
                    },
                    {
                        "value": "HorizontalFlip",
                        "confidence": 0.6839
                    },
                    {
                        "value": "VerticalFlip",
                        "confidence": 1.0
                    }
                ]
            },
            "processing": {
                "value": [
                    {
                        "value": "Resize",
                        "confidence": 0.7643
                    },
                    {
                        "value": "Crop",
                        "confidence": 0.8681
                    },
                    {
                        "value": "Patchify (16x16)",
                        "confidence": 0.3853
                    }
                ]
            },
            "sampling": {
                "value": "Full dataset used",
                "confidence": 0.3395
            },
            "processing_level": {
                "value": null,
                "confidence": 0.0
            },
            "cloud_cover": {
                "value": null,
                "confidence": 0.0
            },
            "missing_data": {
                "value": null,
                "confidence": 0.0
            },
            "masking_ratio": {
                "value": 0.75,
                "confidence": 1.0
            }
        }
    ],
    "benchmarks": [
        {
            "task": {
                "value": "Rotated Object Detection",
                "confidence": 0.8185
            },
            "application": {
                "value": "Aerial object detection",
                "confidence": 0.5093
            },
            "dataset": {
                "value": "DOTA v2.0",
                "confidence": 0.9998
            },
            "metrics": {
                "value": [
                    {
                        "value": "mAP",
                        "confidence": 0.9688
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 58.69,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Multiple sources (DOTA)",
                        "confidence": 0.337
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": 11268,
                "confidence": 0.9858
            },
            "num_samples": {
                "value": 11268,
                "confidence": 0.9194
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": 18,
                "confidence": 1.0
            },
            "classes": {
                "value": [
                    {
                        "value": "Plane",
                        "confidence": 0.6454
                    },
                    {
                        "value": "Baseball diamond",
                        "confidence": 0.932
                    },
                    {
                        "value": "Bridge",
                        "confidence": 1.0
                    },
                    {
                        "value": "Ground track field",
                        "confidence": 0.9972
                    },
                    {
                        "value": "Small-vehicle",
                        "confidence": 0.9794
                    },
                    {
                        "value": "Large-vehicle",
                        "confidence": 1.0
                    },
                    {
                        "value": "Ship",
                        "confidence": 1.0
                    },
                    {
                        "value": "Tennis-court",
                        "confidence": 0.9996
                    },
                    {
                        "value": "Basketball-court",
                        "confidence": 0.9997
                    },
                    {
                        "value": "Storage-tank",
                        "confidence": 0.9998
                    },
                    {
                        "value": "Soccer-ball field",
                        "confidence": 0.9998
                    },
                    {
                        "value": "Roundabout",
                        "confidence": 1.0
                    },
                    {
                        "value": "Harbor",
                        "confidence": 1.0
                    },
                    {
                        "value": "Swimming-pool",
                        "confidence": 0.9995
                    },
                    {
                        "value": "Helicopter",
                        "confidence": 1.0
                    },
                    {
                        "value": "Container-crane",
                        "confidence": 0.9999
                    },
                    {
                        "value": "Airport",
                        "confidence": 1.0
                    },
                    {
                        "value": "Helipad",
                        "confidence": 1.0
                    }
                ]
            },
            "image_resolution": {
                "value": "800x800 to 20000x20000",
                "confidence": 0.9466
            },
            "spatial_resolution": {
                "value": "variable",
                "confidence": 0.7635
            },
            "bands_used": {
                "value": [
                    {
                        "value": "R",
                        "confidence": 0.9668
                    },
                    {
                        "value": "G",
                        "confidence": 1.0
                    },
                    {
                        "value": "B",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": "RandomHorizontalFlip",
                        "confidence": 0.9076
                    },
                    {
                        "value": "RandomVerticalFlip",
                        "confidence": 0.9999
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": 2,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0001,
                "confidence": 1.0
            },
            "epochs": {
                "value": 12,
                "confidence": 1.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": "train: 1830, val: 593, test-dev: 2792, test-challenge: 6053",
                "confidence": 0.3282
            }
        },
        {
            "task": {
                "value": "Rotated Object Detection",
                "confidence": 1.0
            },
            "application": {
                "value": "Aerial object detection",
                "confidence": 0.9997
            },
            "dataset": {
                "value": "DIOR-R",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "mAP",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 73.62,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Multiple sources (DIOR-R)",
                        "confidence": 0.653
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": 11738,
                "confidence": 0.97
            },
            "num_samples": {
                "value": 11738,
                "confidence": 1.0
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": 20,
                "confidence": 1.0
            },
            "classes": {
                "value": [
                    {
                        "value": "Airplane",
                        "confidence": 0.9998
                    },
                    {
                        "value": "Airport",
                        "confidence": 1.0
                    },
                    {
                        "value": "Baseball field",
                        "confidence": 0.9991
                    },
                    {
                        "value": "Basketball court",
                        "confidence": 0.9991
                    },
                    {
                        "value": "Bridge",
                        "confidence": 1.0
                    },
                    {
                        "value": "Chimney",
                        "confidence": 1.0
                    },
                    {
                        "value": "Dam",
                        "confidence": 1.0
                    },
                    {
                        "value": "Expressway-toll-station",
                        "confidence": 0.9978
                    },
                    {
                        "value": "Expressway-service-area",
                        "confidence": 0.9954
                    },
                    {
                        "value": "Golf field",
                        "confidence": 0.9977
                    },
                    {
                        "value": "Ground track field",
                        "confidence": 0.9838
                    },
                    {
                        "value": "Harbor",
                        "confidence": 1.0
                    },
                    {
                        "value": "Overpass",
                        "confidence": 1.0
                    },
                    {
                        "value": "Ship",
                        "confidence": 1.0
                    },
                    {
                        "value": "Stadium",
                        "confidence": 1.0
                    },
                    {
                        "value": "Storage tank",
                        "confidence": 0.9991
                    },
                    {
                        "value": "Tennis court",
                        "confidence": 0.9996
                    },
                    {
                        "value": "Train station",
                        "confidence": 0.9996
                    },
                    {
                        "value": "Vehicle",
                        "confidence": 1.0
                    },
                    {
                        "value": "Windmill",
                        "confidence": 1.0
                    }
                ]
            },
            "image_resolution": {
                "value": "800x800",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "0.5m to 30m",
                "confidence": 0.9783
            },
            "bands_used": {
                "value": [
                    {
                        "value": "R",
                        "confidence": 1.0
                    },
                    {
                        "value": "G",
                        "confidence": 1.0
                    },
                    {
                        "value": "B",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": "RandomHorizontalFlip",
                        "confidence": 1.0
                    },
                    {
                        "value": "RandomVerticalFlip",
                        "confidence": 1.0
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": 2,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0001,
                "confidence": 1.0
            },
            "epochs": {
                "value": 12,
                "confidence": 1.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": "train/val/test: published splits",
                "confidence": 0.3112
            }
        },
        {
            "task": {
                "value": "Semantic Segmentation",
                "confidence": 0.9837
            },
            "application": {
                "value": "Land cover segmentation",
                "confidence": 0.4469
            },
            "dataset": {
                "value": "Potsdam",
                "confidence": 0.994
            },
            "metrics": {
                "value": [
                    {
                        "value": "mF1",
                        "confidence": 0.9012
                    },
                    {
                        "value": "OA",
                        "confidence": 0.9732
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 92.12,
                        "confidence": 0.9469
                    },
                    {
                        "value": 92.58,
                        "confidence": 0.7357
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Aerial imagery (ISPRS Potsdam)",
                        "confidence": 0.3482
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": 38,
                "confidence": 0.8946
            },
            "num_samples": {
                "value": 38,
                "confidence": 0.9854
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": 5,
                "confidence": 0.9987
            },
            "classes": {
                "value": [
                    {
                        "value": "Impervious surfaces",
                        "confidence": 0.8666
                    },
                    {
                        "value": "Building",
                        "confidence": 0.7357
                    },
                    {
                        "value": "Low vegetation",
                        "confidence": 0.9962
                    },
                    {
                        "value": "Tree",
                        "confidence": 1.0
                    },
                    {
                        "value": "Car",
                        "confidence": 1.0
                    }
                ]
            },
            "image_resolution": {
                "value": "6000x6000",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "0.05m",
                "confidence": 0.9999
            },
            "bands_used": {
                "value": [
                    {
                        "value": "R",
                        "confidence": 0.9995
                    },
                    {
                        "value": "G",
                        "confidence": 1.0
                    },
                    {
                        "value": "B",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": "Resize",
                        "confidence": 0.9865
                    },
                    {
                        "value": "Crop (512x512, stride 384)",
                        "confidence": 0.4445
                    },
                    {
                        "value": "HorizontalFlip",
                        "confidence": 0.6302
                    },
                    {
                        "value": "PhotometricDistortion",
                        "confidence": 0.9817
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 6e-05,
                "confidence": 1.0
            },
            "epochs": {
                "value": null,
                "confidence": 0.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": "train: 24, test: 14",
                "confidence": 0.7064
            }
        },
        {
            "task": {
                "value": "Semantic Segmentation",
                "confidence": 1.0
            },
            "application": {
                "value": "Land cover segmentation",
                "confidence": 0.9514
            },
            "dataset": {
                "value": "LoveDA",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "mIoU",
                        "confidence": 0.9999
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 54.4,
                        "confidence": 0.9839
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Aerial imagery (LoveDA)",
                        "confidence": 0.7673
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": 5987,
                "confidence": 0.7741
            },
            "num_samples": {
                "value": 5987,
                "confidence": 0.9998
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": 6,
                "confidence": 0.9923
            },
            "classes": {
                "value": [
                    {
                        "value": "Building",
                        "confidence": 0.9785
                    },
                    {
                        "value": "Road",
                        "confidence": 1.0
                    },
                    {
                        "value": "Water",
                        "confidence": 1.0
                    },
                    {
                        "value": "Barren",
                        "confidence": 1.0
                    },
                    {
                        "value": "Forest",
                        "confidence": 0.9993
                    },
                    {
                        "value": "Agriculture",
                        "confidence": 0.9958
                    }
                ]
            },
            "image_resolution": {
                "value": "1024x1024",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "0.3m",
                "confidence": 1.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "R",
                        "confidence": 1.0
                    },
                    {
                        "value": "G",
                        "confidence": 1.0
                    },
                    {
                        "value": "B",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": "Resize",
                        "confidence": 0.9618
                    },
                    {
                        "value": "Crop (512x512)",
                        "confidence": 0.711
                    },
                    {
                        "value": "HorizontalFlip",
                        "confidence": 0.9767
                    },
                    {
                        "value": "PhotometricDistortion",
                        "confidence": 1.0
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 6e-05,
                "confidence": 1.0
            },
            "epochs": {
                "value": null,
                "confidence": 0.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": "train: 2522, val: 1669, test: 1796",
                "confidence": 0.872
            }
        }
    ]
}