{
    "model_id": {
        "value": "SMLFR-ConvNeXt",
        "confidence": 0.9897
    },
    "model_name": {
        "value": "SMLFR-ConvNeXt",
        "confidence": 0.9981
    },
    "version": {
        "value": "1.0",
        "confidence": 0.9006
    },
    "release_date": {
        "value": "2024-01-01",
        "confidence": 1.0
    },
    "last_updated": {
        "value": "2024-01-11",
        "confidence": 0.9996
    },
    "short_description": {
        "value": "A generative ConvNet foundation model for remote sensing image interpretation, pretrained on the large-scale GeoSense dataset (~9 million images) using a sparse modeling and low-frequency reconstruction (SMLFR) self-supervised learning framework. Achieves state-of-the-art results on object detection, semantic segmentation, and change detection benchmarks.",
        "confidence": 0.8356
    },
    "paper_link": {
        "value": "https://doi.org/10.1109/TGRS.2023.3348479",
        "confidence": 0.9913
    },
    "citations": {
        "value": null,
        "confidence": 0.0
    },
    "repository": {
        "value": "https://github.com/HIT-SIRS/SMLFR",
        "confidence": 1.0
    },
    "weights": {
        "value": null,
        "confidence": 0.0
    },
    "backbone": {
        "value": "ConvNeXt (B and L variants)",
        "confidence": 0.7833
    },
    "num_layers": {
        "value": null,
        "confidence": 0.0
    },
    "num_parameters": {
        "value": null,
        "confidence": 0.0
    },
    "pretext_training_type": {
        "value": "Self-supervised masked image modeling (MIM) with sparse modeling and low-frequency reconstruction",
        "confidence": 0.897
    },
    "masking_strategy": {
        "value": "Random masking with 0.6 masking ratio, mask patch size 32",
        "confidence": 0.814
    },
    "pretraining": {
        "value": "Self-supervised pretraining on GeoSense using SMLFR: sparse modeling (masked image modeling with sparse convolution) and low-frequency reconstruction (DFT-based low-pass filtering as target)",
        "confidence": 0.6626
    },
    "domain_knowledge": {
        "value": [
            {
                "value": "Sparse convolution",
                "confidence": 0.6324
            },
            {
                "value": "Low-frequency reconstruction",
                "confidence": 0.7691
            },
            {
                "value": "Remote sensing-specific data diversity",
                "confidence": 0.6902
            }
        ]
    },
    "backbone_modifications": {
        "value": [
            {
                "value": "Submanifold sparse convolution layers",
                "confidence": 0.6663
            },
            {
                "value": "Skip connections in encoder-decoder",
                "confidence": 0.6391
            },
            {
                "value": "Mask token filling for sparse maps",
                "confidence": 0.5093
            }
        ]
    },
    "supported_sensors": {
        "value": [
            {
                "value": "Sentinel-2",
                "confidence": 1.0
            },
            {
                "value": "Gaofen",
                "confidence": 0.9982
            },
            {
                "value": "Landsat",
                "confidence": 1.0
            },
            {
                "value": "QuickBird",
                "confidence": 0.9997
            },
            {
                "value": "Google Earth",
                "confidence": 0.9707
            },
            {
                "value": "JL-1",
                "confidence": 0.9443
            }
        ]
    },
    "modality_integration_type": {
        "value": "Unimodal",
        "confidence": 1.0
    },
    "modalities": {
        "value": [
            {
                "value": "Multispectral",
                "confidence": 0.9992
            },
            {
                "value": "RGB",
                "confidence": 0.8615
            }
        ]
    },
    "spectral_alignment": {
        "value": "none",
        "confidence": 0.6357
    },
    "temporal_alignment": {
        "value": "none",
        "confidence": 1.0
    },
    "spatial_resolution": {
        "value": "variable (0.05m to 150m)",
        "confidence": 0.8677
    },
    "temporal_resolution": {
        "value": null,
        "confidence": 0.0
    },
    "bands": {
        "value": [
            {
                "value": "RGB",
                "confidence": 0.7057
            },
            {
                "value": "Multispectral",
                "confidence": 0.5001
            }
        ]
    },
    "pretraining_phases": [
        {
            "dataset": {
                "value": "GeoSense",
                "confidence": 1.0
            },
            "regions_coverage": {
                "value": [
                    {
                        "value": "Asia",
                        "confidence": 0.9999
                    },
                    {
                        "value": "Europe",
                        "confidence": 1.0
                    },
                    {
                        "value": "North America",
                        "confidence": 1.0
                    },
                    {
                        "value": "South America",
                        "confidence": 1.0
                    },
                    {
                        "value": "Africa",
                        "confidence": 1.0
                    },
                    {
                        "value": "Oceania",
                        "confidence": 1.0
                    }
                ]
            },
            "time_range": {
                "value": null,
                "confidence": 0.0
            },
            "num_images": {
                "value": 8916233,
                "confidence": 1.0
            },
            "token_size": {
                "value": "32x32 patch",
                "confidence": 0.4999
            },
            "image_resolution": {
                "value": "224x224",
                "confidence": 0.9997
            },
            "epochs": {
                "value": 400,
                "confidence": 1.0
            },
            "batch_size": {
                "value": 1024,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": "cosine-annealing, peak=0.0002*batchsize/256",
                "confidence": 0.3537
            },
            "augmentations": {
                "value": [
                    {
                        "value": "horizontal flipping",
                        "confidence": 0.5727
                    },
                    {
                        "value": "random cropping",
                        "confidence": 1.0
                    }
                ]
            },
            "processing": {
                "value": [
                    {
                        "value": "cropping to 224x224",
                        "confidence": 0.5112
                    },
                    {
                        "value": "normalization",
                        "confidence": 0.9901
                    },
                    {
                        "value": "standardization (mean/var computed on GeoSense)",
                        "confidence": 0.3186
                    }
                ]
            },
            "sampling": {
                "value": "Random masking (mask ratio 0.6)",
                "confidence": 0.3164
            },
            "processing_level": {
                "value": null,
                "confidence": 0.0
            },
            "cloud_cover": {
                "value": null,
                "confidence": 0.0
            },
            "missing_data": {
                "value": null,
                "confidence": 0.0
            },
            "masking_ratio": {
                "value": 0.6,
                "confidence": 1.0
            }
        }
    ],
    "benchmarks": [
        {
            "task": {
                "value": "Object Detection",
                "confidence": 0.7177
            },
            "application": {
                "value": "Aerial object detection",
                "confidence": 0.4754
            },
            "dataset": {
                "value": "DOTA v1.0",
                "confidence": 0.9998
            },
            "metrics": {
                "value": [
                    {
                        "value": "mAP",
                        "confidence": 0.9351
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 76.23,
                        "confidence": 0.306
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Google Earth",
                        "confidence": 0.9804
                    },
                    {
                        "value": "GF-2",
                        "confidence": 0.9981
                    },
                    {
                        "value": "JL-1",
                        "confidence": 1.0
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": "Various (global)",
                        "confidence": 0.3073
                    }
                ]
            },
            "original_samples": {
                "value": 2806,
                "confidence": 0.9901
            },
            "num_samples": {
                "value": 2806,
                "confidence": 0.9887
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": 15,
                "confidence": 1.0
            },
            "classes": {
                "value": [
                    {
                        "value": "plane",
                        "confidence": 0.9983
                    },
                    {
                        "value": "ship",
                        "confidence": 1.0
                    },
                    {
                        "value": "storage tank",
                        "confidence": 1.0
                    },
                    {
                        "value": "baseball diamond",
                        "confidence": 1.0
                    },
                    {
                        "value": "tennis court",
                        "confidence": 1.0
                    },
                    {
                        "value": "basketball court",
                        "confidence": 1.0
                    },
                    {
                        "value": "ground track field",
                        "confidence": 1.0
                    },
                    {
                        "value": "harbor",
                        "confidence": 1.0
                    },
                    {
                        "value": "bridge",
                        "confidence": 1.0
                    },
                    {
                        "value": "large vehicle",
                        "confidence": 1.0
                    },
                    {
                        "value": "small vehicle",
                        "confidence": 1.0
                    },
                    {
                        "value": "helicopter",
                        "confidence": 1.0
                    },
                    {
                        "value": "roundabout",
                        "confidence": 1.0
                    },
                    {
                        "value": "soccer ball field",
                        "confidence": 0.9998
                    },
                    {
                        "value": "swimming pool",
                        "confidence": 1.0
                    }
                ]
            },
            "image_resolution": {
                "value": "800x800 to 4000x4000",
                "confidence": 0.9372
            },
            "spatial_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 0.9911
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": "random horizontal flip",
                        "confidence": 0.6556
                    },
                    {
                        "value": "random vertical flip",
                        "confidence": 0.6934
                    },
                    {
                        "value": "random diagonal flip",
                        "confidence": 0.9833
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": 16,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0001,
                "confidence": 1.0
            },
            "epochs": {
                "value": 12,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "cross-entropy (class), smooth L1 (bbox)",
                "confidence": 0.3562
            },
            "split_ratio": {
                "value": "1411 train / 458 val / 937 test",
                "confidence": 0.5834
            }
        },
        {
            "task": {
                "value": "Object Detection",
                "confidence": 1.0
            },
            "application": {
                "value": "Aerial object detection",
                "confidence": 0.8059
            },
            "dataset": {
                "value": "DIOR-R",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "mAP",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 60.45,
                        "confidence": 0.301
                    }
                ]
            },
            "sensor": {
                "value": null,
                "confidence": 0.0
            },
            "regions": {
                "value": null,
                "confidence": 0.0
            },
            "original_samples": {
                "value": 23463,
                "confidence": 0.9998
            },
            "num_samples": {
                "value": 23463,
                "confidence": 0.9988
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": 20,
                "confidence": 1.0
            },
            "classes": {
                "value": [
                    {
                        "value": "airplane",
                        "confidence": 1.0
                    },
                    {
                        "value": "airport",
                        "confidence": 1.0
                    },
                    {
                        "value": "baseball field",
                        "confidence": 0.9901
                    },
                    {
                        "value": "basketball court",
                        "confidence": 1.0
                    },
                    {
                        "value": "bridge",
                        "confidence": 1.0
                    },
                    {
                        "value": "chimney",
                        "confidence": 1.0
                    },
                    {
                        "value": "dam",
                        "confidence": 1.0
                    },
                    {
                        "value": "expressway service area",
                        "confidence": 0.9999
                    },
                    {
                        "value": "expressway toll station",
                        "confidence": 1.0
                    },
                    {
                        "value": "golf field",
                        "confidence": 1.0
                    },
                    {
                        "value": "ground track field",
                        "confidence": 0.9997
                    },
                    {
                        "value": "harbor",
                        "confidence": 1.0
                    },
                    {
                        "value": "overpass",
                        "confidence": 1.0
                    },
                    {
                        "value": "ship",
                        "confidence": 1.0
                    },
                    {
                        "value": "stadium",
                        "confidence": 1.0
                    },
                    {
                        "value": "storage tank",
                        "confidence": 1.0
                    },
                    {
                        "value": "tennis court",
                        "confidence": 1.0
                    },
                    {
                        "value": "train station",
                        "confidence": 0.9999
                    },
                    {
                        "value": "vehicle",
                        "confidence": 1.0
                    },
                    {
                        "value": "windmill",
                        "confidence": 1.0
                    }
                ]
            },
            "image_resolution": {
                "value": "800x800",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "0.5m to 30m",
                "confidence": 0.7018
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": "random horizontal flip",
                        "confidence": 0.9971
                    },
                    {
                        "value": "random vertical flip",
                        "confidence": 1.0
                    },
                    {
                        "value": "random diagonal flip",
                        "confidence": 1.0
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": 16,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0001,
                "confidence": 1.0
            },
            "epochs": {
                "value": 12,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "cross-entropy (class), smooth L1 (bbox)",
                "confidence": 0.9997
            },
            "split_ratio": {
                "value": "11725 train / 11738 test",
                "confidence": 0.834
            }
        },
        {
            "task": {
                "value": "Semantic Segmentation",
                "confidence": 0.9999
            },
            "application": {
                "value": "Urban land cover segmentation",
                "confidence": 0.5205
            },
            "dataset": {
                "value": "Potsdam",
                "confidence": 0.8964
            },
            "metrics": {
                "value": [
                    {
                        "value": "mF1",
                        "confidence": 0.6742
                    },
                    {
                        "value": "OA",
                        "confidence": 0.9968
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 87.35,
                        "confidence": 0.388
                    },
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "sensor": {
                "value": null,
                "confidence": 0.0
            },
            "regions": {
                "value": [
                    {
                        "value": "Potsdam, Germany",
                        "confidence": 0.6066
                    }
                ]
            },
            "original_samples": {
                "value": 38,
                "confidence": 1.0
            },
            "num_samples": {
                "value": 38,
                "confidence": 0.9996
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": 6,
                "confidence": 0.9333
            },
            "classes": {
                "value": [
                    {
                        "value": "impervious surfaces",
                        "confidence": 0.9064
                    },
                    {
                        "value": "building",
                        "confidence": 0.9999
                    },
                    {
                        "value": "low vegetation",
                        "confidence": 1.0
                    },
                    {
                        "value": "tree",
                        "confidence": 1.0
                    },
                    {
                        "value": "car",
                        "confidence": 1.0
                    },
                    {
                        "value": "clutter",
                        "confidence": 1.0
                    }
                ]
            },
            "image_resolution": {
                "value": "6000x6000",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "0.05m",
                "confidence": 0.9998
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 0.9965
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": "random scaling (0.5-2.0)",
                        "confidence": 0.5569
                    },
                    {
                        "value": "random flipping",
                        "confidence": 0.9113
                    },
                    {
                        "value": "photometric distortion",
                        "confidence": 0.9999
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": 2,
                "confidence": 0.8587
            },
            "learning_rate": {
                "value": 0.0001,
                "confidence": 1.0
            },
            "epochs": {
                "value": null,
                "confidence": 0.0
            },
            "loss_function": {
                "value": "cross-entropy",
                "confidence": 0.9995
            },
            "split_ratio": {
                "value": "24 train / 14 test",
                "confidence": 0.9989
            }
        },
        {
            "task": {
                "value": "Semantic Segmentation",
                "confidence": 1.0
            },
            "application": {
                "value": "Land cover segmentation",
                "confidence": 0.7622
            },
            "dataset": {
                "value": "LoveDA",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "mIoU",
                        "confidence": 0.9997
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 53.03,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": null,
                "confidence": 0.0
            },
            "regions": {
                "value": [
                    {
                        "value": "Urban",
                        "confidence": 0.5665
                    },
                    {
                        "value": "Rural",
                        "confidence": 0.9997
                    }
                ]
            },
            "original_samples": {
                "value": 5987,
                "confidence": 1.0
            },
            "num_samples": {
                "value": 5987,
                "confidence": 1.0
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": 7,
                "confidence": 0.9839
            },
            "classes": {
                "value": [
                    {
                        "value": "background",
                        "confidence": 0.9996
                    },
                    {
                        "value": "buildings",
                        "confidence": 0.8964
                    },
                    {
                        "value": "roads",
                        "confidence": 0.9989
                    },
                    {
                        "value": "water",
                        "confidence": 1.0
                    },
                    {
                        "value": "barren land",
                        "confidence": 0.9667
                    },
                    {
                        "value": "forests",
                        "confidence": 0.9668
                    },
                    {
                        "value": "agriculture",
                        "confidence": 1.0
                    }
                ]
            },
            "image_resolution": {
                "value": "1024x1024",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 0.9955
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": "random scaling (0.5-2.0)",
                        "confidence": 0.7541
                    },
                    {
                        "value": "random flipping",
                        "confidence": 0.9959
                    },
                    {
                        "value": "photometric distortion",
                        "confidence": 0.9977
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": 2,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0001,
                "confidence": 1.0
            },
            "epochs": {
                "value": null,
                "confidence": 0.0
            },
            "loss_function": {
                "value": "cross-entropy",
                "confidence": 1.0
            },
            "split_ratio": {
                "value": "2522 train / 1669 val / 1796 test",
                "confidence": 0.9663
            }
        },
        {
            "task": {
                "value": "Change Detection",
                "confidence": 1.0
            },
            "application": {
                "value": "Building change detection",
                "confidence": 0.9854
            },
            "dataset": {
                "value": "LEVIR-CD",
                "confidence": 0.9998
            },
            "metrics": {
                "value": [
                    {
                        "value": "F1",
                        "confidence": 0.8418
                    },
                    {
                        "value": "Precision",
                        "confidence": 0.9577
                    },
                    {
                        "value": "Recall",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 91.03,
                        "confidence": 0.3066
                    },
                    {
                        "value": null,
                        "confidence": 0.6
                    },
                    {
                        "value": null,
                        "confidence": 0.6
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Google Earth",
                        "confidence": 0.8697
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": "Texas, USA",
                        "confidence": 0.9993
                    }
                ]
            },
            "original_samples": {
                "value": 637,
                "confidence": 1.0
            },
            "num_samples": {
                "value": 637,
                "confidence": 1.0
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": 2,
                "confidence": 1.0
            },
            "classes": {
                "value": [
                    {
                        "value": "change",
                        "confidence": 0.6072
                    },
                    {
                        "value": "no change",
                        "confidence": 0.8902
                    }
                ]
            },
            "image_resolution": {
                "value": "1024x1024",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "0.5m",
                "confidence": 1.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": "random rotation",
                        "confidence": 0.997
                    },
                    {
                        "value": "random cropping",
                        "confidence": 0.8886
                    },
                    {
                        "value": "random flipping",
                        "confidence": 0.8391
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 0.8439
            },
            "batch_size": {
                "value": 16,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0001,
                "confidence": 1.0
            },
            "epochs": {
                "value": null,
                "confidence": 0.0
            },
            "loss_function": {
                "value": "cross-entropy",
                "confidence": 1.0
            },
            "split_ratio": {
                "value": "445 train / 64 val / 128 test",
                "confidence": 0.9989
            }
        }
    ]
}