{
    "model_id": {
        "value": "RemoteSAM",
        "confidence": 0.7725
    },
    "model_name": {
        "value": "RemoteSAM",
        "confidence": 1.0
    },
    "version": {
        "value": "v1",
        "confidence": 0.6203
    },
    "release_date": {
        "value": "2025-06-02",
        "confidence": 1.0
    },
    "last_updated": {
        "value": "2025-06-02",
        "confidence": 0.9996
    },
    "short_description": {
        "value": "RemoteSAM is a unified visual foundation model for Earth observation, centered on referring expression segmentation. It achieves state-of-the-art performance across pixel-level, region-level, and image-level remote sensing tasks with high parameter efficiency, leveraging a large-scale, semantically diverse dataset (RemoteSAM-270K).",
        "confidence": 0.788
    },
    "paper_link": {
        "value": "https://arxiv.org/abs/2505.18022",
        "confidence": 1.0
    },
    "citations": {
        "value": null,
        "confidence": 0.0
    },
    "repository": {
        "value": "https://github.com/1e12Leon/RemoteSAM",
        "confidence": 1.0
    },
    "weights": {
        "value": null,
        "confidence": 0.0
    },
    "backbone": {
        "value": "Swin-Base (visual encoder) + BERT (text encoder)",
        "confidence": 0.8484
    },
    "num_layers": {
        "value": null,
        "confidence": 0.0
    },
    "num_parameters": {
        "value": 180000000,
        "confidence": 0.8993
    },
    "pretext_training_type": {
        "value": "Referring Expression Segmentation (RES) with multi-task conversion",
        "confidence": 0.7093
    },
    "masking_strategy": {
        "value": "Masking via pseudo-labels from expert models and null masks for absent categories",
        "confidence": 0.6069
    },
    "pretraining": {
        "value": "Trained on RemoteSAM-270K, a large-scale, automatically curated referring expression segmentation dataset with 270K image-text-mask triplets, 297 categories, and 16 attributes. Utilizes VLMs for expression generation and multi-teacher pseudo-labeling.",
        "confidence": 0.7036
    },
    "domain_knowledge": {
        "value": [
            {
                "value": "Hierarchical remote sensing semantic vocabulary (RSVocab-1K)",
                "confidence": 0.724
            },
            {
                "value": "Multi-source dataset integration",
                "confidence": 0.5745
            },
            {
                "value": "Semantic attribute enrichment",
                "confidence": 0.2792
            }
        ]
    },
    "backbone_modifications": {
        "value": [
            {
                "value": "Unified architecture without task-specific heads",
                "confidence": 0.7919
            },
            {
                "value": "Pixel-level output as fundamental computation unit",
                "confidence": 0.5283
            }
        ]
    },
    "supported_sensors": {
        "value": [
            {
                "value": null,
                "confidence": 0.3
            }
        ]
    },
    "modality_integration_type": {
        "value": "Unimodal",
        "confidence": 0.9322
    },
    "modalities": {
        "value": [
            {
                "value": "Multispectral",
                "confidence": 0.716
            },
            {
                "value": "RGB",
                "confidence": 0.7244
            }
        ]
    },
    "spectral_alignment": {
        "value": "none",
        "confidence": 0.933
    },
    "temporal_alignment": {
        "value": "none",
        "confidence": 1.0
    },
    "spatial_resolution": {
        "value": "variable (depends on source datasets; training images are 896x896 pixels)",
        "confidence": 0.709
    },
    "temporal_resolution": {
        "value": "variable",
        "confidence": 0.8116
    },
    "bands": {
        "value": [
            {
                "value": "RGB",
                "confidence": 0.7678
            }
        ]
    },
    "pretraining_phases": [
        {
            "dataset": {
                "value": "RemoteSAM-270K",
                "confidence": 1.0
            },
            "regions_coverage": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "time_range": {
                "value": null,
                "confidence": 0.0
            },
            "num_images": {
                "value": 270000,
                "confidence": 1.0
            },
            "token_size": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": "variable (training at 896x896)",
                "confidence": 0.3294
            },
            "epochs": {
                "value": 40,
                "confidence": 1.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 3e-05,
                "confidence": 0.9998
            },
            "augmentations": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "processing": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "sampling": {
                "value": null,
                "confidence": 0.0
            },
            "processing_level": {
                "value": null,
                "confidence": 0.0
            },
            "cloud_cover": {
                "value": null,
                "confidence": 0.0
            },
            "missing_data": {
                "value": null,
                "confidence": 0.0
            },
            "masking_ratio": {
                "value": null,
                "confidence": 0.0
            }
        }
    ],
    "benchmarks": [
        {
            "task": {
                "value": "Referring Expression Segmentation",
                "confidence": 0.6302
            },
            "application": {
                "value": "Remote sensing object segmentation via natural language",
                "confidence": 0.3087
            },
            "dataset": {
                "value": "RRSIS-D",
                "confidence": 0.9947
            },
            "metrics": {
                "value": [
                    {
                        "value": "mIoU",
                        "confidence": 0.6918
                    },
                    {
                        "value": "oIoU",
                        "confidence": 0.9993
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 71.75,
                        "confidence": 1.0
                    },
                    {
                        "value": 80.04,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": 17402,
                "confidence": 1.0
            },
            "num_samples": {
                "value": 17402,
                "confidence": 1.0
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": 20,
                "confidence": 1.0
            },
            "classes": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "image_resolution": {
                "value": "variable",
                "confidence": 0.8458
            },
            "spatial_resolution": {
                "value": "variable",
                "confidence": 0.9781
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 3e-05,
                "confidence": 0.9991
            },
            "epochs": {
                "value": 40,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Segmentation loss",
                "confidence": 0.6686
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Referring Expression Segmentation",
                "confidence": 0.9983
            },
            "application": {
                "value": "Remote sensing object segmentation via natural language",
                "confidence": 0.9465
            },
            "dataset": {
                "value": "RisBench",
                "confidence": 0.9998
            },
            "metrics": {
                "value": [
                    {
                        "value": "mIoU",
                        "confidence": 1.0
                    },
                    {
                        "value": "oIoU",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 71.46,
                        "confidence": 1.0
                    },
                    {
                        "value": 75.93,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": 52471,
                "confidence": 1.0
            },
            "num_samples": {
                "value": 52471,
                "confidence": 1.0
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": 26,
                "confidence": 1.0
            },
            "classes": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "image_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 3e-05,
                "confidence": 1.0
            },
            "epochs": {
                "value": 40,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Segmentation loss",
                "confidence": 1.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Referring Expression Segmentation",
                "confidence": 0.7353
            },
            "application": {
                "value": "Remote sensing object segmentation via natural language",
                "confidence": 0.942
            },
            "dataset": {
                "value": "RefSegRS",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "mIoU",
                        "confidence": 1.0
                    },
                    {
                        "value": "oIoU",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 65.79,
                        "confidence": 1.0
                    },
                    {
                        "value": 75.49,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": 4420,
                "confidence": 1.0
            },
            "num_samples": {
                "value": 4420,
                "confidence": 1.0
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": 15,
                "confidence": 1.0
            },
            "classes": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "image_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 0.9404
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 3e-05,
                "confidence": 1.0
            },
            "epochs": {
                "value": 40,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Segmentation loss",
                "confidence": 1.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Semantic Segmentation",
                "confidence": 0.999
            },
            "application": {
                "value": "Land cover/scene segmentation",
                "confidence": 0.352
            },
            "dataset": {
                "value": "iSAID",
                "confidence": 0.9949
            },
            "metrics": {
                "value": [
                    {
                        "value": "mIoU",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 64.72,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": 21165,
                "confidence": 1.0
            },
            "num_samples": {
                "value": 21165,
                "confidence": 1.0
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "image_resolution": {
                "value": "variable",
                "confidence": 0.9931
            },
            "spatial_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 0.9333
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 3e-05,
                "confidence": 1.0
            },
            "epochs": {
                "value": 40,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Segmentation loss",
                "confidence": 0.9324
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Semantic Segmentation",
                "confidence": 1.0
            },
            "application": {
                "value": "Land cover/scene segmentation",
                "confidence": 0.7214
            },
            "dataset": {
                "value": "Potsdam",
                "confidence": 0.9994
            },
            "metrics": {
                "value": [
                    {
                        "value": "mF1",
                        "confidence": 0.9579
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 91.8,
                        "confidence": 0.9668
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": 10000,
                "confidence": 1.0
            },
            "num_samples": {
                "value": 10000,
                "confidence": 1.0
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "image_resolution": {
                "value": "variable",
                "confidence": 0.9996
            },
            "spatial_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 3e-05,
                "confidence": 1.0
            },
            "epochs": {
                "value": 40,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Segmentation loss",
                "confidence": 0.9999
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Semantic Segmentation",
                "confidence": 0.6901
            },
            "application": {
                "value": "Land cover/scene segmentation",
                "confidence": 0.5247
            },
            "dataset": {
                "value": "Vaihingen",
                "confidence": 0.9869
            },
            "metrics": {
                "value": [
                    {
                        "value": "mIoU",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 46.0,
                        "confidence": 0.9963
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "image_resolution": {
                "value": "variable",
                "confidence": 0.9946
            },
            "spatial_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 0.9998
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 0.8587
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 3e-05,
                "confidence": 1.0
            },
            "epochs": {
                "value": 40,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Segmentation loss",
                "confidence": 0.9995
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Semantic Segmentation",
                "confidence": 0.7986
            },
            "application": {
                "value": "Land cover/scene segmentation",
                "confidence": 0.997
            },
            "dataset": {
                "value": "UDD5",
                "confidence": 0.9575
            },
            "metrics": {
                "value": [
                    {
                        "value": "mIoU",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 45.6,
                        "confidence": 0.9998
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "image_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 0.9998
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 3e-05,
                "confidence": 1.0
            },
            "epochs": {
                "value": 40,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Segmentation loss",
                "confidence": 1.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Semantic Segmentation",
                "confidence": 1.0
            },
            "application": {
                "value": "Land cover/scene segmentation",
                "confidence": 0.9975
            },
            "dataset": {
                "value": "DeepGlobe",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "mIoU",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 60.5,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "image_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 3e-05,
                "confidence": 1.0
            },
            "epochs": {
                "value": 40,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Segmentation loss",
                "confidence": 1.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Visual Grounding",
                "confidence": 0.7879
            },
            "application": {
                "value": "Object localization via text",
                "confidence": 0.3171
            },
            "dataset": {
                "value": "RSVG",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "AP50",
                        "confidence": 0.9921
                    },
                    {
                        "value": "mIoU",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 74.36,
                        "confidence": 1.0
                    },
                    {
                        "value": 65.07,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "image_resolution": {
                "value": "variable",
                "confidence": 0.9997
            },
            "spatial_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 0.9999
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 0.9165
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 3e-05,
                "confidence": 1.0
            },
            "epochs": {
                "value": 40,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Segmentation loss",
                "confidence": 0.7565
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Multi-label Classification",
                "confidence": 0.7803
            },
            "application": {
                "value": "Scene/object multi-label classification",
                "confidence": 0.3408
            },
            "dataset": {
                "value": "DIOR",
                "confidence": 0.9978
            },
            "metrics": {
                "value": [
                    {
                        "value": "Accuracy",
                        "confidence": 0.6863
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 0.94,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": 20000,
                "confidence": 0.7148
            },
            "num_samples": {
                "value": 20000,
                "confidence": 1.0
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "image_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 0.9874
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 3e-05,
                "confidence": 1.0
            },
            "epochs": {
                "value": 40,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Classification loss",
                "confidence": 0.5726
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Multi-label Classification",
                "confidence": 1.0
            },
            "application": {
                "value": "Scene/object multi-label classification",
                "confidence": 1.0
            },
            "dataset": {
                "value": "DOTA-v2",
                "confidence": 0.6004
            },
            "metrics": {
                "value": [
                    {
                        "value": "Accuracy",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 0.95,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": 20000,
                "confidence": 0.7936
            },
            "num_samples": {
                "value": 20000,
                "confidence": 1.0
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "image_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 3e-05,
                "confidence": 1.0
            },
            "epochs": {
                "value": 40,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Classification loss",
                "confidence": 1.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Object Counting",
                "confidence": 0.8714
            },
            "application": {
                "value": "Object counting",
                "confidence": 0.4834
            },
            "dataset": {
                "value": "DIOR",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "Accuracy",
                        "confidence": 0.9999
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 0.62,
                        "confidence": 0.9739
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": 20000,
                "confidence": 0.9999
            },
            "num_samples": {
                "value": 20000,
                "confidence": 1.0
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "image_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 0.9991
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 3e-05,
                "confidence": 1.0
            },
            "epochs": {
                "value": 40,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Counting loss",
                "confidence": 0.8522
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Object Counting",
                "confidence": 1.0
            },
            "application": {
                "value": "Object counting",
                "confidence": 1.0
            },
            "dataset": {
                "value": "DOTA-v2",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "Accuracy",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 0.409,
                        "confidence": 0.9999
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": 20000,
                "confidence": 0.9995
            },
            "num_samples": {
                "value": 20000,
                "confidence": 1.0
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "image_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 3e-05,
                "confidence": 1.0
            },
            "epochs": {
                "value": 40,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Counting loss",
                "confidence": 1.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Object Detection",
                "confidence": 0.8929
            },
            "application": {
                "value": "Object detection (horizontal bbox)",
                "confidence": 0.4338
            },
            "dataset": {
                "value": "DIOR",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "AP50",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 62.74,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": 20000,
                "confidence": 0.7752
            },
            "num_samples": {
                "value": 20000,
                "confidence": 1.0
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "image_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 0.998
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 3e-05,
                "confidence": 1.0
            },
            "epochs": {
                "value": 40,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Detection loss",
                "confidence": 0.9818
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Object Detection",
                "confidence": 1.0
            },
            "application": {
                "value": "Object detection (horizontal bbox)",
                "confidence": 0.9982
            },
            "dataset": {
                "value": "iSAID",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "AP50",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 34.41,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": 21165,
                "confidence": 0.9953
            },
            "num_samples": {
                "value": 21165,
                "confidence": 1.0
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "image_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 3e-05,
                "confidence": 1.0
            },
            "epochs": {
                "value": 40,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Detection loss",
                "confidence": 1.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Object Detection",
                "confidence": 0.9704
            },
            "application": {
                "value": "Object detection (horizontal bbox)",
                "confidence": 0.8434
            },
            "dataset": {
                "value": "DOTA-v2",
                "confidence": 0.9839
            },
            "metrics": {
                "value": [
                    {
                        "value": "AP50",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 20.17,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": 20000,
                "confidence": 0.7557
            },
            "num_samples": {
                "value": 20000,
                "confidence": 1.0
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "image_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 3e-05,
                "confidence": 1.0
            },
            "epochs": {
                "value": 40,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Detection loss",
                "confidence": 1.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Object Detection",
                "confidence": 0.8908
            },
            "application": {
                "value": "Object detection (oriented bbox)",
                "confidence": 0.9966
            },
            "dataset": {
                "value": "DIOR",
                "confidence": 0.9885
            },
            "metrics": {
                "value": [
                    {
                        "value": "AP50",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 55.22,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": 20000,
                "confidence": 1.0
            },
            "num_samples": {
                "value": 20000,
                "confidence": 1.0
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "image_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 3e-05,
                "confidence": 1.0
            },
            "epochs": {
                "value": 40,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Detection loss",
                "confidence": 1.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Object Detection",
                "confidence": 0.9992
            },
            "application": {
                "value": "Object detection (oriented bbox)",
                "confidence": 1.0
            },
            "dataset": {
                "value": "iSAID",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "AP50",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 34.58,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": 21165,
                "confidence": 1.0
            },
            "num_samples": {
                "value": 21165,
                "confidence": 1.0
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "image_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 3e-05,
                "confidence": 1.0
            },
            "epochs": {
                "value": 40,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Detection loss",
                "confidence": 1.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Object Detection",
                "confidence": 0.9962
            },
            "application": {
                "value": "Object detection (oriented bbox)",
                "confidence": 1.0
            },
            "dataset": {
                "value": "DOTA-v2",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "AP50",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 18.21,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": 20000,
                "confidence": 1.0
            },
            "num_samples": {
                "value": 20000,
                "confidence": 1.0
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "image_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": 3e-05,
                "confidence": 1.0
            },
            "epochs": {
                "value": 40,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Detection loss",
                "confidence": 1.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        }
    ]
}