{
    "model_id": {
        "value": "LHRS-Bot",
        "confidence": 0.9888
    },
    "model_name": {
        "value": "LHRS-Bot",
        "confidence": 1.0
    },
    "version": {
        "value": null,
        "confidence": 0.0
    },
    "release_date": {
        "value": "2024-07-16",
        "confidence": 0.977
    },
    "last_updated": {
        "value": "2024-07-16",
        "confidence": 0.9636
    },
    "short_description": {
        "value": "LHRS-Bot is a large multimodal language model (MLLM) tailored for remote sensing (RS) image understanding, leveraging a novel multi-level vision-language alignment strategy and curriculum learning. It is trained on large-scale RS image-text and instruction datasets constructed from global volunteered geographic information (VGI) and RS imagery.",
        "confidence": 0.8301
    },
    "paper_link": {
        "value": "https://arxiv.org/abs/2402.02544",
        "confidence": 0.9999
    },
    "citations": {
        "value": null,
        "confidence": 0.0
    },
    "repository": {
        "value": "https://github.com/NJU-LHRS/LHRS-Bot",
        "confidence": 1.0
    },
    "weights": {
        "value": null,
        "confidence": 0.0
    },
    "backbone": {
        "value": "CLIP ViT-L/14 + LLaMA2-7B",
        "confidence": 0.8168
    },
    "num_layers": {
        "value": null,
        "confidence": 0.0
    },
    "num_parameters": {
        "value": null,
        "confidence": 0.0
    },
    "pretext_training_type": {
        "value": "Multi-level vision-language alignment with curriculum learning",
        "confidence": 0.9196
    },
    "masking_strategy": {
        "value": null,
        "confidence": 0.0
    },
    "pretraining": {
        "value": "Three-stage curriculum learning: (1) Pre-training on LHRS-Align for vision-language alignment, (2) Multi-task pre-training on instruction datasets, (3) Supervised fine-tuning on complex instruction data.",
        "confidence": 0.7993
    },
    "domain_knowledge": {
        "value": [
            {
                "value": "Volunteered Geographic Information (VGI)",
                "confidence": 0.8113
            },
            {
                "value": "OpenStreetMap (OSM) semantic tags",
                "confidence": 0.4736
            },
            {
                "value": "Remote sensing image semantics",
                "confidence": 0.5444
            }
        ]
    },
    "backbone_modifications": {
        "value": [
            {
                "value": "Multi-level feature extraction from vision encoder",
                "confidence": 0.7886
            },
            {
                "value": "Vision perceiver with learnable queries and cross-attention",
                "confidence": 0.614
            },
            {
                "value": "Descending query allocation strategy",
                "confidence": 0.6576
            }
        ]
    },
    "supported_sensors": {
        "value": [
            {
                "value": "Google Earth imagery",
                "confidence": 0.9088
            }
        ]
    },
    "modality_integration_type": {
        "value": "Homogeneous Multimodal",
        "confidence": 0.8242
    },
    "modalities": {
        "value": [
            {
                "value": "Multispectral",
                "confidence": 0.9788
            },
            {
                "value": "Panchromatic",
                "confidence": 0.8724
            }
        ]
    },
    "spectral_alignment": {
        "value": "none",
        "confidence": 0.6929
    },
    "temporal_alignment": {
        "value": "none",
        "confidence": 1.0
    },
    "spatial_resolution": {
        "value": "1m (LHRS-Align); varies for benchmarks",
        "confidence": 0.6106
    },
    "temporal_resolution": {
        "value": null,
        "confidence": 0.0
    },
    "bands": {
        "value": null,
        "confidence": 0.0
    },
    "pretraining_phases": [
        {
            "dataset": {
                "value": "LHRS-Align",
                "confidence": 1.0
            },
            "regions_coverage": {
                "value": [
                    {
                        "value": "9259 cities across 129 countries",
                        "confidence": 0.4742
                    }
                ]
            },
            "time_range": {
                "value": null,
                "confidence": 0.0
            },
            "num_images": {
                "value": 1150000,
                "confidence": 0.9579
            },
            "token_size": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": "up to 768x768 (resized if larger)",
                "confidence": 0.3495
            },
            "epochs": {
                "value": 1,
                "confidence": 1.0
            },
            "batch_size": {
                "value": 8,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0002,
                "confidence": 0.994
            },
            "augmentations": {
                "value": []
            },
            "processing": {
                "value": [
                    {
                        "value": "Deduplication",
                        "confidence": 0.881
                    },
                    {
                        "value": "Cloud and ocean filtering",
                        "confidence": 0.3483
                    },
                    {
                        "value": "Semantic balancing",
                        "confidence": 0.5347
                    },
                    {
                        "value": "Manual and automatic OSM key filtering",
                        "confidence": 0.3344
                    }
                ]
            },
            "sampling": {
                "value": "Semantic balancing and independent sampling for key-value pairs",
                "confidence": 0.3025
            },
            "processing_level": {
                "value": null,
                "confidence": 0.0
            },
            "cloud_cover": {
                "value": "Images with clouds removed using a trained classification network",
                "confidence": 0.3036
            },
            "missing_data": {
                "value": null,
                "confidence": 0.0
            },
            "masking_ratio": {
                "value": null,
                "confidence": 0.0
            }
        }
    ],
    "benchmarks": [
        {
            "task": {
                "value": "Classification",
                "confidence": 0.7306
            },
            "application": {
                "value": "Remote sensing scene classification",
                "confidence": 0.6281
            },
            "dataset": {
                "value": "AID",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "Accuracy",
                        "confidence": 0.933
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 91.26,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Google Earth imagery",
                        "confidence": 0.821
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": 30,
                "confidence": 1.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": "600x600",
                "confidence": 0.9996
            },
            "spatial_resolution": {
                "value": "0.5-8m",
                "confidence": 0.6722
            },
            "bands_used": {
                "value": null,
                "confidence": 0.0
            },
            "augmentations": {
                "value": []
            },
            "optimizer": {
                "value": "Adan",
                "confidence": 0.6495
            },
            "batch_size": {
                "value": 8,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0002,
                "confidence": 1.0
            },
            "epochs": {
                "value": 1,
                "confidence": 1.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Classification",
                "confidence": 1.0
            },
            "application": {
                "value": "Remote sensing scene classification",
                "confidence": 0.962
            },
            "dataset": {
                "value": "WHU-RS19",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "Accuracy",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 93.17,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Google Earth imagery",
                        "confidence": 0.9998
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": 19,
                "confidence": 1.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": "600x600",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "0.5m",
                "confidence": 0.9837
            },
            "bands_used": {
                "value": null,
                "confidence": 0.0
            },
            "augmentations": {
                "value": []
            },
            "optimizer": {
                "value": "Adan",
                "confidence": 1.0
            },
            "batch_size": {
                "value": 8,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0002,
                "confidence": 1.0
            },
            "epochs": {
                "value": 1,
                "confidence": 1.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Classification",
                "confidence": 1.0
            },
            "application": {
                "value": "Remote sensing scene classification",
                "confidence": 0.9937
            },
            "dataset": {
                "value": "NWPU",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "Accuracy",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 83.94,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Google Earth imagery",
                        "confidence": 0.9984
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": 45,
                "confidence": 1.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": "256x256",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "0.2-30m",
                "confidence": 0.99
            },
            "bands_used": {
                "value": null,
                "confidence": 0.0
            },
            "augmentations": {
                "value": []
            },
            "optimizer": {
                "value": "Adan",
                "confidence": 1.0
            },
            "batch_size": {
                "value": 8,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0002,
                "confidence": 1.0
            },
            "epochs": {
                "value": 1,
                "confidence": 1.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Classification",
                "confidence": 1.0
            },
            "application": {
                "value": "Remote sensing scene classification",
                "confidence": 0.9856
            },
            "dataset": {
                "value": "SIRI-WHU",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "Accuracy",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 62.66,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Google Earth imagery",
                        "confidence": 0.9965
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": 12,
                "confidence": 1.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": "200x200",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "2m",
                "confidence": 1.0
            },
            "bands_used": {
                "value": null,
                "confidence": 0.0
            },
            "augmentations": {
                "value": []
            },
            "optimizer": {
                "value": "Adan",
                "confidence": 1.0
            },
            "batch_size": {
                "value": 8,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0002,
                "confidence": 1.0
            },
            "epochs": {
                "value": 1,
                "confidence": 1.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Classification",
                "confidence": 1.0
            },
            "application": {
                "value": "Land use/land cover classification",
                "confidence": 0.4857
            },
            "dataset": {
                "value": "EuroSAT",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "Accuracy",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 51.4,
                        "confidence": 0.9166
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Sentinel-2",
                        "confidence": 0.6636
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": 10,
                "confidence": 1.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": "64x64",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "10m",
                "confidence": 1.0
            },
            "bands_used": {
                "value": null,
                "confidence": 0.0
            },
            "augmentations": {
                "value": []
            },
            "optimizer": {
                "value": "Adan",
                "confidence": 0.9997
            },
            "batch_size": {
                "value": 8,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0002,
                "confidence": 1.0
            },
            "epochs": {
                "value": 1,
                "confidence": 1.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Classification",
                "confidence": 1.0
            },
            "application": {
                "value": "Methane source mapping",
                "confidence": 0.7346
            },
            "dataset": {
                "value": "METER-ML",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "Accuracy",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 69.81,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Multi-sensor",
                        "confidence": 0.4861
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": 6,
                "confidence": 1.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": "720x720",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "1m",
                "confidence": 1.0
            },
            "bands_used": {
                "value": null,
                "confidence": 0.0
            },
            "augmentations": {
                "value": []
            },
            "optimizer": {
                "value": "Adan",
                "confidence": 1.0
            },
            "batch_size": {
                "value": 8,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0002,
                "confidence": 1.0
            },
            "epochs": {
                "value": 1,
                "confidence": 1.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Classification",
                "confidence": 1.0
            },
            "application": {
                "value": "Fine-grained RS classification",
                "confidence": 0.3997
            },
            "dataset": {
                "value": "fMoW",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "Accuracy",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 56.56,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Google Earth imagery",
                        "confidence": 0.6557
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": 63,
                "confidence": 1.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": "varies",
                "confidence": 0.5406
            },
            "spatial_resolution": {
                "value": "0.31-1.6m",
                "confidence": 0.9613
            },
            "bands_used": {
                "value": null,
                "confidence": 0.0
            },
            "augmentations": {
                "value": []
            },
            "optimizer": {
                "value": "Adan",
                "confidence": 1.0
            },
            "batch_size": {
                "value": 8,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0002,
                "confidence": 1.0
            },
            "epochs": {
                "value": 1,
                "confidence": 1.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Visual Question Answering",
                "confidence": 0.7965
            },
            "application": {
                "value": "RS VQA",
                "confidence": 0.5521
            },
            "dataset": {
                "value": "RSVQA-LR",
                "confidence": 0.9997
            },
            "metrics": {
                "value": [
                    {
                        "value": "Accuracy",
                        "confidence": 0.987
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 89.19,
                        "confidence": 0.9947
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Google Earth imagery",
                        "confidence": 0.8899
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": "256x256",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "10m",
                "confidence": 1.0
            },
            "bands_used": {
                "value": null,
                "confidence": 0.0
            },
            "augmentations": {
                "value": []
            },
            "optimizer": {
                "value": null,
                "confidence": 0.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": null,
                "confidence": 0.0
            },
            "epochs": {
                "value": null,
                "confidence": 0.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Visual Question Answering",
                "confidence": 1.0
            },
            "application": {
                "value": "RS VQA",
                "confidence": 0.9971
            },
            "dataset": {
                "value": "RSVQA-HR",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "Accuracy",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 92.55,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Google Earth imagery",
                        "confidence": 1.0
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": "512x512",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "0.15m",
                "confidence": 1.0
            },
            "bands_used": {
                "value": null,
                "confidence": 0.0
            },
            "augmentations": {
                "value": []
            },
            "optimizer": {
                "value": null,
                "confidence": 0.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": null,
                "confidence": 0.0
            },
            "epochs": {
                "value": null,
                "confidence": 0.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Visual Grounding",
                "confidence": 0.9999
            },
            "application": {
                "value": "Object localization in RS images",
                "confidence": 0.3977
            },
            "dataset": {
                "value": "RSVG",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "Accuracy (IoU>0.5)",
                        "confidence": 0.7576
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 73.45,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Google Earth imagery",
                        "confidence": 0.9453
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": "1024x1024",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "bands_used": {
                "value": null,
                "confidence": 0.0
            },
            "augmentations": {
                "value": []
            },
            "optimizer": {
                "value": null,
                "confidence": 0.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": null,
                "confidence": 0.0
            },
            "epochs": {
                "value": null,
                "confidence": 0.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Visual Grounding",
                "confidence": 1.0
            },
            "application": {
                "value": "Object localization in RS images",
                "confidence": 0.9953
            },
            "dataset": {
                "value": "DIOR-RSVG",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "Accuracy (IoU>0.5)",
                        "confidence": 0.9999
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 88.1,
                        "confidence": 0.9469
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Google Earth imagery",
                        "confidence": 0.9792
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": 20,
                "confidence": 1.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": "800x800",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "0.5-30m",
                "confidence": 0.9943
            },
            "bands_used": {
                "value": null,
                "confidence": 0.0
            },
            "augmentations": {
                "value": []
            },
            "optimizer": {
                "value": null,
                "confidence": 0.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": null,
                "confidence": 0.0
            },
            "epochs": {
                "value": null,
                "confidence": 0.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Comprehensive RS image understanding",
                "confidence": 0.371
            },
            "application": {
                "value": "RS MLLM evaluation",
                "confidence": 0.3334
            },
            "dataset": {
                "value": "LHRS-Bench",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "Accuracy",
                        "confidence": 0.9809
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 39.38,
                        "confidence": 0.9967
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Google Earth imagery",
                        "confidence": 0.9999
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": 108,
                "confidence": 0.8848
            },
            "num_samples": {
                "value": 690,
                "confidence": 0.9998
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": [
                    {
                        "value": "Recognition",
                        "confidence": 0.4993
                    },
                    {
                        "value": "Color",
                        "confidence": 0.6804
                    },
                    {
                        "value": "Orientation",
                        "confidence": 1.0
                    },
                    {
                        "value": "Shape",
                        "confidence": 1.0
                    },
                    {
                        "value": "Area",
                        "confidence": 1.0
                    },
                    {
                        "value": "Resolution",
                        "confidence": 0.7334
                    },
                    {
                        "value": "Modality",
                        "confidence": 1.0
                    },
                    {
                        "value": "Location",
                        "confidence": 0.9739
                    },
                    {
                        "value": "Distance",
                        "confidence": 1.0
                    },
                    {
                        "value": "Quantity",
                        "confidence": 1.0
                    },
                    {
                        "value": "Reasoning",
                        "confidence": 1.0
                    }
                ]
            },
            "image_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "spatial_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "bands_used": {
                "value": null,
                "confidence": 0.0
            },
            "augmentations": {
                "value": []
            },
            "optimizer": {
                "value": null,
                "confidence": 0.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": null,
                "confidence": 0.0
            },
            "epochs": {
                "value": null,
                "confidence": 0.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        }
    ]
}