{
    "model_id": {
        "value": "RS5M",
        "confidence": 0.868
    },
    "model_name": {
        "value": "RS5M",
        "confidence": 0.9997
    },
    "version": {
        "value": "v1",
        "confidence": 0.7982
    },
    "release_date": {
        "value": null,
        "confidence": 0.0
    },
    "last_updated": {
        "value": null,
        "confidence": 0.0
    },
    "short_description": {
        "value": "RS5M is a large-scale remote sensing vision-language dataset containing 5 million remote sensing images paired with English descriptions, constructed by filtering public image-text datasets and captioning label-only RS datasets with pre-trained VLMs. It is designed to enable domain-specific transfer of general vision-language models to remote sensing tasks.",
        "confidence": 0.784
    },
    "paper_link": {
        "value": "https://arxiv.org/abs/2306.11300",
        "confidence": 0.9999
    },
    "citations": {
        "value": null,
        "confidence": 0.0
    },
    "repository": {
        "value": "https://github.com/om-ai-lab/RS5M",
        "confidence": 1.0
    },
    "weights": {
        "value": null,
        "confidence": 0.0
    },
    "backbone": {
        "value": "CLIP ViT-B32",
        "confidence": 0.7359
    },
    "num_layers": {
        "value": null,
        "confidence": 0.0
    },
    "num_parameters": {
        "value": 152,
        "confidence": 0.7441
    },
    "pretext_training_type": {
        "value": "Contrastive learning (InfoNCE loss), optionally with image-text matching and self-supervised loss",
        "confidence": 0.7632
    },
    "masking_strategy": {
        "value": null,
        "confidence": 0.0
    },
    "pretraining": {
        "value": "RS5M is constructed by filtering 11 public image-text datasets (PUB11) using RS-related keywords and deduplication, and by generating captions for 3 large-scale RS datasets (RS3: BigEarthNet, FMoW, MillionAID) using BLIP2. Extensive denoising and quality assurance methods are applied, including rotation-invariant caption selection and meta-information integration.",
        "confidence": 0.7408
    },
    "domain_knowledge": {
        "value": [
            {
                "value": "Remote sensing-specific keyword filtering",
                "confidence": 0.464
            },
            {
                "value": "Rotation-invariant caption selection",
                "confidence": 0.8224
            },
            {
                "value": "Integration of geospatial meta-information into captions",
                "confidence": 0.5501
            }
        ]
    },
    "backbone_modifications": {
        "value": [
            {
                "value": "Adapters (Pfeiffer, LoRA, Prefix-tuning, UniPELT) inserted into CLIP encoders",
                "confidence": 0.6467
            }
        ]
    },
    "supported_sensors": {
        "value": [
            {
                "value": "Sentinel-1",
                "confidence": 0.9729
            },
            {
                "value": "Sentinel-2",
                "confidence": 1.0
            },
            {
                "value": "Gaofen",
                "confidence": 0.3641
            },
            {
                "value": "USGS",
                "confidence": 0.6858
            },
            {
                "value": "NAIP",
                "confidence": 0.8948
            },
            {
                "value": "MODIS",
                "confidence": 0.9
            },
            {
                "value": "EOSDIS",
                "confidence": 0.5749
            },
            {
                "value": "WorldView",
                "confidence": 0.8923
            },
            {
                "value": "Planet Dove",
                "confidence": 0.8999
            },
            {
                "value": "Maxar",
                "confidence": 0.8481
            },
            {
                "value": "Landsat",
                "confidence": 0.9
            }
        ]
    },
    "modality_integration_type": {
        "value": "Homogeneous Multimodal",
        "confidence": 0.8518
    },
    "modalities": {
        "value": [
            {
                "value": "Multispectral",
                "confidence": 0.9465
            },
            {
                "value": "RGB",
                "confidence": 0.9763
            },
            {
                "value": "Text",
                "confidence": 0.9909
            }
        ]
    },
    "spectral_alignment": {
        "value": "none",
        "confidence": 0.7436
    },
    "temporal_alignment": {
        "value": "none",
        "confidence": 0.7357
    },
    "spatial_resolution": {
        "value": "variable",
        "confidence": 0.8227
    },
    "temporal_resolution": {
        "value": "variable",
        "confidence": 0.9996
    },
    "bands": {
        "value": [
            {
                "value": "RGB",
                "confidence": 0.8667
            },
            {
                "value": "Multispectral (up to 12 bands for Sentinel-2, 2 bands for Sentinel-1, 4/8 bands for FMoW)",
                "confidence": 0.5735
            }
        ]
    },
    "pretraining_phases": [
        {
            "dataset": {
                "value": "RS5M (PUB11 + RS3)",
                "confidence": 0.6534
            },
            "regions_coverage": {
                "value": [
                    {
                        "value": "Global (with overrepresentation in North America, Europe, Asia, and underrepresentation in Africa, Australia, northern Canada/Russia, South America)",
                        "confidence": 0.3
                    }
                ]
            },
            "time_range": {
                "value": null,
                "confidence": 0.0
            },
            "num_images": {
                "value": 5000000,
                "confidence": 0.9769
            },
            "token_size": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": "variable (average ~400x520 px, BigEarthNet 120x120 px, others up to 800x800 px)",
                "confidence": 0.3
            },
            "epochs": {
                "value": 10,
                "confidence": 1.0
            },
            "batch_size": {
                "value": 500,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": "1e-4",
                "confidence": 0.9958
            },
            "augmentations": {
                "value": [
                    {
                        "value": "Image rotation (12 angles, 30 deg increments) for rotation-invariant caption selection",
                        "confidence": 0.3009
                    }
                ]
            },
            "processing": {
                "value": [
                    {
                        "value": "Keyword filtering",
                        "confidence": 0.4555
                    },
                    {
                        "value": "Deduplication",
                        "confidence": 0.5683
                    },
                    {
                        "value": "Invalid image removal",
                        "confidence": 0.4831
                    },
                    {
                        "value": "VLM and RS image detector filtering",
                        "confidence": 0.3829
                    },
                    {
                        "value": "Caption generation with BLIP2",
                        "confidence": 0.373
                    },
                    {
                        "value": "Meta-information integration",
                        "confidence": 0.4233
                    }
                ]
            },
            "sampling": {
                "value": "PUB11: top 90% VLM similarity, top 80% RS classifier; RS3: all available images from selected splits",
                "confidence": 0.3
            },
            "processing_level": {
                "value": null,
                "confidence": 0.0
            },
            "cloud_cover": {
                "value": null,
                "confidence": 0.0
            },
            "missing_data": {
                "value": null,
                "confidence": 0.0
            },
            "masking_ratio": {
                "value": null,
                "confidence": 0.0
            }
        }
    ],
    "benchmarks": [
        {
            "task": {
                "value": "Zero-shot classification",
                "confidence": 0.5744
            },
            "application": {
                "value": "Remote sensing scene classification",
                "confidence": 0.6764
            },
            "dataset": {
                "value": "AID",
                "confidence": 0.9332
            },
            "metrics": {
                "value": [
                    {
                        "value": "Top-1 Accuracy",
                        "confidence": 0.9841
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 70.92,
                        "confidence": 0.7408
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Google Earth",
                        "confidence": 0.8006
                    },
                    {
                        "value": "Aerial",
                        "confidence": 0.4979
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": "Global",
                        "confidence": 0.6083
                    }
                ]
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "spatial_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 0.8963
                    }
                ]
            },
            "augmentations": {
                "value": []
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": 500,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0001,
                "confidence": 0.9992
            },
            "epochs": {
                "value": 10,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Contrastive loss (InfoNCE)",
                "confidence": 0.6603
            },
            "split_ratio": {
                "value": "95% train, 5% val",
                "confidence": 0.4397
            }
        },
        {
            "task": {
                "value": "Zero-shot classification",
                "confidence": 1.0
            },
            "application": {
                "value": "Remote sensing scene classification",
                "confidence": 0.9977
            },
            "dataset": {
                "value": "RESISC45",
                "confidence": 0.9995
            },
            "metrics": {
                "value": [
                    {
                        "value": "Top-1 Accuracy",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 67.79,
                        "confidence": 0.9923
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Google Earth",
                        "confidence": 0.9144
                    },
                    {
                        "value": "Aerial",
                        "confidence": 0.9938
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": "Global",
                        "confidence": 0.9941
                    }
                ]
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "spatial_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": []
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": 500,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0001,
                "confidence": 1.0
            },
            "epochs": {
                "value": 10,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Contrastive loss (InfoNCE)",
                "confidence": 0.9932
            },
            "split_ratio": {
                "value": "95% train, 5% val",
                "confidence": 0.9971
            }
        },
        {
            "task": {
                "value": "Zero-shot classification",
                "confidence": 1.0
            },
            "application": {
                "value": "Remote sensing scene classification",
                "confidence": 0.9526
            },
            "dataset": {
                "value": "EuroSAT",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "Top-1 Accuracy",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 61.24,
                        "confidence": 0.9577
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Sentinel-2",
                        "confidence": 0.9995
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": "Europe",
                        "confidence": 0.9858
                    }
                ]
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "spatial_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 0.7995
                    }
                ]
            },
            "augmentations": {
                "value": []
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": 500,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0001,
                "confidence": 1.0
            },
            "epochs": {
                "value": 10,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Contrastive loss (InfoNCE)",
                "confidence": 0.9999
            },
            "split_ratio": {
                "value": "95% train, 5% val",
                "confidence": 0.9999
            }
        },
        {
            "task": {
                "value": "Vision-language retrieval",
                "confidence": 0.6087
            },
            "application": {
                "value": "Image-to-text retrieval",
                "confidence": 0.4646
            },
            "dataset": {
                "value": "RSICD",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "Recall@1",
                        "confidence": 0.7754
                    },
                    {
                        "value": "Recall@5",
                        "confidence": 1.0
                    },
                    {
                        "value": "Recall@10",
                        "confidence": 1.0
                    },
                    {
                        "value": "Mean Recall",
                        "confidence": 0.8866
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 9.61,
                        "confidence": 0.6934
                    },
                    {
                        "value": 22.05,
                        "confidence": 1.0
                    },
                    {
                        "value": 32.11,
                        "confidence": 1.0
                    },
                    {
                        "value": 20.99,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Google Earth",
                        "confidence": 0.9694
                    },
                    {
                        "value": "Baidu Map",
                        "confidence": 0.8766
                    },
                    {
                        "value": "MapABC",
                        "confidence": 0.9902
                    },
                    {
                        "value": "Tianditu",
                        "confidence": 0.9999
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": "Global",
                        "confidence": 0.9787
                    }
                ]
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "spatial_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 0.9999
                    }
                ]
            },
            "augmentations": {
                "value": []
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 0.9999
            },
            "batch_size": {
                "value": 500,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0001,
                "confidence": 1.0
            },
            "epochs": {
                "value": 10,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Contrastive loss (InfoNCE)",
                "confidence": 0.9986
            },
            "split_ratio": {
                "value": "95% train, 5% val",
                "confidence": 0.5028
            }
        },
        {
            "task": {
                "value": "Vision-language retrieval",
                "confidence": 1.0
            },
            "application": {
                "value": "Text-to-image retrieval",
                "confidence": 0.9626
            },
            "dataset": {
                "value": "RSICD",
                "confidence": 0.9997
            },
            "metrics": {
                "value": [
                    {
                        "value": "Recall@1",
                        "confidence": 1.0
                    },
                    {
                        "value": "Recall@5",
                        "confidence": 1.0
                    },
                    {
                        "value": "Recall@10",
                        "confidence": 1.0
                    },
                    {
                        "value": "Mean Recall",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 6.99,
                        "confidence": 1.0
                    },
                    {
                        "value": 22.09,
                        "confidence": 1.0
                    },
                    {
                        "value": 33.06,
                        "confidence": 1.0
                    },
                    {
                        "value": 20.99,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Google Earth",
                        "confidence": 1.0
                    },
                    {
                        "value": "Baidu Map",
                        "confidence": 1.0
                    },
                    {
                        "value": "MapABC",
                        "confidence": 1.0
                    },
                    {
                        "value": "Tianditu",
                        "confidence": 1.0
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": "Global",
                        "confidence": 1.0
                    }
                ]
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "spatial_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": []
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": 500,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0001,
                "confidence": 1.0
            },
            "epochs": {
                "value": 10,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Contrastive loss (InfoNCE)",
                "confidence": 1.0
            },
            "split_ratio": {
                "value": "95% train, 5% val",
                "confidence": 1.0
            }
        },
        {
            "task": {
                "value": "Vision-language retrieval",
                "confidence": 0.9971
            },
            "application": {
                "value": "Image-to-text retrieval",
                "confidence": 1.0
            },
            "dataset": {
                "value": "RSITMD",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "Recall@1",
                        "confidence": 1.0
                    },
                    {
                        "value": "Recall@5",
                        "confidence": 1.0
                    },
                    {
                        "value": "Recall@10",
                        "confidence": 1.0
                    },
                    {
                        "value": "Mean Recall",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 13.72,
                        "confidence": 1.0
                    },
                    {
                        "value": 30.97,
                        "confidence": 1.0
                    },
                    {
                        "value": 43.14,
                        "confidence": 1.0
                    },
                    {
                        "value": 29.06,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Satellite",
                        "confidence": 0.4318
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": "Global",
                        "confidence": 0.9875
                    }
                ]
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "spatial_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": []
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": 500,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0001,
                "confidence": 1.0
            },
            "epochs": {
                "value": 10,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Contrastive loss (InfoNCE)",
                "confidence": 1.0
            },
            "split_ratio": {
                "value": "95% train, 5% val",
                "confidence": 0.9978
            }
        },
        {
            "task": {
                "value": "Vision-language retrieval",
                "confidence": 0.9999
            },
            "application": {
                "value": "Text-to-image retrieval",
                "confidence": 1.0
            },
            "dataset": {
                "value": "RSITMD",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "Recall@1",
                        "confidence": 1.0
                    },
                    {
                        "value": "Recall@5",
                        "confidence": 1.0
                    },
                    {
                        "value": "Recall@10",
                        "confidence": 1.0
                    },
                    {
                        "value": "Mean Recall",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 9.25,
                        "confidence": 1.0
                    },
                    {
                        "value": 30.04,
                        "confidence": 1.0
                    },
                    {
                        "value": 47.26,
                        "confidence": 1.0
                    },
                    {
                        "value": 29.06,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Satellite",
                        "confidence": 1.0
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": "Global",
                        "confidence": 1.0
                    }
                ]
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "spatial_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 1.0
                    }
                ]
            },
            "augmentations": {
                "value": []
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": 500,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0001,
                "confidence": 1.0
            },
            "epochs": {
                "value": 10,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Contrastive loss (InfoNCE)",
                "confidence": 1.0
            },
            "split_ratio": {
                "value": "95% train, 5% val",
                "confidence": 1.0
            }
        },
        {
            "task": {
                "value": "Semantic localization",
                "confidence": 0.7754
            },
            "application": {
                "value": "Semantic localization (visual grounding)",
                "confidence": 0.3179
            },
            "dataset": {
                "value": "AIR-SLT",
                "confidence": 0.9999
            },
            "metrics": {
                "value": [
                    {
                        "value": "Rsu",
                        "confidence": 0.9978
                    },
                    {
                        "value": "Ras",
                        "confidence": 1.0
                    },
                    {
                        "value": "Rda",
                        "confidence": 1.0
                    },
                    {
                        "value": "Rmi",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 0.7292,
                        "confidence": 0.9994
                    },
                    {
                        "value": 0.3463,
                        "confidence": 1.0
                    },
                    {
                        "value": 0.6461,
                        "confidence": 1.0
                    },
                    {
                        "value": 0.682,
                        "confidence": 0.9579
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "Satellite",
                        "confidence": 0.9786
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": "Global",
                        "confidence": 0.9914
                    }
                ]
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "spatial_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "bands_used": {
                "value": [
                    {
                        "value": "RGB",
                        "confidence": 0.9998
                    }
                ]
            },
            "augmentations": {
                "value": []
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 1.0
            },
            "batch_size": {
                "value": 500,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 0.0001,
                "confidence": 1.0
            },
            "epochs": {
                "value": 10,
                "confidence": 1.0
            },
            "loss_function": {
                "value": "Contrastive loss (InfoNCE)",
                "confidence": 1.0
            },
            "split_ratio": {
                "value": "95% train, 5% val",
                "confidence": 0.9998
            }
        }
    ]
}