{
    "model_id": {
        "value": "RSGPT",
        "confidence": 0.915
    },
    "model_name": {
        "value": "RSGPT",
        "confidence": 1.0
    },
    "version": {
        "value": null,
        "confidence": 0.0
    },
    "release_date": {
        "value": null,
        "confidence": 0.0
    },
    "last_updated": {
        "value": null,
        "confidence": 0.0
    },
    "short_description": {
        "value": "RSGPT is a remote sensing vision-language model based on finetuning InstructBLIP on a high-quality, human-annotated remote sensing image captioning dataset (RSICap). It aligns visual features of remote sensing images with large language models for tasks such as image captioning and visual question answering, outperforming previous state-of-the-art methods.",
        "confidence": 0.8192
    },
    "paper_link": {
        "value": "https://arxiv.org/abs/2307.15266",
        "confidence": 0.9998
    },
    "citations": {
        "value": null,
        "confidence": 0.0
    },
    "repository": {
        "value": "https://github.com/Lavender105/RSGPT",
        "confidence": 1.0
    },
    "weights": {
        "value": null,
        "confidence": 0.0
    },
    "backbone": {
        "value": "InstructBLIP (frozen image encoder and LLM, Q-Former and linear layer finetuned)",
        "confidence": 0.7671
    },
    "num_layers": {
        "value": null,
        "confidence": 0.0
    },
    "num_parameters": {
        "value": null,
        "confidence": 0.0
    },
    "pretext_training_type": {
        "value": "Instruction-tuned vision-language alignment (finetuning Q-Former and linear layer with instruction prompts)",
        "confidence": 0.6634
    },
    "masking_strategy": {
        "value": null,
        "confidence": 0.0
    },
    "pretraining": {
        "value": "Finetuning InstructBLIP on RSICap (2,585 human-annotated image-caption pairs) for remote sensing domain adaptation. Only Q-Former and linear layer are trained; image encoder and LLM are frozen.",
        "confidence": 0.7363
    },
    "domain_knowledge": {
        "value": [
            {
                "value": "Remote sensing image semantics",
                "confidence": 0.4516
            },
            {
                "value": "Object attributes (color, shape, position, quantity)",
                "confidence": 0.4666
            },
            {
                "value": "Scene and object relationship reasoning",
                "confidence": 0.4925
            }
        ]
    },
    "backbone_modifications": {
        "value": [
            {
                "value": "Finetune only Q-Former and linear layer; freeze image encoder and LLM",
                "confidence": 0.6212
            }
        ]
    },
    "supported_sensors": {
        "value": [
            {
                "value": "GF-2",
                "confidence": 0.9995
            },
            {
                "value": "JL-1",
                "confidence": 0.9998
            },
            {
                "value": "Google Earth",
                "confidence": 1.0
            },
            {
                "value": "Aerial images",
                "confidence": 0.4869
            }
        ]
    },
    "modality_integration_type": {
        "value": "Homogeneous Multimodal",
        "confidence": 0.9391
    },
    "modalities": {
        "value": [
            {
                "value": "Multispectral",
                "confidence": 0.989
            },
            {
                "value": "Panchromatic",
                "confidence": 0.9048
            },
            {
                "value": "Aerial RGB",
                "confidence": 0.4581
            }
        ]
    },
    "spectral_alignment": {
        "value": "none",
        "confidence": 0.5499
    },
    "temporal_alignment": {
        "value": "none",
        "confidence": 1.0
    },
    "spatial_resolution": {
        "value": "variable (from 800x800 to 4000x4000, patches of 512x512)",
        "confidence": 0.7414
    },
    "temporal_resolution": {
        "value": null,
        "confidence": 0.0
    },
    "bands": {
        "value": null,
        "confidence": 0.0
    },
    "pretraining_phases": [
        {
            "dataset": {
                "value": "RSICap (based on DOTA-v1.5)",
                "confidence": 0.4559
            },
            "regions_coverage": {
                "value": null,
                "confidence": 0.0
            },
            "time_range": {
                "value": null,
                "confidence": 0.0
            },
            "num_images": {
                "value": 2585,
                "confidence": 1.0
            },
            "token_size": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": "512x512 patches (from original images 800x800 to 4000x4000)",
                "confidence": 0.307
            },
            "epochs": {
                "value": 5,
                "confidence": 1.0
            },
            "batch_size": {
                "value": 64,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": "3e-5",
                "confidence": 0.9995
            },
            "augmentations": {
                "value": null,
                "confidence": 0.0
            },
            "processing": {
                "value": [
                    {
                        "value": "Patch extraction",
                        "confidence": 0.4967
                    },
                    {
                        "value": "Manual annotation",
                        "confidence": 0.4726
                    }
                ]
            },
            "sampling": {
                "value": "Random selection of 2585 patches from DOTA-v1.5",
                "confidence": 0.3726
            },
            "processing_level": {
                "value": null,
                "confidence": 0.0
            },
            "cloud_cover": {
                "value": null,
                "confidence": 0.0
            },
            "missing_data": {
                "value": null,
                "confidence": 0.0
            },
            "masking_ratio": {
                "value": null,
                "confidence": 0.0
            }
        }
    ],
    "benchmarks": [
        {
            "task": {
                "value": "Image Captioning",
                "confidence": 0.7877
            },
            "application": {
                "value": "Remote sensing image captioning",
                "confidence": 0.4975
            },
            "dataset": {
                "value": "RSIEval",
                "confidence": 0.7668
            },
            "metrics": {
                "value": [
                    {
                        "value": "Manual scoring (detail, position, hallucination)",
                        "confidence": 0.3306
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "GF-2",
                        "confidence": 0.9962
                    },
                    {
                        "value": "JL-1",
                        "confidence": 1.0
                    },
                    {
                        "value": "Google Earth",
                        "confidence": 1.0
                    },
                    {
                        "value": "aerial images",
                        "confidence": 0.8539
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": 100,
                "confidence": 0.9989
            },
            "num_samples": {
                "value": 100,
                "confidence": 1.0
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": "512x512",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "variable",
                "confidence": 0.8652
            },
            "bands_used": {
                "value": null,
                "confidence": 0.0
            },
            "augmentations": {
                "value": null,
                "confidence": 0.0
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 0.9469
            },
            "batch_size": {
                "value": 64,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 3e-05,
                "confidence": 0.9983
            },
            "epochs": {
                "value": 5,
                "confidence": 1.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Visual Question Answering",
                "confidence": 0.9984
            },
            "application": {
                "value": "Remote sensing visual question answering",
                "confidence": 0.6085
            },
            "dataset": {
                "value": "RSIEval",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "Accuracy (per question type and average)",
                        "confidence": 0.3251
                    },
                    {
                        "value": "Quantity relative error",
                        "confidence": 0.6956
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 65.24,
                        "confidence": 0.8274
                    },
                    {
                        "value": 0.4828,
                        "confidence": 0.9999
                    }
                ]
            },
            "sensor": {
                "value": [
                    {
                        "value": "GF-2",
                        "confidence": 1.0
                    },
                    {
                        "value": "JL-1",
                        "confidence": 1.0
                    },
                    {
                        "value": "Google Earth",
                        "confidence": 1.0
                    },
                    {
                        "value": "aerial images",
                        "confidence": 0.9998
                    }
                ]
            },
            "regions": {
                "value": [
                    {
                        "value": null,
                        "confidence": 0.3
                    }
                ]
            },
            "original_samples": {
                "value": 936,
                "confidence": 1.0
            },
            "num_samples": {
                "value": 936,
                "confidence": 1.0
            },
            "sampling_percentage": {
                "value": 100,
                "confidence": 1.0
            },
            "num_classes": {
                "value": 10,
                "confidence": 1.0
            },
            "classes": {
                "value": [
                    {
                        "value": "presence",
                        "confidence": 0.8963
                    },
                    {
                        "value": "quantity",
                        "confidence": 1.0
                    },
                    {
                        "value": "color",
                        "confidence": 1.0
                    },
                    {
                        "value": "absolute position",
                        "confidence": 0.9831
                    },
                    {
                        "value": "relative position",
                        "confidence": 1.0
                    },
                    {
                        "value": "area comparison",
                        "confidence": 1.0
                    },
                    {
                        "value": "road direction",
                        "confidence": 1.0
                    },
                    {
                        "value": "image",
                        "confidence": 1.0
                    },
                    {
                        "value": "scene",
                        "confidence": 1.0
                    },
                    {
                        "value": "reasoning",
                        "confidence": 1.0
                    }
                ]
            },
            "image_resolution": {
                "value": "512x512",
                "confidence": 1.0
            },
            "spatial_resolution": {
                "value": "variable",
                "confidence": 1.0
            },
            "bands_used": {
                "value": null,
                "confidence": 0.0
            },
            "augmentations": {
                "value": null,
                "confidence": 0.0
            },
            "optimizer": {
                "value": "AdamW",
                "confidence": 0.998
            },
            "batch_size": {
                "value": 64,
                "confidence": 1.0
            },
            "learning_rate": {
                "value": 3e-05,
                "confidence": 1.0
            },
            "epochs": {
                "value": 5,
                "confidence": 1.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Image Captioning",
                "confidence": 0.9964
            },
            "application": {
                "value": "Remote sensing image captioning",
                "confidence": 0.9265
            },
            "dataset": {
                "value": "UCM-Captions",
                "confidence": 0.9791
            },
            "metrics": {
                "value": [
                    {
                        "value": "BLEU-1",
                        "confidence": 0.9998
                    },
                    {
                        "value": "BLEU-2",
                        "confidence": 1.0
                    },
                    {
                        "value": "BLEU-3",
                        "confidence": 1.0
                    },
                    {
                        "value": "BLEU-4",
                        "confidence": 1.0
                    },
                    {
                        "value": "METEOR",
                        "confidence": 1.0
                    },
                    {
                        "value": "ROUGE L",
                        "confidence": 0.9802
                    },
                    {
                        "value": "CIDEr",
                        "confidence": 0.9999
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 86.12,
                        "confidence": 1.0
                    },
                    {
                        "value": 79.14,
                        "confidence": 1.0
                    },
                    {
                        "value": 72.31,
                        "confidence": 1.0
                    },
                    {
                        "value": 65.74,
                        "confidence": 1.0
                    },
                    {
                        "value": 42.21,
                        "confidence": 1.0
                    },
                    {
                        "value": 78.34,
                        "confidence": 1.0
                    },
                    {
                        "value": 333.23,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": null,
                "confidence": 0.0
            },
            "regions": {
                "value": null,
                "confidence": 0.0
            },
            "original_samples": {
                "value": 2100,
                "confidence": 0.9992
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "spatial_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "bands_used": {
                "value": null,
                "confidence": 0.0
            },
            "augmentations": {
                "value": null,
                "confidence": 0.0
            },
            "optimizer": {
                "value": null,
                "confidence": 0.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": null,
                "confidence": 0.0
            },
            "epochs": {
                "value": 5,
                "confidence": 1.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Image Captioning",
                "confidence": 1.0
            },
            "application": {
                "value": "Remote sensing image captioning",
                "confidence": 1.0
            },
            "dataset": {
                "value": "Sydney-Captions",
                "confidence": 0.9997
            },
            "metrics": {
                "value": [
                    {
                        "value": "BLEU-1",
                        "confidence": 1.0
                    },
                    {
                        "value": "BLEU-2",
                        "confidence": 1.0
                    },
                    {
                        "value": "BLEU-3",
                        "confidence": 1.0
                    },
                    {
                        "value": "BLEU-4",
                        "confidence": 1.0
                    },
                    {
                        "value": "METEOR",
                        "confidence": 1.0
                    },
                    {
                        "value": "ROUGE L",
                        "confidence": 1.0
                    },
                    {
                        "value": "CIDEr",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 82.26,
                        "confidence": 1.0
                    },
                    {
                        "value": 75.28,
                        "confidence": 1.0
                    },
                    {
                        "value": 68.57,
                        "confidence": 1.0
                    },
                    {
                        "value": 62.23,
                        "confidence": 1.0
                    },
                    {
                        "value": 41.37,
                        "confidence": 1.0
                    },
                    {
                        "value": 74.77,
                        "confidence": 1.0
                    },
                    {
                        "value": 273.08,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": null,
                "confidence": 0.0
            },
            "regions": {
                "value": null,
                "confidence": 0.0
            },
            "original_samples": {
                "value": 613,
                "confidence": 1.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "spatial_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "bands_used": {
                "value": null,
                "confidence": 0.0
            },
            "augmentations": {
                "value": null,
                "confidence": 0.0
            },
            "optimizer": {
                "value": null,
                "confidence": 0.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": null,
                "confidence": 0.0
            },
            "epochs": {
                "value": 5,
                "confidence": 1.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Image Captioning",
                "confidence": 1.0
            },
            "application": {
                "value": "Remote sensing image captioning",
                "confidence": 1.0
            },
            "dataset": {
                "value": "RSICD",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "BLEU-1",
                        "confidence": 1.0
                    },
                    {
                        "value": "BLEU-2",
                        "confidence": 1.0
                    },
                    {
                        "value": "BLEU-3",
                        "confidence": 1.0
                    },
                    {
                        "value": "BLEU-4",
                        "confidence": 1.0
                    },
                    {
                        "value": "METEOR",
                        "confidence": 1.0
                    },
                    {
                        "value": "ROUGE L",
                        "confidence": 1.0
                    },
                    {
                        "value": "CIDEr",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 70.32,
                        "confidence": 1.0
                    },
                    {
                        "value": 54.23,
                        "confidence": 1.0
                    },
                    {
                        "value": 44.02,
                        "confidence": 1.0
                    },
                    {
                        "value": 36.83,
                        "confidence": 1.0
                    },
                    {
                        "value": 30.1,
                        "confidence": 0.9668
                    },
                    {
                        "value": 53.34,
                        "confidence": 1.0
                    },
                    {
                        "value": 102.94,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": null,
                "confidence": 0.0
            },
            "regions": {
                "value": null,
                "confidence": 0.0
            },
            "original_samples": {
                "value": 10921,
                "confidence": 1.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": null,
                "confidence": 0.0
            },
            "image_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "spatial_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "bands_used": {
                "value": null,
                "confidence": 0.0
            },
            "augmentations": {
                "value": null,
                "confidence": 0.0
            },
            "optimizer": {
                "value": null,
                "confidence": 0.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": null,
                "confidence": 0.0
            },
            "epochs": {
                "value": 15,
                "confidence": 1.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Visual Question Answering",
                "confidence": 0.9983
            },
            "application": {
                "value": "Remote sensing visual question answering",
                "confidence": 0.6454
            },
            "dataset": {
                "value": "RSVQA-HR (test set 1)",
                "confidence": 0.4131
            },
            "metrics": {
                "value": [
                    {
                        "value": "Presence accuracy",
                        "confidence": 0.6663
                    },
                    {
                        "value": "Comparison accuracy",
                        "confidence": 1.0
                    },
                    {
                        "value": "Average accuracy",
                        "confidence": 0.9899
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 91.86,
                        "confidence": 1.0
                    },
                    {
                        "value": 92.15,
                        "confidence": 1.0
                    },
                    {
                        "value": 92.0,
                        "confidence": 0.9447
                    }
                ]
            },
            "sensor": {
                "value": null,
                "confidence": 0.0
            },
            "regions": {
                "value": null,
                "confidence": 0.0
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": [
                    {
                        "value": "presence",
                        "confidence": 0.7389
                    },
                    {
                        "value": "comparison",
                        "confidence": 1.0
                    }
                ]
            },
            "image_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "spatial_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "bands_used": {
                "value": null,
                "confidence": 0.0
            },
            "augmentations": {
                "value": null,
                "confidence": 0.0
            },
            "optimizer": {
                "value": null,
                "confidence": 0.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": null,
                "confidence": 0.0
            },
            "epochs": {
                "value": 5,
                "confidence": 1.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Visual Question Answering",
                "confidence": 1.0
            },
            "application": {
                "value": "Remote sensing visual question answering",
                "confidence": 1.0
            },
            "dataset": {
                "value": "RSVQA-HR (test set 2)",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "Presence accuracy",
                        "confidence": 1.0
                    },
                    {
                        "value": "Comparison accuracy",
                        "confidence": 1.0
                    },
                    {
                        "value": "Average accuracy",
                        "confidence": 1.0
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 89.87,
                        "confidence": 1.0
                    },
                    {
                        "value": 89.68,
                        "confidence": 1.0
                    },
                    {
                        "value": 89.78,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": null,
                "confidence": 0.0
            },
            "regions": {
                "value": null,
                "confidence": 0.0
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": [
                    {
                        "value": "presence",
                        "confidence": 1.0
                    },
                    {
                        "value": "comparison",
                        "confidence": 1.0
                    }
                ]
            },
            "image_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "spatial_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "bands_used": {
                "value": null,
                "confidence": 0.0
            },
            "augmentations": {
                "value": null,
                "confidence": 0.0
            },
            "optimizer": {
                "value": null,
                "confidence": 0.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": null,
                "confidence": 0.0
            },
            "epochs": {
                "value": 5,
                "confidence": 1.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        },
        {
            "task": {
                "value": "Visual Question Answering",
                "confidence": 1.0
            },
            "application": {
                "value": "Remote sensing visual question answering",
                "confidence": 0.9999
            },
            "dataset": {
                "value": "RSVQA-LR",
                "confidence": 1.0
            },
            "metrics": {
                "value": [
                    {
                        "value": "Presence accuracy",
                        "confidence": 0.9922
                    },
                    {
                        "value": "Comparison accuracy",
                        "confidence": 1.0
                    },
                    {
                        "value": "Rural/Urban accuracy",
                        "confidence": 0.9818
                    },
                    {
                        "value": "Average accuracy",
                        "confidence": 0.9993
                    }
                ]
            },
            "metrics_value": {
                "value": [
                    {
                        "value": 91.17,
                        "confidence": 1.0
                    },
                    {
                        "value": 91.7,
                        "confidence": 0.9963
                    },
                    {
                        "value": 94.0,
                        "confidence": 0.9961
                    },
                    {
                        "value": 92.29,
                        "confidence": 1.0
                    }
                ]
            },
            "sensor": {
                "value": null,
                "confidence": 0.0
            },
            "regions": {
                "value": null,
                "confidence": 0.0
            },
            "original_samples": {
                "value": null,
                "confidence": 0.0
            },
            "num_samples": {
                "value": null,
                "confidence": 0.0
            },
            "sampling_percentage": {
                "value": null,
                "confidence": 0.0
            },
            "num_classes": {
                "value": null,
                "confidence": 0.0
            },
            "classes": {
                "value": [
                    {
                        "value": "presence",
                        "confidence": 1.0
                    },
                    {
                        "value": "comparison",
                        "confidence": 1.0
                    },
                    {
                        "value": "rural/urban",
                        "confidence": 0.9999
                    }
                ]
            },
            "image_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "spatial_resolution": {
                "value": null,
                "confidence": 0.0
            },
            "bands_used": {
                "value": null,
                "confidence": 0.0
            },
            "augmentations": {
                "value": null,
                "confidence": 0.0
            },
            "optimizer": {
                "value": null,
                "confidence": 0.0
            },
            "batch_size": {
                "value": null,
                "confidence": 0.0
            },
            "learning_rate": {
                "value": null,
                "confidence": 0.0
            },
            "epochs": {
                "value": 5,
                "confidence": 1.0
            },
            "loss_function": {
                "value": null,
                "confidence": 0.0
            },
            "split_ratio": {
                "value": null,
                "confidence": 0.0
            }
        }
    ]
}