{"@context":{"@language":"en","@vocab":"https://schema.org/","arrayShape":"cr:arrayShape","citeAs":"cr:citeAs","column":"cr:column","conformsTo":"dct:conformsTo","cr":"http://mlcommons.org/croissant/","data":{"@id":"cr:data","@type":"@json"},"dataBiases":"cr:dataBiases","dataCollection":"cr:dataCollection","dataType":{"@id":"cr:dataType","@type":"@vocab"},"dct":"http://purl.org/dc/terms/","extract":"cr:extract","field":"cr:field","fileProperty":"cr:fileProperty","fileObject":"cr:fileObject","fileSet":"cr:fileSet","format":"cr:format","includes":"cr:includes","isArray":"cr:isArray","isLiveDataset":"cr:isLiveDataset","jsonPath":"cr:jsonPath","key":"cr:key","md5":"cr:md5","parentField":"cr:parentField","path":"cr:path","personalSensitiveInformation":"cr:personalSensitiveInformation","recordSet":"cr:recordSet","references":"cr:references","regex":"cr:regex","repeated":"cr:repeated","replace":"cr:replace","sc":"https://schema.org/","separator":"cr:separator","source":"cr:source","subField":"cr:subField","transform":"cr:transform"},"@type":"sc:Dataset","distribution":[{"@type":"cr:FileObject","@id":"repo","name":"repo","description":"The Hugging Face git repository.","contentUrl":"https://huggingface.co/datasets/Mirali33/mb-boulder_seg/tree/refs%2Fconvert%2Fparquet","encodingFormat":"git+https","sha256":"https://github.com/mlcommons/croissant/issues/80"},{"@type":"cr:FileSet","@id":"parquet-files-for-config-default","containedIn":{"@id":"repo"},"encodingFormat":"application/x-parquet","includes":"default/*/*.parquet"}],"recordSet":[{"@type":"cr:RecordSet","dataType":"cr:Split","key":{"@id":"default_splits/split_name"},"@id":"default_splits","name":"default_splits","description":"Splits for the default config.","field":[{"@type":"cr:Field","@id":"default_splits/split_name","dataType":"sc:Text"}],"data":[{"default_splits/split_name":"train"},{"default_splits/split_name":"test"},{"default_splits/split_name":"partition_train_0.10x_partition"},{"default_splits/split_name":"partition_train_0.20x_partition"},{"default_splits/split_name":"partition_train_0.25x_partition"},{"default_splits/split_name":"partition_train_0.50x_partition"},{"default_splits/split_name":"val"}]},{"@type":"cr:RecordSet","@id":"default","description":"Mirali33/mb-boulder_seg - 'default' subset\n\nAdditional information:\n- 7 splits: train, test, partition_train_0.10x_partition, partition_train_0.20x_partition, partition_train_0.25x_partition, partition_train_0.50x_partition, val","field":[{"@type":"cr:Field","@id":"default/split","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-default"},"extract":{"fileProperty":"fullpath"},"transform":{"regex":"default/(?:partial-)?(train|test|partition_train_0\\.10x_partition|partition_train_0\\.20x_partition|partition_train_0\\.25x_partition|partition_train_0\\.50x_partition|val)/.+parquet$"}},"references":{"field":{"@id":"default_splits/split_name"}}},{"@type":"cr:Field","@id":"default/image","dataType":"sc:ImageObject","source":{"fileSet":{"@id":"parquet-files-for-config-default"},"extract":{"column":"image"},"transform":{"jsonPath":"bytes"}}},{"@type":"cr:Field","@id":"default/mask","dataType":"sc:ImageObject","source":{"fileSet":{"@id":"parquet-files-for-config-default"},"extract":{"column":"mask"},"transform":{"jsonPath":"bytes"}}},{"@type":"cr:Field","@id":"default/width","dataType":"cr:Int64","source":{"fileSet":{"@id":"parquet-files-for-config-default"},"extract":{"column":"width"}}},{"@type":"cr:Field","@id":"default/height","dataType":"cr:Int64","source":{"fileSet":{"@id":"parquet-files-for-config-default"},"extract":{"column":"height"}}},{"@type":"cr:Field","@id":"default/class_labels","dataType":"sc:Text","source":{"fileSet":{"@id":"parquet-files-for-config-default"},"extract":{"column":"class_labels"}},"isArray":true,"arrayShape":"-1"}]}],"conformsTo":"http://mlcommons.org/croissant/1.1","name":"mb-boulder_seg","description":"\n\t\n\t\t\n\t\tmb-boulder_seg\n\t\n\nA segmentation dataset for planetary science applications.\n\n\t\n\t\t\n\t\tDataset Metadata\n\t\n\n\nLicense: CC-BY-4.0 (Creative Commons Attribution 4.0 International)\nVersion: 1.0\nDate Published: 2025-05-15\nCite As: TBD\n\n\n\t\n\t\t\n\t\tClasses\n\t\n\nThis dataset contains the following classes:\n\n0: Background\n1: Boulder\n\n\n\t\n\t\t\n\t\tDirectory Structure\n\t\n\nThe dataset follows this structure:\ndataset/\n  ├── train/\n  │   ├── images/  # Image files\n  │   └── masks/   # Segmentation masks\n  ├──… See the full description on the dataset page: https://huggingface.co/datasets/Mirali33/mb-boulder_seg.","alternateName":["Mirali33/mb-boulder_seg","mb-boulder_seg"],"creator":{"@type":"Person","name":"Mirali Purohit","url":"https://huggingface.co/Mirali33"},"keywords":["image-segmentation","semantic-segmentation","expert-generated","found","monolingual","original","English","cc-by-4.0","< 1K","parquet","Image","Text","Datasets","pandas","Croissant","Polars","🇺🇸 Region: US"],"license":"https://choosealicense.com/licenses/cc-by-4.0/","url":"https://huggingface.co/datasets/Mirali33/mb-boulder_seg"}