{
  "@context": {
    "@language": "en",
    "@vocab": "https://schema.org/",
    "arrayShape": "cr:arrayShape",
    "citeAs": "cr:citeAs",
    "column": "cr:column",
    "conformsTo": "dct:conformsTo",
    "cr": "http://mlcommons.org/croissant/",
    "data": {
      "@id": "cr:data",
      "@type": "@json"
    },
    "dataBiases": "cr:dataBiases",
    "dataCollection": "cr:dataCollection",
    "dataType": {
      "@id": "cr:dataType",
      "@type": "@vocab"
    },
    "dct": "http://purl.org/dc/terms/",
    "extract": "cr:extract",
    "field": "cr:field",
    "fileProperty": "cr:fileProperty",
    "fileObject": "cr:fileObject",
    "fileSet": "cr:fileSet",
    "format": "cr:format",
    "includes": "cr:includes",
    "isArray": "cr:isArray",
    "isLiveDataset": "cr:isLiveDataset",
    "jsonPath": "cr:jsonPath",
    "key": "cr:key",
    "md5": "cr:md5",
    "parentField": "cr:parentField",
    "path": "cr:path",
    "personalSensitiveInformation": "cr:personalSensitiveInformation",
    "recordSet": "cr:recordSet",
    "references": "cr:references",
    "regex": "cr:regex",
    "repeated": "cr:repeated",
    "replace": "cr:replace",
    "sc": "https://schema.org/",
    "separator": "cr:separator",
    "source": "cr:source",
    "subField": "cr:subField",
    "transform": "cr:transform"
  },
  "@type": "sc:Dataset",
  "distribution": [
    {
      "@type": "cr:FileObject",
      "@id": "repo",
      "name": "repo",
      "description": "The Hugging Face git repository.",
      "contentUrl": "https://huggingface.co/datasets/retail-product-promotion/mSOP-765k/tree/refs%2Fconvert%2Fparquet",
      "encodingFormat": "git+https",
      "sha256": "https://github.com/mlcommons/croissant/issues/80"
    }
  ],
  "recordSet": [],
  "conformsTo": "http://mlcommons.org/croissant/1.1",
  "name": "mSOP-765k",
  "description": "mSOP-765k: A Benchmark For Multi-Modal Structured Output Predictions\n\nThe mSOP-765k dataset serves as a benchmark for Multi-Modal Structured Output Predictions.\nThe dataset contains approximately 765k data points, comprising both images and textual data.\n\nData\n\nImage Data:\n\nThe images are cropped from scanned advertisement leaflets.\nThe image data is divided into train and test splits.\nThe image dataset is available in two versions: one with images resized so that the longer… See the full description on the dataset page: https://huggingface.co/datasets/retail-product-promotion/mSOP-765k.",
  "alternateName": [
    "retail-product-promotion/mSOP-765k"
  ],
  "creator": {
    "@type": "Person",
    "name": "rpp-765k",
    "url": "https://huggingface.co/retail-product-promotion"
  },
  "keywords": [
    "visual-question-answering",
    "cc-by-nc-nd-4.0",
    "100K<n<1M",
    "🇺🇸 Region: US"
  ],
  "license": "https://choosealicense.com/licenses/cc-by-nc-nd-4.0/",
  "url": "https://huggingface.co/datasets/retail-product-promotion/mSOP-765k"
}