{
  "@context": {
    "@language": "en",
    "@vocab": "https://schema.org/",
    "arrayShape": "cr:arrayShape",
    "citeAs": "cr:citeAs",
    "column": "cr:column",
    "conformsTo": "dct:conformsTo",
    "cr": "http://mlcommons.org/croissant/",
    "data": {
      "@id": "cr:data",
      "@type": "@json"
    },
    "dataBiases": "cr:dataBiases",
    "dataCollection": "cr:dataCollection",
    "dataType": {
      "@id": "cr:dataType",
      "@type": "@vocab"
    },
    "dct": "http://purl.org/dc/terms/",
    "extract": "cr:extract",
    "field": "cr:field",
    "fileProperty": "cr:fileProperty",
    "fileObject": "cr:fileObject",
    "fileSet": "cr:fileSet",
    "format": "cr:format",
    "includes": "cr:includes",
    "isArray": "cr:isArray",
    "isLiveDataset": "cr:isLiveDataset",
    "jsonPath": "cr:jsonPath",
    "key": "cr:key",
    "md5": "cr:md5",
    "parentField": "cr:parentField",
    "path": "cr:path",
    "personalSensitiveInformation": "cr:personalSensitiveInformation",
    "recordSet": "cr:recordSet",
    "references": "cr:references",
    "regex": "cr:regex",
    "repeated": "cr:repeated",
    "replace": "cr:replace",
    "sc": "https://schema.org/",
    "separator": "cr:separator",
    "source": "cr:source",
    "subField": "cr:subField",
    "transform": "cr:transform"
  },
  "@type": "sc:Dataset",
  "distribution": [
    {
      "@type": "cr:FileObject",
      "@id": "repo",
      "name": "repo",
      "description": "The Hugging Face git repository.",
      "contentUrl": "https://huggingface.co/datasets/SoMi-ToM/SoMi-ToM/tree/refs%2Fconvert%2Fparquet",
      "encodingFormat": "git+https",
      "sha256": "https://github.com/mlcommons/croissant/issues/80"
    },
    {
      "@type": "cr:FileSet",
      "@id": "parquet-files-for-config-first_person_eval",
      "containedIn": {
        "@id": "repo"
      },
      "encodingFormat": "application/x-parquet",
      "includes": "first_person_eval/*/*.parquet"
    },
    {
      "@type": "cr:FileSet",
      "@id": "parquet-files-for-config-third_person_eval",
      "containedIn": {
        "@id": "repo"
      },
      "encodingFormat": "application/x-parquet",
      "includes": "third_person_eval/*/*.parquet"
    }
  ],
  "recordSet": [
    {
      "@type": "cr:RecordSet",
      "dataType": "cr:Split",
      "key": {
        "@id": "first_person_eval_splits/split_name"
      },
      "@id": "first_person_eval_splits",
      "name": "first_person_eval_splits",
      "description": "Splits for the first_person_eval config.",
      "field": [
        {
          "@type": "cr:Field",
          "@id": "first_person_eval_splits/split_name",
          "dataType": "sc:Text"
        }
      ],
      "data": [
        {
          "first_person_eval_splits/split_name": "first_person_boat_hinder"
        },
        {
          "first_person_eval_splits/split_name": "first_person_chest_hinder"
        },
        {
          "first_person_eval_splits/split_name": "first_person_door_hinder"
        },
        {
          "first_person_eval_splits/split_name": "first_person_boat"
        },
        {
          "first_person_eval_splits/split_name": "first_person_chest"
        },
        {
          "first_person_eval_splits/split_name": "first_person_door"
        },
        {
          "first_person_eval_splits/split_name": "first_person_stonepickaxe"
        },
        {
          "first_person_eval_splits/split_name": "first_person_woodenpickaxe"
        }
      ]
    },
    {
      "@type": "cr:RecordSet",
      "@id": "first_person_eval",
      "description": "SoMi-ToM/SoMi-ToM - 'first_person_eval' subset\n\nAdditional information:\n- 8 splits: first_person_boat_hinder, first_person_chest_hinder, first_person_door_hinder, first_person_boat, first_person_chest, first_person_door, first_person_stonepickaxe, first_person_woodenpickaxe",
      "field": [
        {
          "@type": "cr:Field",
          "@id": "first_person_eval/split",
          "dataType": "sc:Text",
          "source": {
            "fileSet": {
              "@id": "parquet-files-for-config-first_person_eval"
            },
            "extract": {
              "fileProperty": "fullpath"
            },
            "transform": {
              "regex": "first_person_eval/(?:partial-)?(first_person_boat_hinder|first_person_chest_hinder|first_person_door_hinder|first_person_boat|first_person_chest|first_person_door|first_person_stonepickaxe|first_person_woodenpickaxe)/.+parquet$"
            }
          },
          "references": {
            "field": {
              "@id": "first_person_eval_splits/split_name"
            }
          }
        },
        {
          "@type": "cr:Field",
          "@id": "first_person_eval/character",
          "dataType": "sc:Text",
          "source": {
            "fileSet": {
              "@id": "parquet-files-for-config-first_person_eval"
            },
            "extract": {
              "column": "character"
            }
          }
        },
        {
          "@type": "cr:Field",
          "@id": "first_person_eval/Jack",
          "dataType": "sc:Text",
          "source": {
            "fileSet": {
              "@id": "parquet-files-for-config-first_person_eval"
            },
            "extract": {
              "column": "Jack"
            }
          }
        },
        {
          "@type": "cr:Field",
          "@id": "first_person_eval/Jane",
          "dataType": "sc:Text",
          "source": {
            "fileSet": {
              "@id": "parquet-files-for-config-first_person_eval"
            },
            "extract": {
              "column": "Jane"
            }
          }
        },
        {
          "@type": "cr:Field",
          "@id": "first_person_eval/John",
          "dataType": "sc:Text",
          "source": {
            "fileSet": {
              "@id": "parquet-files-for-config-first_person_eval"
            },
            "extract": {
              "column": "John"
            }
          }
        },
        {
          "@type": "cr:Field",
          "@id": "first_person_eval/image_url",
          "dataType": "sc:Text",
          "source": {
            "fileSet": {
              "@id": "parquet-files-for-config-first_person_eval"
            },
            "extract": {
              "column": "image_url"
            }
          }
        },
        {
          "@type": "cr:Field",
          "@id": "first_person_eval/dialogue_history",
          "dataType": "sc:Text",
          "source": {
            "fileSet": {
              "@id": "parquet-files-for-config-first_person_eval"
            },
            "extract": {
              "column": "dialogue_history"
            }
          }
        },
        {
          "@type": "cr:Field",
          "@id": "first_person_eval/ground_truth",
          "dataType": "sc:Text",
          "source": {
            "fileSet": {
              "@id": "parquet-files-for-config-first_person_eval"
            },
            "extract": {
              "column": "ground_truth"
            }
          }
        },
        {
          "@type": "cr:Field",
          "@id": "first_person_eval/files",
          "dataType": "sc:Text",
          "source": {
            "fileSet": {
              "@id": "parquet-files-for-config-first_person_eval"
            },
            "extract": {
              "column": "files"
            }
          }
        }
      ]
    },
    {
      "@type": "cr:RecordSet",
      "dataType": "cr:Split",
      "key": {
        "@id": "third_person_eval_splits/split_name"
      },
      "@id": "third_person_eval_splits",
      "name": "third_person_eval_splits",
      "description": "Splits for the third_person_eval config.",
      "field": [
        {
          "@type": "cr:Field",
          "@id": "third_person_eval_splits/split_name",
          "dataType": "sc:Text"
        }
      ],
      "data": [
        {
          "third_person_eval_splits/split_name": "third_person_hinder"
        },
        {
          "third_person_eval_splits/split_name": "third_person"
        }
      ]
    },
    {
      "@type": "cr:RecordSet",
      "@id": "third_person_eval",
      "description": "SoMi-ToM/SoMi-ToM - 'third_person_eval' subset\n\nAdditional information:\n- 2 splits: third_person_hinder, third_person",
      "field": [
        {
          "@type": "cr:Field",
          "@id": "third_person_eval/split",
          "dataType": "sc:Text",
          "source": {
            "fileSet": {
              "@id": "parquet-files-for-config-third_person_eval"
            },
            "extract": {
              "fileProperty": "fullpath"
            },
            "transform": {
              "regex": "third_person_eval/(?:partial-)?(third_person_hinder|third_person)/.+parquet$"
            }
          },
          "references": {
            "field": {
              "@id": "third_person_eval_splits/split_name"
            }
          }
        },
        {
          "@type": "cr:Field",
          "@id": "third_person_eval/files",
          "dataType": "sc:Text",
          "source": {
            "fileSet": {
              "@id": "parquet-files-for-config-third_person_eval"
            },
            "extract": {
              "column": "files"
            }
          }
        },
        {
          "@type": "cr:Field",
          "@id": "third_person_eval/video_paths",
          "dataType": "sc:Text",
          "source": {
            "fileSet": {
              "@id": "parquet-files-for-config-third_person_eval"
            },
            "extract": {
              "column": "video_paths"
            }
          }
        },
        {
          "@type": "cr:Field",
          "@id": "third_person_eval/goal",
          "dataType": "sc:Text",
          "source": {
            "fileSet": {
              "@id": "parquet-files-for-config-third_person_eval"
            },
            "extract": {
              "column": "goal"
            }
          }
        },
        {
          "@type": "cr:Field",
          "@id": "third_person_eval/behavior",
          "dataType": "sc:Text",
          "source": {
            "fileSet": {
              "@id": "parquet-files-for-config-third_person_eval"
            },
            "extract": {
              "column": "behavior"
            }
          }
        },
        {
          "@type": "cr:Field",
          "@id": "third_person_eval/behavior_Jack",
          "dataType": "sc:Text",
          "source": {
            "fileSet": {
              "@id": "parquet-files-for-config-third_person_eval"
            },
            "extract": {
              "column": "behavior_Jack"
            }
          }
        },
        {
          "@type": "cr:Field",
          "@id": "third_person_eval/behavior_Jane",
          "dataType": "sc:Text",
          "source": {
            "fileSet": {
              "@id": "parquet-files-for-config-third_person_eval"
            },
            "extract": {
              "column": "behavior_Jane"
            }
          }
        },
        {
          "@type": "cr:Field",
          "@id": "third_person_eval/behavior_John",
          "dataType": "sc:Text",
          "source": {
            "fileSet": {
              "@id": "parquet-files-for-config-third_person_eval"
            },
            "extract": {
              "column": "behavior_John"
            }
          }
        },
        {
          "@type": "cr:Field",
          "@id": "third_person_eval/ground_truth",
          "dataType": "sc:Text",
          "source": {
            "fileSet": {
              "@id": "parquet-files-for-config-third_person_eval"
            },
            "extract": {
              "column": "ground_truth"
            }
          }
        }
      ]
    }
  ],
  "conformsTo": "http://mlcommons.org/croissant/1.1",
  "name": "SoMi-ToM",
  "identifier": "10.57967/hf/6569",
  "description": "\n  \n    \n      SoMi-ToM: Evaluating Multi-Perspective Theory of Mind in Embodied Social Interactions\n    \n  \n\n\n NeurIPS 2025\n\n\n  ❤️ Like our project on Hugging Face to show your support!\n\n\n\n\n  \n    \n  \n  \n    \n  \n  \n    \n  \n\n\n\n\n\t\n\t\t\n\t\tSoMi-ToM Benchmark\n\t\n\nWe propose the SoMi-ToM benchmark, designed to evaluate multi-perspective ToM in embodied multi-agent complex social interactions. This benchmark is based on rich multimodal interaction data generated by the interaction environment SoMi… See the full description on the dataset page: https://huggingface.co/datasets/SoMi-ToM/SoMi-ToM.",
  "alternateName": [
    "SoMi-ToM/SoMi-ToM"
  ],
  "creator": {
    "@type": "Person",
    "name": "Xianzhe Fan",
    "url": "https://huggingface.co/SoMi-ToM"
  },
  "keywords": [
    "mit",
    "1K - 10K",
    "csv",
    "Image",
    "Text",
    "Video",
    "Datasets",
    "pandas",
    "Croissant",
    "Polars",
    "arxiv:2506.23046",
    "doi:10.57967/hf/6569",
    "🇺🇸 Region: US"
  ],
  "license": "https://choosealicense.com/licenses/mit/",
  "url": "https://huggingface.co/datasets/SoMi-ToM/SoMi-ToM"
}
