{
    "uuid": "e4d57bad-5b6e-4bc0-b364-e63a8f27ca9b",
    "name": "CC_full_v4_pre2023_05_of_10_resliparse",
    "creation_date": "2024-03-14 20:12:09",
    "sources": "s3://***REMOVED***/commoncrawl_paths.txt.gz",
    "tokenized": false,
    "tokenizer": null,
    "size": "26 TB",
    "seed": 42,
    "json_path": "s3://dcnlp-west/CC_full_v4_pre2023_jsons/CC_full_v4_pre2023_split/CC_full_v4_pre2023_05_of_10.json.gz",
    "dcnlp_commit_hash": "483faef02615ae529ea0ae45736948b8975644c4",
    "dataset_url": "s3://***REMOVED***/users/vaishaal/mlr/dcnlp_data/common_crawl_v4_pre2023_jsonls/CC_full_v4_pre2023_05_of_10/",
    "dcnlp_diff": ""
}