[
    {
        "dataset_name": "redpajama_8k",
        "task_name": "redpajama_8k",
        "abs_weight": 0.4,
        "version": "/user/tc_agi/klara/datasets/redpajama/redpajama_8k_20240516",
        "path": "/mnt/data/user/tc_agi/zxr/redpajama_en_5_deduped_0323_0515_8k",
        "transforms": "datasets/redpajama/script.py",
        "nlines": 63407,
        "ave_tokens_per_line": 31749.0455,
        "total_tokens": 20.7,
        "allow_repeat": true
    }
]
