[
    {
        "dataset_name": "redpajama_4k",
        "task_name": "redpajama_4k",
        "abs_weight": 0.4,
        "version": "/user/tc_agi/klara/datasets/redpajama/part_4k_20240515",
        "path": "/mnt/data/user/tc_agi/llm/index_datasets/redpajama_en_5_deduped_0323",
        "transforms": "datasets/redpajama/script.py",
        "nlines": 63407,
        "ave_tokens_per_line": 31749.0455,
        "total_tokens": 20.7,
        "allow_repeat": true
    }
]
