# Dataset registry: each key under `datasets` configures one named dataset.
datasets:
  # Settings for the `cc_sbu` dataset entry.
  cc_sbu:
    # Modality tag for this dataset.
    data_type: images
    build_info:
      # Absolute, machine-specific location of the .tar shards; change it to
      # match the local filesystem layout.
      # The `{00000..01255}` part is a brace range naming shards 00000 through
      # 01255. It is kept as a literal string here and is presumably expanded
      # by the data loader (WebDataset-style) — TODO confirm against consumer.
      # Quoted so the braces can never be read as YAML flow-mapping syntax.
      storage: '/data/NeurIPS24/VL/MiniGPT-4/pre_trained/dataset_stage1_pretrain/cc_sbu/cc_sbu_dataset/{00000..01255}.tar'
