# Data sources: a list in which each item is one mapping describing a source.
data:
  - name: 'llava-pretrain'
    type: json
    # Relative path. NOTE(review): the base directory this resolves against
    # is not visible in this file; confirm with the code that loads it.
    path: '../../data/llava-pretrain/data/train.json'
    # NOTE(review): accepted values for `format` and `split` are defined by
    # the consumer; verify before changing them.
    format: chat
    split: train