# Dataset manifest: a list of entries, each with three string fields:
#   json_path         - path to a JSON file
#                       (NOTE(review): presumably relative to a data root
#                       configured elsewhere - confirm against the loader)
#   sampling_strategy - "all" or "first:N%" are the only forms used here
#                       (presumably "first:N%" keeps the leading N% of the
#                       file's records - TODO confirm in the consumer)
#   folder_name       - a label for the entry
#                       (NOTE(review): exact use is not visible in this file)
# folder_name values are plain scalars containing "(", ")" and ",". That is
# valid in block style; quote them if an entry is ever rewritten in flow style.
datasets:
  # --- Entries under llava_instruct/real_vision_flan/ ---
  - json_path: llava_instruct/real_vision_flan/llavar_gpt4_20k.json
    sampling_strategy: "all"
    folder_name: llavar_gpt4_20k
  # Subsampled ("first:5%"). A second ScienceQA file is also listed under
  # llava_instruct/cauldron/ in this manifest.
  - json_path: llava_instruct/real_vision_flan/scienceqa_nona_context_19218.json
    sampling_strategy: "first:5%"
    folder_name: scienceqa(nona_context)
  - json_path: llava_instruct/real_vision_flan/allava_instruct_vflan4v_20000.json
    sampling_strategy: "all"
    folder_name: allava_instruct_vflan4v
  - json_path: llava_instruct/real_vision_flan/allava_instruct_laion4v_50000.json
    sampling_strategy: "all"
    folder_name: allava_instruct_laion4v
  - json_path: llava_instruct/real_vision_flan/vision_flan_filtered_186070.json
    sampling_strategy: "all"
    folder_name: vision_flan(filtered)
  # Subsampled ("first:5%"). A second IconQA file is also listed under
  # llava_instruct/cauldron/ in this manifest.
  - json_path: llava_instruct/real_vision_flan/MathV360K_IconQA_22599.json
    sampling_strategy: "first:5%"
    folder_name: IconQA(MathV360K)
  - json_path: llava_instruct/real_vision_flan/MathV360K_VizWiz_6614.json
    sampling_strategy: "all"
    folder_name: VizWiz(MathV360K)
  - json_path: llava_instruct/real_vision_flan/image_textualization_dataset_filtered.json
    sampling_strategy: "all"
    folder_name: image_textualization(filtered)
  - json_path: llava_instruct/real_vision_flan/cambrian_filtered_gpt4vo_sp_token_fltd_max10k.json
    sampling_strategy: "all"
    folder_name: cambrian(filtered)
  # --- Entries under llava_instruct/cauldron/ ---
  # Three entries in this group are subsampled rather than "all":
  # clevr ("first:1%"), iconqa ("first:5%") and tallyqa ("first:10%").
  # NOTE(review): the numeric token in most file names looks like a record
  # count - an assumption from the names only; verify before relying on it.
  - json_path: llava_instruct/cauldron/clevr_70000_llava_format.json
    sampling_strategy: "first:1%"
    folder_name: clevr(cauldron,llava_format)
  - json_path: llava_instruct/cauldron/hateful_memes_8500_llava_format.json
    sampling_strategy: "all"
    folder_name: hateful_memes(cauldron,llava_format)
  # An IconQA file is also listed under llava_instruct/real_vision_flan/
  # (MathV360K_IconQA) in this manifest.
  - json_path: llava_instruct/cauldron/iconqa_llava_format_27307.json
    sampling_strategy: "first:5%"
    folder_name: iconqa(cauldron,llava_format)
  - json_path: llava_instruct/cauldron/intergps_1280_llava_format.json
    sampling_strategy: "all"
    folder_name: intergps(cauldron,llava_format)
  # A ScienceQA file is also listed under llava_instruct/real_vision_flan/
  # (scienceqa_nona_context) in this manifest.
  - json_path: llava_instruct/cauldron/scienceqa_llava_format_4976.json
    sampling_strategy: "all"
    folder_name: scienceqa(cauldron,llava_format)
  - json_path: llava_instruct/cauldron/tallyqa_98680_llava_format.json
    sampling_strategy: "first:10%"
    folder_name: tallyqa(cauldron,llava_format)
  - json_path: llava_instruct/cauldron/st_vqa_17247_llava_format.json
    sampling_strategy: "all"
    folder_name: st_vqa(cauldron,llava_format)
  - json_path: llava_instruct/cauldron/visual7w_llava_format_14366.json
    sampling_strategy: "all"
    folder_name: visual7w(cauldron,llava_format)
  - json_path: llava_instruct/cauldron/vqarad_313_llava_format.json
    sampling_strategy: "all"
    folder_name: vqarad(cauldron,llava_format)
  - json_path: llava_instruct/cauldron/vsr_2157_llava_format.json
    sampling_strategy: "all"
    folder_name: vsr(cauldron,llava_format)
  # The last two file names carry no "llava_format" token, and their
  # folder_name labels omit it as well.
  - json_path: llava_instruct/cauldron/vistext_9969.json
    sampling_strategy: "all"
    folder_name: vistext(cauldron)
  - json_path: llava_instruct/cauldron/websight_10000.json
    sampling_strategy: "all"
    folder_name: websight(cauldron)
