---
# Dataset mixture. Each list entry gives a json_path, a sampling_strategy and
# a folder_name.
# NOTE(review): 'all' presumably keeps every record of the JSON file and
# 'first:N%' only the leading N% - confirm against the loader that reads this.
datasets:
  # Sources under llava_instruct/real_vision_flan/
  - json_path: llava_instruct/real_vision_flan/ai2d_azuregpt_detailed_understanding_4874.json
    sampling_strategy: 'all'
    folder_name: 'ai2d(gpt4v)'
  - json_path: llava_instruct/real_vision_flan/infographic_vqa_4404.json
    sampling_strategy: 'all'
    folder_name: 'infographic_vqa'
  - json_path: llava_instruct/real_vision_flan/infographic_azuregpt4v_1992.json
    sampling_strategy: 'all'
    folder_name: 'infographic(gpt4v)'
  - json_path: llava_instruct/real_vision_flan/lrv_chart_1787.json
    sampling_strategy: 'all'
    folder_name: 'lrv_chart'
  - json_path: llava_instruct/real_vision_flan/ai2d_train_internvl_single_12413.json
    sampling_strategy: 'all'
    folder_name: 'ai2d(internvl)'
  # Sources under llava_instruct/ureader_new/ (qa, cap, ie, kg splits)
  - json_path: llava_instruct/ureader_new/ureader_qa_sft.json
    sampling_strategy: 'all'
    folder_name: 'ureader_qa'
  - json_path: llava_instruct/ureader_new/ureader_cap_sft.json
    sampling_strategy: 'all'
    folder_name: 'ureader_cap'
  - json_path: llava_instruct/ureader_new/ureader_ie_sft.json
    sampling_strategy: 'all'
    folder_name: 'ureader_ie'
  - json_path: llava_instruct/ureader_new/ureader_kg_sft.json
    sampling_strategy: 'all'
    folder_name: 'ureader_kg'
  # MathV360K FigureQA, stored under llava_instruct/real_vision_flan/.
  # NOTE(review): 'first:5%' presumably selects the leading 5% of records -
  # confirm against the loader.
  - json_path: llava_instruct/real_vision_flan/MathV360K_FigureQA_17597.json
    sampling_strategy: 'first:5%'
    folder_name: 'FigureQA(MathV360K)'
  # Sources under llava_instruct/cauldron/
  # Folder names here contain parentheses and commas; they are quoted so the
  # values stay plain strings even if an entry is later moved into flow style.
  - json_path: llava_instruct/cauldron/ai2d_llava_format_2434.json
    sampling_strategy: 'all'
    folder_name: 'ai2d(cauldron,llava_format)'
  - json_path: llava_instruct/cauldron/chart2text_26961.json
    sampling_strategy: 'all'
    folder_name: 'chart2text(cauldron)'
  - json_path: llava_instruct/cauldron/chartqa_18265_llava_format.json
    sampling_strategy: 'all'
    folder_name: 'chartqa(cauldron,llava_format)'
  - json_path: llava_instruct/cauldron/diagram_image_to_text_300.json
    sampling_strategy: 'all'
    folder_name: 'diagram_image_to_text(cauldron)'
  - json_path: llava_instruct/cauldron/dvqa_200000_llava_format.json
    sampling_strategy: 'first:1%'
    folder_name: 'dvqa(cauldron,llava_format)'
  - json_path: llava_instruct/cauldron/figureqa_100000_llava_format.json
    sampling_strategy: 'first:1%'
    folder_name: 'figureqa(cauldron,llava_format)'
  - json_path: llava_instruct/cauldron/hitab_2500_llava_format.json
    sampling_strategy: 'all'
    folder_name: 'hitab(cauldron,llava_format)'
  # NOTE(review): this folder_name does not follow the
  # 'name(cauldron,llava_format)' pattern used by the sibling entries -
  # confirm it matches the actual folder before changing it.
  - json_path: llava_instruct/cauldron/infographic_vqa_2118_llava_format.json
    sampling_strategy: 'all'
    folder_name: 'infographic_vqa_llava_format'
  - json_path: llava_instruct/cauldron/robut_sqa_8514.json
    sampling_strategy: 'all'
    folder_name: 'robut_sqa(cauldron)'
  - json_path: llava_instruct/cauldron/robut_wikisql_74989.json
    sampling_strategy: 'all'
    folder_name: 'robut_wikisql(cauldron)'
  - json_path: llava_instruct/cauldron/robut_wtq_38246_llava_format.json
    sampling_strategy: 'all'
    folder_name: 'robut_wtq(cauldron,llava_format)'
  - json_path: llava_instruct/cauldron/screen2words_15730.json
    sampling_strategy: 'all'
    folder_name: 'screen2words(cauldron)'
  - json_path: llava_instruct/cauldron/tqa_llava_format_27307.json
    sampling_strategy: 'first:5%'
    folder_name: 'tqa(cauldron,llava_format)'
  - json_path: llava_instruct/cauldron/visualmrc_3027.json
    sampling_strategy: 'all'
    folder_name: 'visualmrc(cauldron)'
