---
# Mixture `cvpr_mmmu_v13_5M`: 65 dataset entries.
# Most entries carry an `@0.5` suffix; the remainder are listed bare.
# NOTE(review): the meaning of the `@<value>` suffix is defined by whatever
# consumes this file (presumably a per-dataset sampling/selection
# parameter) - confirm against the loader.
cvpr_mmmu_v13_5M:
    - sharegpt4v_gpt4_100k@0.5
    - llava_instruct@0.5
    # NOTE(review): the only entry in this file where `@0.5` is followed by
    # more text (`_gqa`); confirm it resolves to a registered name and is
    # not a typo.
    - sharegpt4v_sft@0.5_gqa
    - dvqa_train_200k@0.5
    - chartqa_train_18k_cot2
    - ai2d_train_12k
    - docvqa_train_10k
    - geoqa@0.5
    - synthdog_en@0.5
    - scienceqa
    - wit_subset@0.5
    - math@0.5
    - sherlock@0.5
    - idefics2_sft@0.5
    - llave_onevision_images_sft_cot2
    - cambrian_1375k@0.5
    - stem_qa@0.5
    - nv_mm_sft@0.5
    # The next 13 entries are the members of `vflan_no_video` (defined later
    # in this file), listed individually and in the same order; all but
    # `vqa_docvqa_train` and `vqa_gqa_train` carry `@0.5`.
    - captioning_image-paragraph-captioning_train@0.5
    - captioning_textcap_train@0.5
    - generation_visual-dialog_train@0.5
    - reasoning_clevr_train@0.5
    - reasoning_nlvr_train@0.5
    - reasoning_visual-mrc_train@0.5
    - vqa_docvqa_train
    - vqa_gqa_train
    - vqa_ivqa_train@0.5
    - vqa_ocr-vqa_train@0.5
    - vqa_st-vqa_train@0.5
    - vqa_viquae_train@0.5
    - vqa_vqa-v2_train@0.5
    - shikra@0.5
    - lrv_instruction@0.5
    - textocr_qa@0.5
    - mmc_instruction@0.5
    - unimm_chat@0.5
    - svit@0.5
    - mmbench_val
    - cvbench
    - doc_reason@0.5
    - mtwi
    - kvqa
    - art@0.5
    - mimicvqa@0.5
    - slake@0.5
    - medvqa@0.5
    - pathvqa@0.5
    - tabmwp_cot
    - grandstaff_qa@0.5
    - chembl@0.5
    - estvqa
    - poie
    - sroie
    - ureaderkg@0.5
    - real-cqa@0.5
    - mminstruct@0.5
    - unichart@0.5
    - wordart
    - orand-b
    - olmo_doc_table@0.5
    - olmo_doc_doc@0.5
    - olmo_doc_diagrams@0.5
    - olmo_doc_charts@0.5
    - olmo_clock200k@0.5
    - olmo_askanything@0.5

# Mixture `llava-video-sft`: 12 entries, all under the `llava-video/`
# prefix. Each name ends in `-cap`, `-mc`, or `-oe`.
# NOTE(review): the suffixes presumably denote captioning, multiple-choice,
# and open-ended subsets - confirm against the dataset registry.
llava-video-sft:
    - llava-video/academic-cap
    - llava-video/academic-mc
    - llava-video/academic-oe
    - llava-video/activitynetqa-oe
    - llava-video/nextqa-mc
    - llava-video/nextqa-oe
    - llava-video/perceptiontest-mc
    - llava-video/sharegptvideo-cap
    - llava-video/sharegptvideo-oe
    - llava-video/youtube-cap
    - llava-video/youtube-mc
    - llava-video/youtube-oe

# Mixture `recipe_v13`: 52 bare entries (no `@` suffixes).
# Relative to `recipe_v9` in this file it keeps the same entries in the
# same order except that `vatex` is omitted, and it appends nine entries
# after `cvbench` (`m4-instruct-image-nuscenes` through `kvqa`).
recipe_v13:
    - sharegpt4v_gpt4_100k
    - llava_instruct
    - sharegpt4v_sft
    - dvqa_train_200k
    - chartqa_train_18k
    - ai2d_train_12k
    - docvqa_train_10k
    - geoqa
    - synthdog_en
    - scienceqa
    - wit_subset
    - math
    - sherlock
    - idefics2_sft
    - llave_onevision_images_sft
    - cambrian_1375k
    - shot2story_shotonly
    - video_chatgpt
    - youcook2
    - sharegpt_video
    - stem_qa
    - nv_mm_sft
    - jukinmedia
    - sharegpt4video
    - k710
    - ssv2
    - reason_clevrerqa
    - reason_clevrermc
    - vcg_human
    - video_chat1
    - av_llava_4785
    - vflan
    - refcoco_train
    - shikra
    - lrv_instruction
    - textocr_qa
    - mmc_instruction
    - m4-instruct-video
    - nextqa_mc
    - unimm_chat
    - svit
    - mmbench_val
    - cvbench
    # Entries below do not appear in `recipe_v9`.
    - m4-instruct-image-nuscenes
    - webvid_qa
    - caption_videochat
    - doc_reason
    - metamathqa
    - mminstruct
    - unichart
    - mtwi
    - kvqa

# Mixture `recipe_v9_no_video_30`: filtering 1829303 of 6883312,
# a 27% reduction.
# Lists the same 34 dataset names, in the same order, as
# `recipe_v9_no_video`; 24 of them carry an `@30` suffix and 10 are bare.
# NOTE(review): `@30` is presumably the filter setting that produces the
# reduction quoted above - confirm against the loader. Also confirm that
# the bare entries are intentionally left unfiltered.
recipe_v9_no_video_30:
    - sharegpt4v_gpt4_100k@30
    - llava_instruct@30
    - sharegpt4v_sft@30
    - dvqa_train_200k
    - chartqa_train_18k@30
    - ai2d_train_12k@30
    - docvqa_train_10k@30
    - geoqa@30
    - synthdog_en@30
    - scienceqa@30
    - wit_subset@30
    - math
    - sherlock@30
    - idefics2_sft@30
    - llave_onevision_images_sft@30
    - cambrian_1375k@30
    - stem_qa@30
    - nv_mm_sft@30
    - k710
    - ssv2
    - reason_clevrerqa
    - reason_clevrermc
    - vcg_human
    - vflan
    - refcoco_train@30
    - shikra@30
    - lrv_instruction
    - textocr_qa@30
    - mmc_instruction@30
    - nextqa_mc
    - unimm_chat@30
    - svit@30
    - mmbench_val@30
    - cvbench@30

# Mixture `recipe_v9_no_video_20`: filtering 2732497 of 6883312,
# a 40% reduction.
# Lists the same 34 dataset names, in the same order, as
# `recipe_v9_no_video`; 24 of them carry an `@20` suffix and 10 are bare
# (the same 10 that are bare in `recipe_v9_no_video_30`).
# NOTE(review): `@20` is presumably the filter setting that produces the
# reduction quoted above - confirm against the loader.
recipe_v9_no_video_20:
    - sharegpt4v_gpt4_100k@20
    - llava_instruct@20
    - sharegpt4v_sft@20
    - dvqa_train_200k
    - chartqa_train_18k@20
    - ai2d_train_12k@20
    - docvqa_train_10k@20
    - geoqa@20
    - synthdog_en@20
    - scienceqa@20
    - wit_subset@20
    - math
    - sherlock@20
    - idefics2_sft@20
    - llave_onevision_images_sft@20
    - cambrian_1375k@20
    - stem_qa@20
    - nv_mm_sft@20
    - k710
    - ssv2
    - reason_clevrerqa
    - reason_clevrermc
    - vcg_human
    - vflan
    - refcoco_train@20
    - shikra@20
    - lrv_instruction
    - textocr_qa@20
    - mmc_instruction@20
    - nextqa_mc
    - unimm_chat@20
    - svit@20
    - mmbench_val@20
    - cvbench@20

# Mixture `recipe_v9_no_video`: 34 bare entries.
# Equals `recipe_v9` with these ten entries removed: shot2story_shotonly,
# video_chatgpt, youcook2, vatex, sharegpt_video, jukinmedia,
# sharegpt4video, video_chat1, av_llava_4785, m4-instruct-video.
# NOTE(review): this list names `vflan`, not `vflan_no_video`; the `vflan`
# list in this file contains the entries that `vflan_no_video` drops.
# Confirm which one is intended here.
recipe_v9_no_video:
    - sharegpt4v_gpt4_100k
    - llava_instruct
    - sharegpt4v_sft
    - dvqa_train_200k
    - chartqa_train_18k
    - ai2d_train_12k
    - docvqa_train_10k
    - geoqa
    - synthdog_en
    - scienceqa
    - wit_subset
    - math
    - sherlock
    - idefics2_sft
    - llave_onevision_images_sft
    - cambrian_1375k
    - stem_qa
    - nv_mm_sft
    - k710
    - ssv2
    - reason_clevrerqa
    - reason_clevrermc
    - vcg_human
    - vflan
    - refcoco_train
    - shikra
    - lrv_instruction
    - textocr_qa
    - mmc_instruction
    - nextqa_mc
    - unimm_chat
    - svit
    - mmbench_val
    - cvbench

# Mixture `recipe_v9`: 44 bare entries (no `@` suffixes).
# `recipe_v9_no_video` in this file is this list minus ten entries, and
# `recipe_v13` is this list minus `vatex` plus nine appended entries.
# NOTE(review): `vflan` is also a top-level key in this file; presumably
# the consumer expands it as a nested mixture - confirm.
recipe_v9:
    - sharegpt4v_gpt4_100k
    - llava_instruct
    - sharegpt4v_sft
    - dvqa_train_200k
    - chartqa_train_18k
    - ai2d_train_12k
    - docvqa_train_10k
    - geoqa
    - synthdog_en
    - scienceqa
    - wit_subset
    - math
    - sherlock
    - idefics2_sft
    - llave_onevision_images_sft
    - cambrian_1375k
    - shot2story_shotonly
    - video_chatgpt
    - youcook2
    - vatex
    - sharegpt_video
    - stem_qa
    - nv_mm_sft
    - jukinmedia
    - sharegpt4video
    - k710
    - ssv2
    - reason_clevrerqa
    - reason_clevrermc
    - vcg_human
    - video_chat1
    - av_llava_4785
    - vflan
    - refcoco_train
    - shikra
    - lrv_instruction
    - textocr_qa
    - mmc_instruction
    - m4-instruct-video
    - nextqa_mc
    - unimm_chat
    - svit
    - mmbench_val
    - cvbench

# Mixture `vflan`: 18 entries, grouped by name prefix (`captioning_`,
# `generation_`, `reasoning_`, `text_`, `vqa_`) and sorted by name.
# The name `vflan` also appears as a list item inside several recipes in
# this file.
vflan:
    - captioning_image-paragraph-captioning_train
    - captioning_msrvtt_train
    - captioning_textcap_train
    - generation_visual-dialog_train
    - reasoning_clevr_train
    - reasoning_nlvr_train
    - reasoning_visual-mrc_train
    - text_flan_1m
    - vqa_activitynet-qa_train
    - vqa_docvqa_train
    - vqa_gqa_train
    - vqa_ivqa_train
    - vqa_msrvtt-qa_train
    - vqa_msvd-qa_train
    - vqa_ocr-vqa_train
    - vqa_st-vqa_train
    - vqa_viquae_train
    - vqa_vqa-v2_train

# Mixture `vflan_no_video`: 13 entries.
# Equals `vflan` with five entries removed: captioning_msrvtt_train,
# text_flan_1m, vqa_activitynet-qa_train, vqa_msrvtt-qa_train,
# vqa_msvd-qa_train.
# NOTE(review): `text_flan_1m` is dropped along with the others even though
# its name does not suggest video - confirm this is intentional.
vflan_no_video:
    - captioning_image-paragraph-captioning_train
    - captioning_textcap_train
    - generation_visual-dialog_train
    - reasoning_clevr_train
    - reasoning_nlvr_train
    - reasoning_visual-mrc_train
    - vqa_docvqa_train
    - vqa_gqa_train
    - vqa_ivqa_train
    - vqa_ocr-vqa_train
    - vqa_st-vqa_train
    - vqa_viquae_train
    - vqa_vqa-v2_train

# Mixture `vflan_no_video_no_docvqa`: 12 entries.
# Equals `vflan_no_video` with `vqa_docvqa_train` removed.
vflan_no_video_no_docvqa:
    - captioning_image-paragraph-captioning_train
    - captioning_textcap_train
    - generation_visual-dialog_train
    - reasoning_clevr_train
    - reasoning_nlvr_train
    - reasoning_visual-mrc_train
    - vqa_gqa_train
    - vqa_ivqa_train
    - vqa_ocr-vqa_train
    - vqa_st-vqa_train
    - vqa_viquae_train
    - vqa_vqa-v2_train

# Mixture `vila-v1.5-sft`: 19 bare entries, listed in alphabetical order.
# NOTE(review): includes `vflan`, which is also a top-level key in this
# file; presumably the consumer expands it as a nested mixture - confirm.
vila-v1.5-sft:
    - ai2d_train_12k
    - chartqa_train_18k
    - docvqa_train_10k
    - dvqa_train_200k
    - geoqa
    - llava_instruct
    - math
    - scienceqa
    - sharegpt4v_gpt4_100k
    - sharegpt4v_sft
    - sharegpt_video
    - sherlock
    - shot2story_shotonly
    - synthdog_en
    - vatex
    - vflan
    - video_chatgpt
    - wit_subset
    - youcook2
