LICENSE
README.md
pyproject.toml
setup.py
vlmeval/__init__.py
vlmeval/config.py
vlmeval/inference.py
vlmeval/inference_mt.py
vlmeval/inference_video.py
vlmeval/tools.py
vlmeval/api/__init__.py
vlmeval/api/bailingmm.py
vlmeval/api/base.py
vlmeval/api/bluelm_v_api.py
vlmeval/api/claude.py
vlmeval/api/cloudwalk.py
vlmeval/api/doubao_vl_api.py
vlmeval/api/gemini.py
vlmeval/api/glm_vision.py
vlmeval/api/gpt.py
vlmeval/api/hf_chat_model.py
vlmeval/api/hunyuan.py
vlmeval/api/jt_vl_chat.py
vlmeval/api/lmdeploy.py
vlmeval/api/mug_u.py
vlmeval/api/qwen_api.py
vlmeval/api/qwen_vl_api.py
vlmeval/api/reka.py
vlmeval/api/sensechat_vision.py
vlmeval/api/siliconflow.py
vlmeval/api/stepai.py
vlmeval/api/taichu.py
vlmeval/api/taiyi.py
vlmeval/dataset/__init__.py
vlmeval/dataset/cgbench.py
vlmeval/dataset/charxiv.py
vlmeval/dataset/cmmmu.py
vlmeval/dataset/creation.py
vlmeval/dataset/dude.py
vlmeval/dataset/dynamath.py
vlmeval/dataset/emma.py
vlmeval/dataset/image_base.py
vlmeval/dataset/image_caption.py
vlmeval/dataset/image_ccocr.py
vlmeval/dataset/image_mcq.py
vlmeval/dataset/image_mt.py
vlmeval/dataset/image_shortqa.py
vlmeval/dataset/image_vqa.py
vlmeval/dataset/image_yorn.py
vlmeval/dataset/longvideobench.py
vlmeval/dataset/megabench.py
vlmeval/dataset/miabench.py
vlmeval/dataset/mlvu.py
vlmeval/dataset/mmalignbench.py
vlmeval/dataset/mmbench_video.py
vlmeval/dataset/mmgenbench.py
vlmeval/dataset/mmifeval.py
vlmeval/dataset/mmlongbench.py
vlmeval/dataset/mmmath.py
vlmeval/dataset/moat.py
vlmeval/dataset/moviechat1k.py
vlmeval/dataset/mvbench.py
vlmeval/dataset/qbench_video.py
vlmeval/dataset/slidevqa.py
vlmeval/dataset/spatial457.py
vlmeval/dataset/tamperbench.py
vlmeval/dataset/tempcompass.py
vlmeval/dataset/text_base.py
vlmeval/dataset/text_mcq.py
vlmeval/dataset/vcr.py
vlmeval/dataset/vdc.py
vlmeval/dataset/video_base.py
vlmeval/dataset/video_concat_dataset.py
vlmeval/dataset/video_dataset_config.py
vlmeval/dataset/video_mmlu.py
vlmeval/dataset/videomme.py
vlmeval/dataset/vl_rewardbench.py
vlmeval/dataset/vlm2bench.py
vlmeval/dataset/wildvision.py
vlmeval/dataset/worldsense.py
vlmeval/dataset/Omnidocbench/__init__.py
vlmeval/dataset/Omnidocbench/data_preprocess.py
vlmeval/dataset/Omnidocbench/metrics.py
vlmeval/dataset/Omnidocbench/omnidocbench.py
vlmeval/dataset/Omnidocbench/utils.py
vlmeval/dataset/utils/__init__.py
vlmeval/dataset/utils/cgbench.py
vlmeval/dataset/utils/crpe.py
vlmeval/dataset/utils/hrbench.py
vlmeval/dataset/utils/judge_util.py
vlmeval/dataset/utils/llavabench.py
vlmeval/dataset/utils/logicvista.py
vlmeval/dataset/utils/longvideobench.py
vlmeval/dataset/utils/mathv.py
vlmeval/dataset/utils/mathverse.py
vlmeval/dataset/utils/mathvista.py
vlmeval/dataset/utils/mlvu.py
vlmeval/dataset/utils/mmbench_video.py
vlmeval/dataset/utils/mmdu.py
vlmeval/dataset/utils/mmniah.py
vlmeval/dataset/utils/mmsci.py
vlmeval/dataset/utils/mmvet.py
vlmeval/dataset/utils/moviechat1k.py
vlmeval/dataset/utils/multiple_choice.py
vlmeval/dataset/utils/mvbench.py
vlmeval/dataset/utils/naturalbench.py
vlmeval/dataset/utils/ocrbench.py
vlmeval/dataset/utils/olympiadbench.py
vlmeval/dataset/utils/physic.py
vlmeval/dataset/utils/physics_eval_utils.py
vlmeval/dataset/utils/qbench_video.py
vlmeval/dataset/utils/qspatial.py
vlmeval/dataset/utils/shortqa.py
vlmeval/dataset/utils/spatial457.py
vlmeval/dataset/utils/tablevqabench.py
vlmeval/dataset/utils/tamperbench.py
vlmeval/dataset/utils/tdbench.py
vlmeval/dataset/utils/tempcompass.py
vlmeval/dataset/utils/vdc.py
vlmeval/dataset/utils/video_mmlu.py
vlmeval/dataset/utils/videomme.py
vlmeval/dataset/utils/visulogic.py
vlmeval/dataset/utils/vlm2bench.py
vlmeval/dataset/utils/vmcbench.py
vlmeval/dataset/utils/vqa_eval.py
vlmeval/dataset/utils/wemath.py
vlmeval/dataset/utils/worldsense.py
vlmeval/dataset/utils/yorn.py
vlmeval/dataset/utils/ccocr_evaluator/__init__.py
vlmeval/dataset/utils/ccocr_evaluator/common.py
vlmeval/dataset/utils/ccocr_evaluator/doc_parsing_evaluator.py
vlmeval/dataset/utils/ccocr_evaluator/kie_evaluator.py
vlmeval/dataset/utils/ccocr_evaluator/ocr_evaluator.py
vlmeval/dataset/utils/megabench/__init__.py
vlmeval/dataset/utils/megabench/aggregation_type.py
vlmeval/dataset/utils/megabench/evaluator.py
vlmeval/dataset/utils/megabench/metric_type.py
vlmeval/dataset/utils/megabench/response_parse_type.py
vlmeval/dataset/utils/megabench/utils.py
vlmeval/dataset/utils/mmif/__init__.py
vlmeval/dataset/utils/mmif/function_and_compare.py
vlmeval/dataset/utils/vgrpbench/__init__.py
vlmeval/dataset/utils/vgrpbench/evaluation.py
vlmeval/dataset/utils/vgrpbench/score.py
vlmeval/smp/__init__.py
vlmeval/smp/file.py
vlmeval/smp/log.py
vlmeval/smp/misc.py
vlmeval/smp/vlm.py
vlmeval/utils/__init__.py
vlmeval/utils/matching_util.py
vlmeval/utils/mp_util.py
vlmeval/utils/result_transfer.py
vlmeval/vlm/__init__.py
vlmeval/vlm/aki.py
vlmeval/vlm/aria.py
vlmeval/vlm/base.py
vlmeval/vlm/bunnyllama3.py
vlmeval/vlm/chameleon.py
vlmeval/vlm/cogvlm.py
vlmeval/vlm/deepseek_vl2.py
vlmeval/vlm/eagle_chat.py
vlmeval/vlm/emu.py
vlmeval/vlm/falcon_vlm.py
vlmeval/vlm/gemma.py
vlmeval/vlm/h2ovl_mississippi.py
vlmeval/vlm/idefics.py
vlmeval/vlm/instructblip.py
vlmeval/vlm/janus.py
vlmeval/vlm/kimi_vl.py
vlmeval/vlm/kosmos.py
vlmeval/vlm/llama4.py
vlmeval/vlm/llama_vision.py
vlmeval/vlm/long_vita.py
vlmeval/vlm/mantis.py
vlmeval/vlm/mgm.py
vlmeval/vlm/minicpm_v.py
vlmeval/vlm/minigpt4.py
vlmeval/vlm/minimonkey.py
vlmeval/vlm/mixsense.py
vlmeval/vlm/mmalaya.py
vlmeval/vlm/molmo.py
vlmeval/vlm/monkey.py
vlmeval/vlm/moondream.py
vlmeval/vlm/mplug_owl2.py
vlmeval/vlm/mplug_owl3.py
vlmeval/vlm/nvlm.py
vlmeval/vlm/omchat.py
vlmeval/vlm/omnilmm.py
vlmeval/vlm/open_flamingo.py
vlmeval/vlm/pandagpt.py
vlmeval/vlm/parrot.py
vlmeval/vlm/phi3_vision.py
vlmeval/vlm/phi4_multimodal.py
vlmeval/vlm/pixtral.py
vlmeval/vlm/points.py
vlmeval/vlm/qh_360vl.py
vlmeval/vlm/qwen_vl.py
vlmeval/vlm/rbdash.py
vlmeval/vlm/ristretto.py
vlmeval/vlm/ross.py
vlmeval/vlm/sail_vl.py
vlmeval/vlm/slime.py
vlmeval/vlm/smolvlm.py
vlmeval/vlm/transcore_m.py
vlmeval/vlm/vila.py
vlmeval/vlm/vintern_chat.py
vlmeval/vlm/visualglm.py
vlmeval/vlm/vita.py
vlmeval/vlm/vlaa_thinker.py
vlmeval/vlm/vlm_r1.py
vlmeval/vlm/vxverse.py
vlmeval/vlm/wemm.py
vlmeval/vlm/xgen_mm.py
vlmeval/vlm/yi_vl.py
vlmeval/vlm/cambrian/__init__.py
vlmeval/vlm/cambrian/cambrian.py
vlmeval/vlm/cambrian/constants.py
vlmeval/vlm/cambrian/conversation.py
vlmeval/vlm/cambrian/mm_utils.py
vlmeval/vlm/cambrian/utils.py
vlmeval/vlm/cambrian/model/__init__.py
vlmeval/vlm/cambrian/model/builder.py
vlmeval/vlm/cambrian/model/cambrian_arch.py
vlmeval/vlm/cambrian/model/consolidate.py
vlmeval/vlm/cambrian/model/vision_sampler.py
vlmeval/vlm/cambrian/model/multimodal_encoder/__init__.py
vlmeval/vlm/cambrian/model/multimodal_encoder/base_encoder.py
vlmeval/vlm/cambrian/model/multimodal_encoder/builder.py
vlmeval/vlm/cambrian/model/multimodal_encoder/clip_convnext_encoder.py
vlmeval/vlm/cambrian/model/multimodal_encoder/clip_encoder.py
vlmeval/vlm/cambrian/model/multimodal_encoder/dfn_clip_encoder.py
vlmeval/vlm/cambrian/model/multimodal_encoder/diffusion_encoder.py
vlmeval/vlm/cambrian/model/multimodal_encoder/dino_encoder.py
vlmeval/vlm/cambrian/model/multimodal_encoder/eva_clip_encoder.py
vlmeval/vlm/cambrian/model/multimodal_encoder/hybrid_encoder.py
vlmeval/vlm/cambrian/model/multimodal_encoder/ijepa_encoder.py
vlmeval/vlm/cambrian/model/multimodal_encoder/load.py
vlmeval/vlm/cambrian/model/multimodal_encoder/mae_encoder.py
vlmeval/vlm/cambrian/model/multimodal_encoder/maws_encoder.py
vlmeval/vlm/cambrian/model/multimodal_encoder/midas_encoder.py
vlmeval/vlm/cambrian/model/multimodal_encoder/moco_encoder.py
vlmeval/vlm/cambrian/model/multimodal_encoder/oai_clip_encoder.py
vlmeval/vlm/cambrian/model/multimodal_encoder/pixart_alpha_encoder.py
vlmeval/vlm/cambrian/model/multimodal_encoder/sam_encoder.py
vlmeval/vlm/cambrian/model/multimodal_encoder/siglip_clip_encoder.py
vlmeval/vlm/cambrian/model/multimodal_encoder/siglip_encoder.py
vlmeval/vlm/cambrian/model/multimodal_encoder/supervised_vit_encoder.py
vlmeval/vlm/cambrian/model/multimodal_encoder/sam/__init__.py
vlmeval/vlm/cambrian/model/multimodal_encoder/sam/common.py
vlmeval/vlm/cambrian/model/multimodal_encoder/sam/encoder.py
vlmeval/vlm/cambrian/model/multimodal_encoder/sam/transforms.py
vlmeval/vlm/cambrian/serve/__init__.py
vlmeval/vlm/cambrian/serve/cli.py
vlmeval/vlm/cambrian/serve/controller.py
vlmeval/vlm/cambrian/serve/gradio_web_server.py
vlmeval/vlm/cambrian/serve/model_worker.py
vlmeval/vlm/cambrian/serve/register_worker.py
vlmeval/vlm/cambrian/serve/sglang_worker.py
vlmeval/vlm/cambrian/serve/test_message.py
vlmeval/vlm/eagle/__init__.py
vlmeval/vlm/eagle/constants.py
vlmeval/vlm/eagle/conversation.py
vlmeval/vlm/eagle/eagle_x.py
vlmeval/vlm/eagle/mm_utils.py
vlmeval/vlm/eagle/save_attention_features.py
vlmeval/vlm/eagle/utils.py
vlmeval/vlm/eagle/utils_visualize_attn.py
vlmeval/vlm/eagle/model/__init__.py
vlmeval/vlm/eagle/model/builder.py
vlmeval/vlm/eagle/model/consolidate.py
vlmeval/vlm/eagle/model/eagle_arch.py
vlmeval/vlm/eagle/model/language_model/__init__.py
vlmeval/vlm/eagle/model/language_model/eagle_llama.py
vlmeval/vlm/eagle/model/multimodal_encoder/__init__.py
vlmeval/vlm/eagle/model/multimodal_encoder/builder.py
vlmeval/vlm/eagle/model/multimodal_encoder/clip_encoder.py
vlmeval/vlm/eagle/model/multimodal_encoder/convnext_encoder.py
vlmeval/vlm/eagle/model/multimodal_encoder/hr_clip_encoder.py
vlmeval/vlm/eagle/model/multimodal_encoder/multi_backbone_channel_concatenation_encoder.py
vlmeval/vlm/eagle/model/multimodal_encoder/pix2struct_encoder.py
vlmeval/vlm/eagle/model/multimodal_encoder/sam_encoder.py
vlmeval/vlm/eagle/model/multimodal_encoder/vision_models/__init__.py
vlmeval/vlm/eagle/model/multimodal_encoder/vision_models/convnext.py
vlmeval/vlm/eagle/model/multimodal_encoder/vision_models/eva_vit.py
vlmeval/vlm/eagle/model/multimodal_projector/__init__.py
vlmeval/vlm/eagle/model/multimodal_projector/builder.py
vlmeval/vlm/eagle2/__init__.py
vlmeval/vlm/eagle2/eagle2_chat.py
vlmeval/vlm/eagle2/utils.py
vlmeval/vlm/internvl/__init__.py
vlmeval/vlm/internvl/internvl_chat.py
vlmeval/vlm/internvl/utils.py
vlmeval/vlm/llava/__init__.py
vlmeval/vlm/llava/llava.py
vlmeval/vlm/llava/llava_xtuner.py
vlmeval/vlm/ola/__init__.py
vlmeval/vlm/ola/ola_model.py
vlmeval/vlm/ovis/__init__.py
vlmeval/vlm/ovis/ovis.py
vlmeval/vlm/ovis/utils/__init__.py
vlmeval/vlm/ovis/utils/mdp3.py
vlmeval/vlm/qwen2_vl/__init__.py
vlmeval/vlm/qwen2_vl/model.py
vlmeval/vlm/qwen2_vl/prompt.py
vlmeval/vlm/ursa/__init__.py
vlmeval/vlm/ursa/ursa_chat.py
vlmeval/vlm/ursa/ursa_model/__init__.py
vlmeval/vlm/ursa/ursa_model/clip_encoder.py
vlmeval/vlm/ursa/ursa_model/configuration_ursa.py
vlmeval/vlm/ursa/ursa_model/image_processing_vlm.py
vlmeval/vlm/ursa/ursa_model/modeling_ursa.py
vlmeval/vlm/ursa/ursa_model/processing_ursa.py
vlmeval/vlm/ursa/ursa_model/projector.py
vlmeval/vlm/ursa/ursa_model/sam.py
vlmeval/vlm/ursa/ursa_model/siglip_vit.py
vlmeval/vlm/valley/__init__.py
vlmeval/vlm/valley/valley_eagle_chat.py
vlmeval/vlm/video_llm/__init__.py
vlmeval/vlm/video_llm/chat_uni_vi.py
vlmeval/vlm/video_llm/llama_vid.py
vlmeval/vlm/video_llm/pllava.py
vlmeval/vlm/video_llm/video_chatgpt.py
vlmeval/vlm/video_llm/video_llava.py
vlmeval/vlm/video_llm/videochat2.py
vlmeval/vlm/xcomposer/__init__.py
vlmeval/vlm/xcomposer/sharecaptioner.py
vlmeval/vlm/xcomposer/xcomposer.py
vlmeval/vlm/xcomposer/xcomposer2.py
vlmeval/vlm/xcomposer/xcomposer2_4KHD.py
vlmeval/vlm/xcomposer/xcomposer2d5.py
vlmevalkit.egg-info/PKG-INFO
vlmevalkit.egg-info/SOURCES.txt
vlmevalkit.egg-info/dependency_links.txt
vlmevalkit.egg-info/requires.txt
vlmevalkit.egg-info/top_level.txt