#!/usr/bin/env bash
#
# Evaluation driver: exports CHECKPOINT_PATH and then runs the benchmark
# scripts under scripts/evaluation/ one after another, printing `date`
# before and after so the total wall-clock time can be read from the log.
#
# Usage:
#   Replace YOUR_ROOT_PATH (in the `cd` and in CHECKPOINT_PATH) with the real
#   root directory, then run this file with bash.
#
# Notes:
#   * Commented-out `bash ...` lines are alternative invocations kept as
#     toggles; uncomment the variant you want to run.
#   * `set -e` is intentionally NOT enabled: a failing benchmark does not stop
#     the benchmarks that follow it.
#   * NOTE(review): the meaning of the numeric arguments passed to
#     Multi_GPU*.sh and of the trailing ""/"--from_hf" argument is defined by
#     those scripts, not here -- check them before changing values.

date

# All script paths below are relative to the MLLM directory, so a failed `cd`
# must abort here instead of letting every benchmark run from the wrong place.
cd YOUR_ROOT_PATH/MLLM || {
  printf 'error: cannot cd to %s\n' 'YOUR_ROOT_PATH/MLLM' >&2
  exit 1
}

# Exported so that the child evaluation scripts can see it
# (presumably they read it to locate the checkpoint -- confirm in the scripts).
export CHECKPOINT_PATH="YOUR_ROOT_PATH/model/checkpoint/MLLM/scalability_OI-IC+IC_all_with_JD_then_OI_factorized_mlp/last_4145"
bash scripts/evaluation/Multi_GPU.sh "NoCaps" 0 0 0 "--from_hf"

# Merged model
bash scripts/evaluation/Merged_MME.sh

# Caption
## single GPU
bash scripts/evaluation/Merged_Caption.sh

## multi GPU
# bash scripts/evaluation/Multi_GPU.sh "COCO" 0 0 0 "--from_hf"
# bash scripts/evaluation/Multi_GPU.sh "Flickr30K" 0 0 0 "--from_hf"
# bash scripts/evaluation/Multi_GPU.sh "NoCaps" 0 0 0 "--from_hf"
# bash scripts/evaluation/Multi_GPU.sh "WHOOPS-Caption" 0 0 0 "--from_hf"

# VQA
## single GPU
bash scripts/evaluation/Single_GPU.sh "GQA_TESTDEV_BALANCED" ""
bash scripts/evaluation/Single_GPU.sh "OK-VQA" "--from_hf"
bash scripts/evaluation/Single_GPU.sh "VizWiz_VAL" "--from_hf"
bash scripts/evaluation/Single_GPU.sh "TextVQA" "--from_hf"

## multi GPU
# bash scripts/evaluation/Multi_GPU.sh "GQA_TESTDEV_BALANCED" 0 7 0 ""
# bash scripts/evaluation/Multi_GPU.sh "OK-VQA" 0 7 0 "--from_hf"
# bash scripts/evaluation/Multi_GPU.sh "VizWiz_VAL" 0 7 0 "--from_hf"
# bash scripts/evaluation/Multi_GPU.sh "TextVQA" 0 7 0 "--from_hf"
# VQAv2_VAL is the only VQA benchmark run through Multi_GPU.sh here.
bash scripts/evaluation/Multi_GPU.sh "VQAv2_VAL" 0 7 1 "--from_hf"

# Misalignment
## single GPU
# bash scripts/evaluation/Single_GPU_PPL.sh "MME" ""
bash scripts/evaluation/Single_GPU_PPL.sh "HallusionBench" ""
bash scripts/evaluation/Single_GPU_PPL.sh "POPE" "--from_hf"
# bash scripts/evaluation/Single_GPU_PPL.sh "Winoground-YN" "--from_hf"

## multi GPU
# bash scripts/evaluation/Multi_GPU_PPL.sh "MME" 0 7 0 ""
# bash scripts/evaluation/Multi_GPU_PPL.sh "HallusionBench" 0 7 0 ""
# bash scripts/evaluation/Multi_GPU_PPL.sh "POPE" 0 7 0 "--from_hf"
# bash scripts/evaluation/Multi_GPU_PPL.sh "Winoground-YN" 0 7 0 "--from_hf"

# MC
## single GPU
bash scripts/evaluation/Single_GPU_PPL.sh "MMBench_DEV_EN" ""
bash scripts/evaluation/Single_GPU_PPL.sh "ScienceQA_VAL" ""
bash scripts/evaluation/Single_GPU_PPL.sh "ScienceQA_TEST" ""
bash scripts/evaluation/Single_GPU_PPL.sh "SEEDBench_IMG" ""

## multi GPU
# bash scripts/evaluation/Multi_GPU_PPL.sh "MMBench_DEV_EN" 0 7 0 ""
# bash scripts/evaluation/Multi_GPU_PPL.sh "ScienceQA_VAL" 0 7 0 ""
# bash scripts/evaluation/Multi_GPU_PPL.sh "ScienceQA_TEST" 0 7 0 ""
# bash scripts/evaluation/Multi_GPU_PPL.sh "SEEDBench_IMG" 0 7 0 ""

# MIX
## single GPU
bash scripts/evaluation/Merged_MMMU.sh
bash scripts/evaluation/Merged_MathVista.sh

## multi GPU
# bash scripts/evaluation/Multi_GPU_PPL.sh "MMMU_VAL_MultiChoice" 0 7 0 "--from_hf"
# bash scripts/evaluation/Multi_GPU.sh "MMMU_VAL_OpenEnded" 0 7 0 "--from_hf"
# bash scripts/evaluation/Multi_GPU_PPL.sh "MathVista_MultiChoice" 0 7 0 "--from_hf"
# bash scripts/evaluation/Multi_GPU.sh "MathVista_OpenEnded" 0 7 0 "--from_hf"

date
