# Evaluation driver: launches the *_CoT.sh benchmark scripts found under
# scripts/evaluation_sft/ for a single checkpoint.
# Replace YOUR_ROOT_PATH with the local root directory before running.

# Print the start time (the time is printed again at the end of the script).
date

# Every benchmark script is invoked by a path relative to this directory, so
# stop here if it cannot be entered instead of running all the commands from
# the wrong working directory.
cd "YOUR_ROOT_PATH/MLLM" || {
  printf 'error: cannot cd to %s\n' "YOUR_ROOT_PATH/MLLM" >&2
  exit 1
}

# Checkpoint to evaluate. Exported so that it is placed in the environment of
# the child bash processes started by this script (presumably read by the
# evaluation scripts -- confirm there).
export CHECKPOINT_PATH="YOUR_ROOT_PATH/model/checkpoint/MLLM/ablation_vocab_OIv4_factorized_mlp_uni_bi_ls0.1_0.9/last_4145"

# VQA benchmarks
## Single-GPU variants (disabled; kept for reference)
# bash scripts/evaluation_sft/Single_GPU_CoT.sh "GQA_TESTDEV_BALANCED" ""
# bash scripts/evaluation_sft/Single_GPU_CoT.sh "OK-VQA" "--from_hf"
# bash scripts/evaluation_sft/Single_GPU_CoT.sh "VizWiz_VAL" "--from_hf"
# bash scripts/evaluation_sft/Single_GPU_CoT.sh "TextVQA" "--from_hf"

## Multi-GPU variants
# Arguments are: benchmark name, three numbers, and an extra-flags string.
# NOTE(review): the numbers look like a GPU index range (0..7) followed by a
# per-benchmark switch -- confirm against Multi_GPU_CoT.sh.
vqa_runner=scripts/evaluation_sft/Multi_GPU_CoT.sh

# GQA is the only VQA benchmark launched with an empty extra-flags argument.
bash "$vqa_runner" "GQA_TESTDEV_BALANCED" 0 7 0 ""

# These three share the exact same argument list.
for vqa_task in "OK-VQA" "VizWiz_VAL" "TextVQA"; do
  bash "$vqa_runner" "$vqa_task" 0 7 0 "--from_hf"
done

# VQAv2 passes 1 (not 0) as the third number.
bash "$vqa_runner" "VQAv2_VAL" 0 7 1 "--from_hf"

# Misalignment benchmarks (PPL CoT scripts)
## Single-GPU variants (disabled; kept for reference)
# bash scripts/evaluation_sft/Single_GPU_PPL_CoT.sh "MME" ""
# bash scripts/evaluation_sft/Single_GPU_PPL_CoT.sh "HallusionBench" ""
# bash scripts/evaluation_sft/Single_GPU_PPL_CoT.sh "POPE" "--from_hf"
# bash scripts/evaluation_sft/Single_GPU_PPL_CoT.sh "Winoground-YN" "--from_hf"

## Multi-GPU variants
# Only HallusionBench and POPE are enabled; MME and Winoground-YN are
# commented out.
misalign_runner=scripts/evaluation_sft/Multi_GPU_PPL_CoT.sh
# # bash scripts/evaluation_sft/Multi_GPU_PPL_CoT.sh "MME" 0 7 0 ""
bash "$misalign_runner" "HallusionBench" 0 7 0 ""
bash "$misalign_runner" "POPE" 0 7 0 "--from_hf"
# # bash scripts/evaluation_sft/Multi_GPU_PPL_CoT.sh "Winoground-YN" 0 7 0 "--from_hf"

# MC benchmarks (PPL CoT scripts)
## Single-GPU variants (disabled; kept for reference)
# bash scripts/evaluation_sft/Single_GPU_PPL_CoT.sh "MMBench_DEV_EN" ""
# bash scripts/evaluation_sft/Single_GPU_PPL_CoT.sh "ScienceQA_VAL" ""
# bash scripts/evaluation_sft/Single_GPU_PPL_CoT.sh "ScienceQA_TEST" ""
# bash scripts/evaluation_sft/Single_GPU_PPL_CoT.sh "SEEDBench_IMG" ""

## Multi-GPU variants
# All four benchmarks are launched with the same trailing arguments
# (0 7 0 and an empty extra-flags string), one after another in this order.
for mc_task in "MMBench_DEV_EN" "ScienceQA_VAL" "ScienceQA_TEST" "SEEDBench_IMG"; do
  bash scripts/evaluation_sft/Multi_GPU_PPL_CoT.sh "$mc_task" 0 7 0 ""
done

# MIX benchmarks (MMMU / MathVista)
eval_dir=scripts/evaluation_sft

## Single-GPU variants
# The MMMU merged script is disabled; the MathVista merged script runs.
# NOTE(review): the multi-GPU MathVista runs below are enabled as well --
# confirm that running both the merged script and those runs is intended.
# bash scripts/evaluation_sft/Merged_MMMU_CoT.sh
bash "$eval_dir/Merged_MathVista_CoT.sh"

## Multi-GPU variants
# The multiple-choice split goes through the PPL script and the open-ended
# split through the plain CoT script; the MMMU pair is disabled.
# bash scripts/evaluation_sft/Multi_GPU_PPL_CoT.sh "MMMU_VAL_MultiChoice" 0 7 0 "--from_hf"
# bash scripts/evaluation_sft/Multi_GPU_CoT.sh "MMMU_VAL_OpenEnded" 0 7 0 "--from_hf"
bash "$eval_dir/Multi_GPU_PPL_CoT.sh" "MathVista_MultiChoice" 0 7 0 "--from_hf"
bash "$eval_dir/Multi_GPU_CoT.sh" "MathVista_OpenEnded" 0 7 0 "--from_hf"

# Print the finish time.
date