# Print the start timestamp; paired with the closing `date` call at the end of
# the script so the total run time can be read from the log.
date

# The evaluation scripts are invoked via paths relative to this directory
# (scripts/evaluation_sft/...), so abort instead of continuing from the wrong
# working directory when the cd fails. Replace YOUR_ROOT_PATH before running.
cd "YOUR_ROOT_PATH/MLLM" || exit 1

# Checkpoint to evaluate. Exported so that child processes started by this
# script inherit it (presumably read by the evaluation scripts -- confirm there).
export CHECKPOINT_PATH="YOUR_ROOT_PATH/model/checkpoint/MLLM/fine_tune_OI+IC_then_OI_SFT_OI_IC_256_4e-4_0.05_e1/last_3704"

# # VQA
# ## single GPU
# # bash scripts/evaluation_sft/Single_GPU_TO.sh "GQA_TESTDEV_BALANCED" ""
# # bash scripts/evaluation_sft/Single_GPU_TO.sh "OK-VQA" "--from_hf"
# # bash scripts/evaluation_sft/Single_GPU_TO.sh "VizWiz_VAL" "--from_hf"
# # bash scripts/evaluation_sft/Single_GPU_TO.sh "TextVQA" "--from_hf"

# ## multi GPU
# bash scripts/evaluation_sft/Multi_GPU_TO.sh "GQA_TESTDEV_BALANCED" 0 7 0 ""
# bash scripts/evaluation_sft/Multi_GPU_TO.sh "OK-VQA" 0 7 0 "--from_hf"
# bash scripts/evaluation_sft/Multi_GPU_TO.sh "VizWiz_VAL" 0 7 0 "--from_hf"
# bash scripts/evaluation_sft/Multi_GPU_TO.sh "TextVQA" 0 7 0 "--from_hf"
# bash scripts/evaluation_sft/Multi_GPU_TO.sh "VQAv2_VAL" 0 7 1 "--from_hf"

# # Misalignment
# ## single GPU
# # bash scripts/evaluation_sft/Single_GPU_PPL_TO.sh "MME" ""
# # bash scripts/evaluation_sft/Single_GPU_PPL_TO.sh "HallusionBench" ""
# # bash scripts/evaluation_sft/Single_GPU_PPL_TO.sh "POPE" "--from_hf"
# # bash scripts/evaluation_sft/Single_GPU_PPL_TO.sh "Winoground-YN" "--from_hf"

# ## multi GPU
# # # bash scripts/evaluation_sft/Multi_GPU_PPL_TO.sh "MME" 0 7 0 ""
# bash scripts/evaluation_sft/Multi_GPU_PPL_TO.sh "HallusionBench" 0 7 0 ""
# bash scripts/evaluation_sft/Multi_GPU_PPL_TO.sh "POPE" 0 7 0 "--from_hf"
# # # bash scripts/evaluation_sft/Multi_GPU_PPL_TO.sh "Winoground-YN" 0 7 0 "--from_hf"

# # MC
# ## single GPU
# # bash scripts/evaluation_sft/Single_GPU_PPL_TO.sh "MMBench_DEV_EN" ""
# # bash scripts/evaluation_sft/Single_GPU_PPL_TO.sh "ScienceQA_VAL" ""
# # bash scripts/evaluation_sft/Single_GPU_PPL_TO.sh "ScienceQA_TEST" ""
# # bash scripts/evaluation_sft/Single_GPU_PPL_TO.sh "SEEDBench_IMG" ""

# ## multi GPU
# bash scripts/evaluation_sft/Multi_GPU_PPL_TO.sh "MMBench_DEV_EN" 0 7 0 ""
# bash scripts/evaluation_sft/Multi_GPU_PPL_TO.sh "ScienceQA_VAL" 0 7 0 ""
# bash scripts/evaluation_sft/Multi_GPU_PPL_TO.sh "ScienceQA_TEST" 0 7 0 ""
# bash scripts/evaluation_sft/Multi_GPU_PPL_TO.sh "SEEDBench_IMG" 0 7 0 ""

# # MIX
# ## single GPU
# # bash scripts/evaluation_sft/Merged_MMMU_TO.sh
# # bash scripts/evaluation_sft/Merged_MathVista_TO.sh

# ## multi GPU
# # bash scripts/evaluation_sft/Multi_GPU_PPL_TO.sh "MMMU_VAL_MultiChoice" 0 7 0 "--from_hf"
# # bash scripts/evaluation_sft/Multi_GPU_TO.sh "MMMU_VAL_OpenEnded" 0 7 0 "--from_hf"
# bash scripts/evaluation_sft/Multi_GPU_PPL_TO.sh "MathVista_MultiChoice" 0 7 0 "--from_hf"
# bash scripts/evaluation_sft/Multi_GPU_TO.sh "MathVista_OpenEnded" 0 7 0 "--from_hf"

# Text-only
## single GPU
# bash scripts/evaluation_sft/Single_GPU_PPL_TO.sh "MMLU" "--from_hf"
# bash scripts/evaluation_sft/Single_GPU_PPL_TO.sh "PIQA_VAL" "--from_hf"

## multi GPU
# Currently enabled run: MMLU through the multi-GPU PPL launcher.
# Positional arguments are: benchmark name, three integers, extra flag.
# NOTE(review): the integers look like a GPU index range (0..7) plus a
# mode/offset value -- confirm against Multi_GPU_PPL_TO.sh.
bash scripts/evaluation_sft/Multi_GPU_PPL_TO.sh \
  "MMLU" 0 7 0 "--from_hf"
# bash scripts/evaluation_sft/Multi_GPU_PPL_TO.sh "PIQA_VAL" 0 7 0 "--from_hf"

# Print the end timestamp once the evaluation has returned.
date