#!/usr/bin/env bash
# Runs the SFT evaluation scripts under scripts/evaluation_sft/ against a
# single checkpoint. Replace every YOUR_ROOT_PATH placeholder before running.

# Print the start time; the `date` at the end of the script prints the finish
# time.
date

# Every evaluation script below is invoked by a path relative to this
# directory, so abort instead of running them from the wrong location.
cd YOUR_ROOT_PATH/MLLM || {
  printf 'error: cannot cd to %s\n' "YOUR_ROOT_PATH/MLLM" >&2
  exit 1
}

# Exported so that the child `bash scripts/...` processes inherit it
# (presumably they read the checkpoint location from it -- confirm in those
# scripts).
export CHECKPOINT_PATH="YOUR_ROOT_PATH/model/checkpoint/MLLM/fine_tune_OI+IC_then_OI_SFT_OI_IC_128_1e-4_0.05_e1/last_7408"

# Merged model (MME), then Caption on a single GPU.
# Both are argument-less wrapper scripts, run one after the other.
for merged_eval in Merged_MME Merged_Caption; do
  bash "scripts/evaluation_sft/${merged_eval}.sh"
done

# Caption, multi GPU (disabled; uncomment the loop to run these datasets
# through Multi_GPU.sh).
# for caption_set in "COCO" "Flickr30K" "NoCaps" "WHOOPS-Caption"; do
#   bash scripts/evaluation_sft/Multi_GPU.sh "$caption_set" 0 1 0 "--from_hf"
# done

# VQA
## single GPU
# GQA is the one VQA benchmark called with an empty second argument; the
# remaining single-GPU benchmarks all pass "--from_hf".
bash scripts/evaluation_sft/Single_GPU.sh "GQA_TESTDEV_BALANCED" ""
for vqa_set in "OK-VQA" "VizWiz_VAL" "TextVQA"; do
  bash scripts/evaluation_sft/Single_GPU.sh "$vqa_set" "--from_hf"
done

## multi GPU
# Disabled multi-GPU variants of the four benchmarks above.
# bash scripts/evaluation_sft/Multi_GPU.sh "GQA_TESTDEV_BALANCED" 0 7 0 ""
# for vqa_set in "OK-VQA" "VizWiz_VAL" "TextVQA"; do
#   bash scripts/evaluation_sft/Multi_GPU.sh "$vqa_set" 0 7 0 "--from_hf"
# done
# VQAv2_VAL is the only benchmark in this section that is run through
# Multi_GPU.sh.
bash scripts/evaluation_sft/Multi_GPU.sh "VQAv2_VAL" 0 7 1 "--from_hf"

# Misalignment
## single GPU
# Shared runner for the enabled benchmarks in this section. The variable is
# not exported, so it is not passed on to the child scripts.
misalign_runner=scripts/evaluation_sft/Single_GPU_PPL.sh

# MME and Winoground-YN are currently disabled.
# bash scripts/evaluation_sft/Single_GPU_PPL.sh "MME" ""
bash "$misalign_runner" "HallusionBench" ""
bash "$misalign_runner" "POPE" "--from_hf"
# bash scripts/evaluation_sft/Single_GPU_PPL.sh "Winoground-YN" "--from_hf"

## multi GPU
# Disabled multi-GPU variants of the same benchmarks.
# bash scripts/evaluation_sft/Multi_GPU_PPL.sh "MME" 0 8 0 ""
# bash scripts/evaluation_sft/Multi_GPU_PPL.sh "HallusionBench" 0 8 0 ""
# bash scripts/evaluation_sft/Multi_GPU_PPL.sh "POPE" 0 8 0 "--from_hf"
# bash scripts/evaluation_sft/Multi_GPU_PPL.sh "Winoground-YN" 0 7 0 "--from_hf"

# MC (presumably multiple-choice benchmarks -- confirm)
## single GPU
# All four benchmarks use the same runner with an empty second argument.
for mc_set in "MMBench_DEV_EN" "ScienceQA_VAL" "ScienceQA_TEST" "SEEDBench_IMG"; do
  bash scripts/evaluation_sft/Single_GPU_PPL.sh "$mc_set" ""
done

## multi GPU
# Disabled multi-GPU variant of the loop above.
# for mc_set in "MMBench_DEV_EN" "ScienceQA_VAL" "ScienceQA_TEST" "SEEDBench_IMG"; do
#   bash scripts/evaluation_sft/Multi_GPU_PPL.sh "$mc_set" 0 8 0 ""
# done

# MIX
## single GPU
# MMMU and MathVista each have an argument-less wrapper script.
for mix_eval in Merged_MMMU Merged_MathVista; do
  bash "scripts/evaluation_sft/${mix_eval}.sh"
done

## multi GPU
# Disabled: per-split runs, with the MultiChoice splits going through
# Multi_GPU_PPL.sh and the OpenEnded splits through Multi_GPU.sh.
# bash scripts/evaluation_sft/Multi_GPU_PPL.sh "MMMU_VAL_MultiChoice" 0 8 0 "--from_hf"
# bash scripts/evaluation_sft/Multi_GPU.sh "MMMU_VAL_OpenEnded" 0 7 0 "--from_hf"
# bash scripts/evaluation_sft/Multi_GPU_PPL.sh "MathVista_MultiChoice" 0 8 0 "--from_hf"
# bash scripts/evaluation_sft/Multi_GPU.sh "MathVista_OpenEnded" 0 7 0 "--from_hf"

# Print the finish time.
date
