# Maps each model identifier (written in `org/name` form) to a short label.
# Entries are grouped by model family. Insertion order matters: the order of
# `full_model_list` below is taken directly from the order of these keys
# (dicts preserve insertion order in Python 3.7+).
model_map = {
    # Qwen2.5-VL
    "Qwen/Qwen2.5-VL-3B-Instruct": "Qwen2.5-3B",
    "Qwen/Qwen2.5-VL-7B-Instruct": "Qwen2.5-7B",
    "Qwen/Qwen2.5-VL-32B-Instruct": "Qwen2.5-32B",
    "Qwen/Qwen2.5-VL-72B-Instruct": "Qwen2.5-72B",

    # Llama 3.2 Vision
    "meta-llama/Llama-3.2-11B-Vision-Instruct": "LLaMA3.2-11B",
    "meta-llama/Llama-3.2-90B-Vision-Instruct-Turbo": "LLaMA3.2-90B",

    # Gemma 3
    "google/gemma-3-1b-it": "Gemma3-1B",
    "google/gemma-3-12b-it": "Gemma3-12B",
    "google/gemma-3-27b-it": "Gemma3-27B",

    # LLaVA 1.6
    "llava-hf/llava-v1.6-vicuna-7b-hf": "LLaVA1.6-7B",
    "llava-hf/llava-v1.6-vicuna-13b-hf": "LLaVA1.6-13B",
    "llava-hf/llava-v1.6-34b-hf": "LLaVA1.6-34B",

    # Other models
    "mistralai/Pixtral-12B-2409": "Pixtral-12B",
    "microsoft/Phi-4-multimodal-instruct": "Phi4-5.6B",
    "Salesforce/xgen-mm-phi3-mini-instruct-interleave-r-v1.5": "BLIP3-4B",
}

# Every model identifier, in the same order as the keys of `model_map`.
# Derived from the map rather than written out a second time, so the two
# cannot drift apart when a model is added, renamed, or removed. This is an
# independent list object: mutating it does not touch `model_map`.
full_model_list = list(model_map)

# Names of the modalities.
modalities = [
    "real",
    "synthetic",
    "triple",
]

# Full question-type names.
questions = [
    "Recognition",
    "Understanding",
    "Grounding",
    "Reasoning",
]

# Two-letter codes, listed in the same order as `questions`
# (presumably index-aligned abbreviations -- confirm against callers).
questions_short = [
    "RC",
    "UN",
    "GR",
    "RS",
]

# Category names: four chart/figure types followed by subject areas,
# ending with the catch-all "Others".
categories = [
    "Bar Chart",
    "Line Graph",
    "Map",
    "Pie Chart",
    "Biology",
    "Chemistry",
    "Computer Science",
    "Mathematics",
    "Physics",
    "Others",
]

