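# Base model configurations
# Format: <model_key>: {model_key, gpu_type, gpu_count, model_name, model_family,
#                       [inference_script], prompt_file, response_file, evaluation_file}
# Naming convention used by the entries below:
#   - prompt_file is named after model_family (shared by all models in a family)
#   - response_file and evaluation_file are named after model_key (one per model)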

############################################################
# OpenAI models
############################################################
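# Disabled entry, kept for reference. It uses an older format (no model_key,
# prompt_file, response_file, or evaluation_file).
# gpt-4o-2024-08-06:
#   gpu_type: a100
#   gpu_count: 0  # No GPU needed for API calls
#   model_name: "gpt-4o-2024-08-06"
#   model_family: "gpt"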

# GPT-4o, 2024-11-20 snapshot (API model, no local GPUs requested).
# Uses the `gpt` family prompt file, which gpt-4-turbo-2024-04-09 also uses;
# response and evaluation files are specific to this model_key.
gpt-4o-2024-11-20:
  model_key: gpt-4o-2024-11-20
  gpu_type: a100  # NOTE(review): presumably unused while gpu_count is 0 — confirm
  gpu_count: 0  # No GPU needed for API calls
  model_name: gpt-4o-2024-11-20
  model_family: gpt
  prompt_file: exps/eval_vlms/results/prompts/prompts__dataset_graphics_sz823__gpt.json
  response_file: exps/eval_vlms/results/responses/responses__dataset_graphics_sz823__gpt-4o-2024-11-20.json
  evaluation_file: exps/eval_vlms/results/evaluations/evaluations__dataset_graphics_sz823__gpt-4o-2024-11-20.json

# GPT-4 Turbo, 2024-04-09 snapshot (API model, no local GPUs requested).
# Uses the `gpt` family prompt file, which gpt-4o-2024-11-20 also uses;
# response and evaluation files are specific to this model_key.
gpt-4-turbo-2024-04-09:
  model_key: gpt-4-turbo-2024-04-09
  gpu_type: a100  # NOTE(review): presumably unused while gpu_count is 0 — confirm
  gpu_count: 0  # No GPU needed for API calls
  model_name: gpt-4-turbo-2024-04-09
  model_family: gpt
  prompt_file: exps/eval_vlms/results/prompts/prompts__dataset_graphics_sz823__gpt.json
  response_file: exps/eval_vlms/results/responses/responses__dataset_graphics_sz823__gpt-4-turbo-2024-04-09.json
  evaluation_file: exps/eval_vlms/results/evaluations/evaluations__dataset_graphics_sz823__gpt-4-turbo-2024-04-09.json

############################################################
# Small models (1-3B)
############################################################
# PaliGemma 3B (mix-224 checkpoint); requests a single a100.
# model_name looks like a Hugging Face Hub repo id — confirm against the loader.
paligemma_3b:
  model_key: paligemma_3b
  gpu_type: a100
  gpu_count: 1
  model_name: google/paligemma-3b-mix-224
  model_family: paligemma
  # Prompt file is keyed by model_family; response/evaluation files by model_key.
  prompt_file: exps/eval_vlms/results/prompts/prompts__dataset_graphics_sz823__paligemma.json
  response_file: exps/eval_vlms/results/responses/responses__dataset_graphics_sz823__paligemma_3b.json
  evaluation_file: exps/eval_vlms/results/evaluations/evaluations__dataset_graphics_sz823__paligemma_3b.json

# Phi-3 Vision (128k-context instruct checkpoint); requests a single a100.
# model_name looks like a Hugging Face Hub repo id — confirm against the loader.
phi3v_3b:
  model_key: phi3v_3b
  gpu_type: a100
  gpu_count: 1
  model_name: microsoft/Phi-3-vision-128k-instruct
  model_family: phi3v
  # Prompt file is keyed by model_family; response/evaluation files by model_key.
  prompt_file: exps/eval_vlms/results/prompts/prompts__dataset_graphics_sz823__phi3v.json
  response_file: exps/eval_vlms/results/responses/responses__dataset_graphics_sz823__phi3v_3b.json
  evaluation_file: exps/eval_vlms/results/evaluations/evaluations__dataset_graphics_sz823__phi3v_3b.json

############################################################
# Medium models (7-25B)
############################################################

# LLaVA-OneVision 7B chat checkpoint; requests 2 a100s.
# Uses the `llavaov_chat` family prompt file, which llavaov_72b_chat also uses.
llavaov_7b_chat:
  model_key: llavaov_7b_chat
  gpu_type: a100
  gpu_count: 2
  model_name: llava-hf/llava-onevision-qwen2-7b-ov-chat-hf
  model_family: llavaov_chat
  prompt_file: exps/eval_vlms/results/prompts/prompts__dataset_graphics_sz823__llavaov_chat.json
  response_file: exps/eval_vlms/results/responses/responses__dataset_graphics_sz823__llavaov_7b_chat.json
  evaluation_file: exps/eval_vlms/results/evaluations/evaluations__dataset_graphics_sz823__llavaov_7b_chat.json

# Molmo 7B-D (0924 release); requests 2 a100s.
# Uses the `molmo` family prompt file, which molmo_72b also uses.
molmo_7b:
  model_key: molmo_7b
  gpu_type: a100
  gpu_count: 2
  model_name: allenai/Molmo-7B-D-0924
  model_family: molmo
  prompt_file: exps/eval_vlms/results/prompts/prompts__dataset_graphics_sz823__molmo.json
  response_file: exps/eval_vlms/results/responses/responses__dataset_graphics_sz823__molmo_7b.json
  evaluation_file: exps/eval_vlms/results/evaluations/evaluations__dataset_graphics_sz823__molmo_7b.json

# Qwen2-VL 7B Instruct; requests 2 a100s.
# Uses the `qwen2vl_instruct` family prompt file, which qwen2vl_72b_instruct
# and qwenqvq_preview_72b also use.
qwen2vl_7b_instruct:
  model_key: qwen2vl_7b_instruct
  gpu_type: a100
  gpu_count: 2
  model_name: Qwen/Qwen2-VL-7B-Instruct
  model_family: qwen2vl_instruct
  prompt_file: exps/eval_vlms/results/prompts/prompts__dataset_graphics_sz823__qwen2vl_instruct.json
  response_file: exps/eval_vlms/results/responses/responses__dataset_graphics_sz823__qwen2vl_7b_instruct.json
  evaluation_file: exps/eval_vlms/results/evaluations/evaluations__dataset_graphics_sz823__qwen2vl_7b_instruct.json

# InternVL2 8B; requests 2 a100s.
# Uses the `internvl2` family prompt file, which internvl2_76b also uses.
internvl2_8b:
  model_key: internvl2_8b
  gpu_type: a100
  gpu_count: 2
  model_name: OpenGVLab/InternVL2-8B
  model_family: internvl2
  prompt_file: exps/eval_vlms/results/prompts/prompts__dataset_graphics_sz823__internvl2.json
  response_file: exps/eval_vlms/results/responses/responses__dataset_graphics_sz823__internvl2_8b.json
  evaluation_file: exps/eval_vlms/results/evaluations/evaluations__dataset_graphics_sz823__internvl2_8b.json

# GLM-4V 9B; requests 2 a100s.
glm4v_9b:
  model_key: glm4v_9b
  gpu_type: a100
  gpu_count: 2
  model_name: THUDM/glm-4v-9b
  model_family: glm4v
  # Explicit inference entry point. Most other entries omit this key.
  # NOTE(review): presumably they fall back to a default script — confirm in the launcher.
  inference_script: exps/eval_vlms/build_responses_vlms.py
  prompt_file: exps/eval_vlms/results/prompts/prompts__dataset_graphics_sz823__glm4v.json
  response_file: exps/eval_vlms/results/responses/responses__dataset_graphics_sz823__glm4v_9b.json
  evaluation_file: exps/eval_vlms/results/evaluations/evaluations__dataset_graphics_sz823__glm4v_9b.json

# Pixtral 12B from the mistralai checkpoint; requests 2 a100s.
# Uses the `pixtral` family prompt file, which pixtral_124b also uses.
# Distinct from pixtralhf_12b, which has its own family and prompt file.
pixtral_12b:
  model_key: pixtral_12b
  gpu_type: a100
  gpu_count: 2
  model_name: mistralai/Pixtral-12B-2409
  model_family: pixtral
  prompt_file: exps/eval_vlms/results/prompts/prompts__dataset_graphics_sz823__pixtral.json
  response_file: exps/eval_vlms/results/responses/responses__dataset_graphics_sz823__pixtral_12b.json
  evaluation_file: exps/eval_vlms/results/evaluations/evaluations__dataset_graphics_sz823__pixtral_12b.json

# Pixtral 12B from the mistral-community checkpoint; requests 2 a100s.
# Kept as a separate family (`pixtralhf`) with its own prompt file, unlike
# pixtral_12b, which uses the mistralai checkpoint and the `pixtral` family.
pixtralhf_12b:
  model_key: pixtralhf_12b
  gpu_type: a100
  gpu_count: 2
  model_name: mistral-community/pixtral-12b
  model_family: pixtralhf
  prompt_file: exps/eval_vlms/results/prompts/prompts__dataset_graphics_sz823__pixtralhf.json
  response_file: exps/eval_vlms/results/responses/responses__dataset_graphics_sz823__pixtralhf_12b.json
  evaluation_file: exps/eval_vlms/results/evaluations/evaluations__dataset_graphics_sz823__pixtralhf_12b.json

# DeepSeek-VL2. Here model_key and model_family are the same string, and the
# key carries no size suffix, unlike the neighbouring entries.
deepseek_vl2:
  model_key: deepseek_vl2
  # Requests h100s (4 of them) rather than the a100s used by neighbouring entries.
  # NOTE(review): confirm this entry belongs under the "Medium models" heading.
  gpu_type: h100
  gpu_count: 4
  model_name: deepseek-ai/deepseek-vl2
  model_family: deepseek_vl2
  # Explicit inference entry point; glm4v_9b sets the same script.
  inference_script: exps/eval_vlms/build_responses_vlms.py
  prompt_file: exps/eval_vlms/results/prompts/prompts__dataset_graphics_sz823__deepseek_vl2.json
  response_file: exps/eval_vlms/results/responses/responses__dataset_graphics_sz823__deepseek_vl2.json
  evaluation_file: exps/eval_vlms/results/evaluations/evaluations__dataset_graphics_sz823__deepseek_vl2.json

############################################################
# Large models (>70B)
############################################################
# LLaVA-OneVision 72B chat checkpoint; requests 8 a100s.
# Uses the `llavaov_chat` family prompt file, which llavaov_7b_chat also uses.
llavaov_72b_chat:
  model_key: llavaov_72b_chat
  gpu_type: a100
  gpu_count: 8
  model_name: llava-hf/llava-onevision-qwen2-72b-ov-chat-hf
  model_family: llavaov_chat
  prompt_file: exps/eval_vlms/results/prompts/prompts__dataset_graphics_sz823__llavaov_chat.json
  response_file: exps/eval_vlms/results/responses/responses__dataset_graphics_sz823__llavaov_72b_chat.json
  evaluation_file: exps/eval_vlms/results/evaluations/evaluations__dataset_graphics_sz823__llavaov_72b_chat.json

# Molmo 72B (0924 release); requests 8 a100s.
# Uses the `molmo` family prompt file, which molmo_7b also uses.
molmo_72b:
  model_key: molmo_72b
  gpu_type: a100
  gpu_count: 8
  model_name: allenai/Molmo-72B-0924
  model_family: molmo
  prompt_file: exps/eval_vlms/results/prompts/prompts__dataset_graphics_sz823__molmo.json
  response_file: exps/eval_vlms/results/responses/responses__dataset_graphics_sz823__molmo_72b.json
  evaluation_file: exps/eval_vlms/results/evaluations/evaluations__dataset_graphics_sz823__molmo_72b.json

# NVLM-D 72B; requests 8 a100s.
nvlm_72b:
  model_key: nvlm_72b
  gpu_type: a100
  gpu_count: 8
  model_name: nvidia/NVLM-D-72B
  model_family: nvlm
  # Prompt file is keyed by model_family; response/evaluation files by model_key.
  prompt_file: exps/eval_vlms/results/prompts/prompts__dataset_graphics_sz823__nvlm.json
  response_file: exps/eval_vlms/results/responses/responses__dataset_graphics_sz823__nvlm_72b.json
  evaluation_file: exps/eval_vlms/results/evaluations/evaluations__dataset_graphics_sz823__nvlm_72b.json


# Qwen2-VL 72B Instruct; requests 8 a100s.
# Uses the `qwen2vl_instruct` family prompt file, which qwen2vl_7b_instruct
# and qwenqvq_preview_72b also use.
qwen2vl_72b_instruct:
  model_key: qwen2vl_72b_instruct
  gpu_type: a100
  gpu_count: 8
  model_name: Qwen/Qwen2-VL-72B-Instruct
  model_family: qwen2vl_instruct
  prompt_file: exps/eval_vlms/results/prompts/prompts__dataset_graphics_sz823__qwen2vl_instruct.json
  response_file: exps/eval_vlms/results/responses/responses__dataset_graphics_sz823__qwen2vl_72b_instruct.json
  evaluation_file: exps/eval_vlms/results/evaluations/evaluations__dataset_graphics_sz823__qwen2vl_72b_instruct.json

# InternVL2 76B (Llama3-based checkpoint, per the model id); requests 8 a100s.
# Uses the `internvl2` family prompt file, which internvl2_8b also uses.
internvl2_76b:
  model_key: internvl2_76b
  gpu_type: a100
  gpu_count: 8
  model_name: OpenGVLab/InternVL2-Llama3-76B
  model_family: internvl2
  prompt_file: exps/eval_vlms/results/prompts/prompts__dataset_graphics_sz823__internvl2.json
  response_file: exps/eval_vlms/results/responses/responses__dataset_graphics_sz823__internvl2_76b.json
  evaluation_file: exps/eval_vlms/results/evaluations/evaluations__dataset_graphics_sz823__internvl2_76b.json

# Pixtral Large Instruct (2411 release); requests 8 a100s.
# Uses the `pixtral` family prompt file, which pixtral_12b also uses.
pixtral_124b:
  model_key: pixtral_124b
  gpu_type: a100
  gpu_count: 8
  model_name: mistralai/Pixtral-Large-Instruct-2411
  model_family: pixtral
  prompt_file: exps/eval_vlms/results/prompts/prompts__dataset_graphics_sz823__pixtral.json
  response_file: exps/eval_vlms/results/responses/responses__dataset_graphics_sz823__pixtral_124b.json
  evaluation_file: exps/eval_vlms/results/evaluations/evaluations__dataset_graphics_sz823__pixtral_124b.json


# Qwen QVQ-72B-Preview; requests 8 a100s.
qwenqvq_preview_72b:
  model_key: qwenqvq_preview_72b
  gpu_type: a100
  gpu_count: 8
  model_name: Qwen/QVQ-72B-Preview
  # Treated as part of the `qwen2vl_instruct` family, so it uses the same prompt
  # file as qwen2vl_7b_instruct and qwen2vl_72b_instruct.
  model_family: qwen2vl_instruct
  prompt_file: exps/eval_vlms/results/prompts/prompts__dataset_graphics_sz823__qwen2vl_instruct.json
  response_file: exps/eval_vlms/results/responses/responses__dataset_graphics_sz823__qwenqvq_preview_72b.json
  evaluation_file: exps/eval_vlms/results/evaluations/evaluations__dataset_graphics_sz823__qwenqvq_preview_72b.json

