 # Copyright (c) 2022, salesforce.com, inc.
 # All rights reserved.
 # SPDX-License-Identifier: BSD-3-Clause
 # For full license text, see the LICENSE file in the repo root or https://opensource.org/licenses/BSD-3-Clause

# Overall Accuracy is: 63.13
# Per Answer Type Accuracy is the following:
# other : 52.90
# yes/no : 84.28
# number : 41.01

model:
  arch: mini_gpt4
  model_type: pretrain_vicuna0
  end_sym: "###"
  max_txt_len: 200
  ckpt: '.cache/hub/models--minigpt4--vicuna-7b/pretrained_minigpt4_vicuna_7b.pth'
  use_grad_checkpoint: False
  # prompt_template: "Based on the image, answer the question.\nQuestion: {}"
  answer_refinement_prompt: " Assistant: {}\n###Human: Shorten your answer to the question as much as possible, preferrably only 1 word."
  # answer_refinement_prompt: " Assistant: {}\n###Human: Shorten your answer as much as possible and only keep necessary text, preferrably only 1-2 word(s)."
  # prefix: "### Human: <Img>"
  prompt_template: "### Human: <Img><ImageHere></Img>### Human: Based on the image, answer the question below.\nQuestion: {}"
  process_answer: True
  answer_processor: 'vqa'
  conversation: True

  ext_paraphrase: False
  par_num_beams: 5
  num_paraphrases: 4

  pipeline: True
  reason: True
  paraphrase: False

  perform_selection: True
  selection_criterion: 'Aconf'
  perform_ensembling: False

  verbose: True
  alt_device: 0

datasets:
  coco_vqa: # name of the dataset builder
    type: eval
    vis_processor:
        eval:
          name: "blip2_image_eval"
          image_size: 224
    text_processor:
        eval:
          name: "blip_question"
    build_info:
        images:
            storage: '.cache/lavis/coco/images/'

run:
  task: vqa
  # optimization-specific
  batch_size_train: 16
  batch_size_eval: 4
  num_workers: 4

  # inference-specific
  max_len: 50
  min_len: 1
  num_beams: 5
  inference_method: "generate"
  # prompt: "### Human: Answer this question in one word.\nQuestion: {} ### Assistant: Answer:"
  
  seed: 42
  output_dir: "output/Vicuna7B/VQA"

  evaluate: True
  test_splits: ["val"]

  # distribution-specific
  device: "cuda"
  world_size: 1
  dist_url: "env://"
  distributed: True
