 # Copyright (c) 2022, salesforce.com, inc.
 # All rights reserved.
 # SPDX-License-Identifier: BSD-3-Clause
 # For full license text, see the LICENSE file in the repo root or https://opensource.org/licenses/BSD-3-Clause

model:
  arch: flex_m3
  model_type: pretrain_flant5xl
  vit_precision: fp32
  load_finetuned: True
  finetuned: ''
  use_grad_checkpoint: False
  freeze_vit: True
  frame_num: 4
  answer_num: 5
  task: train_discriminator
  downstream_task: oeqa
  modulars: rgb
  lora_rank: 64
  lora_dropout: 0.1
  lora_ckpt: ''

datasets:
  nextqa: # name of the dataset builder
    vis_processor:
        train:
          name: "blip2_frames_train"
          n_frms: 4
          image_size: 224
        eval:
          name: "blip_frames_eval"
          n_frms: 4
          image_size: 224

    text_processor:
        train:
          name: "blip_question"
          max_words: 50
        eval:
          name: "blip_question"
          max_words: 50
    build_info:
        annotations:
          train:
            url: 
              - /home/workspace/flex/nextqa/nextqa_annotation/train.json
            storage: 
              - /home/workspace/flex/nextqa/nextqa_annotation/train.json
          test:
            url: 
              - /home/workspace/flex/nextqa/nextqa_annotation/val.json
            storage: 
              - /home/workspace/flex/nextqa/nextqa_annotation/val.json
          val:
            url: 
              - /home/workspace/flex/nextqa/nextqa_annotation/val.json
            storage: 
              - /home/workspace/flex/nextqa/nextqa_annotation/val.json
        videos:
          storage: /home/workspace/flex/nextqa/nextqa/
        # other modalities data storage is based on videos, see rgbd_vqa_datasets.py

run:
  task: videoqa
  # optimizer
  lr_sched: "linear_warmup_cosine_lr"
  init_lr: 5e-5
  min_lr: 0
  warmup_lr: 1e-8
  warmup_steps: 500
  weight_decay: 0.05
  max_epoch: 5
  batch_size_train: 16
  batch_size_eval: 8
  num_workers: 8
  accum_grad_iters: 1

  max_len: 30
  min_len: 8
  num_beams: 5

  seed: 42
  output_dir: "/result/BLIP2/NextQA/QA/"

  amp: True
  resume_ckpt_path: null

  evaluate: False
  train_splits: ["train"]
  valid_splits: ["val"]
  test_splits: ["val"]

  device: "cuda"
  world_size: 1
  dist_url: "env://"
  distributed: True
  find_unused_parameters: True