# Copyright (2024) Tsinghua University, Bytedance Ltd. and/or its affiliates
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

model:
  # paths
  llama_path: "./checkpoints/vicuna-13b-v1.1"
  whisper_path: "./checkpoints/whisper-large-v2"
  beats_path: "./checkpoints/beats/BEATs_iter3_plus_AS2M_finetuned_on_AS2M_cpt2.pt"

  # "checkpoints/ckpt_salmonn/salmonn_v1.pth" # model used for decoding" # if not "", load model from ckpt for training or evaluation
  ckpt: "./checkpoints/checkpoint_best.pth"

  freeze_whisper: False
  freeze_beats: False

  # window-level Q-Former
  use_speech_Qformer: True
  freeze_speech_QFormer: False
  window_level_Qformer: True
  num_speech_query_token: 1
  second_per_window: 0.333333
  second_stride: 0.333333

  speech_llama_proj_model: ""
  freeze_speech_llama_proj: False

  # LoRA
  lora: True
  lora_rank: 8
  lora_alpha: 32
  lora_dropout: 0.1

  multi_prompt: True
  prompt_template: "USER: {}\nASSISTANT:"
  prompt_path: "prompts/train_prompt.json"
  test_prompt_path: "prompts/test_prompt.json"
  max_txt_len: 300
  end_sym: "</s>"

datasets:
  train_ann_path: ./data/train.json
  valid_ann_path: ./data/val.json
  test_ann_path: ./data/test.json

  whisper_path: "./checkpoints/whisper-large-v2"

run:
  # log & settings
  seed: 42
  output_dir: "./"
  output_folder: "output"
  evaluate: False # if True, only evaluate model on test data

  log_freq: 5
  epoch_based: True
  iters_per_epoch: 3000
  accum_grad_iters: 2
  batch_size_train: 2
  batch_size_eval: 2
  num_workers: 2

  device: "cuda"
  use_distributed: True
  amp: True
  world_size: 1
  dist_url: "env://"

  # optimizer & scheduler
  optims:
    max_epoch: 30
    warmup_steps: 3000
    warmup_start_lr: 1e-6
    init_lr: 3e-5
    min_lr: 1e-5
    weight_decay: 0.05
    beta2: 0.999
