model:
  # Model name and model type.
  name: whisper
  type: WhisperAsrModel
  # Selects between a local model and Hugging Face transformers.
  local: true
  # Optional: Hugging Face cache directory.
  cache_dir: null
  config_type: WhisperConfig
  # Path to the model config file (optional for local models).
  config_path: configs/model/medium.json
  # Only save trainable parameters to the checkpoint.
  save_trainable_only: true

tokenizer:
  # Tokenizer name and tokenizer type.
  name: whisper_asr_tokenizer
  type: WhisperTokenizer
  local: true
  # Path to the tokenizer JSON file.
  path: configs/tokenizer/base.json

lora:
  # Toggle for LoRA.
  use_lora: true
  # Path to the LoRA JSON config.
  config: configs/lora/r64_qkvol_all.json

trainer:
  optimizer: adamw
  base_lr: 0.0002
  # Number of epochs that affects how rapidly the learning rate decreases.
  lr_epochs: 3.5
  # Number of steps that affects how rapidly the learning rate decreases.
  # We suggest not changing this.
  lr_batches: 7500
  warmup_batches: 500
  scheduler: eden
  num_epochs: 30
  start_epoch: 1
  start_batch: 0
  # Reference batch duration, used to adjust batch counts when setting the
  # various schedules inside the model.
  ref_duration: 48
  save_every_n: 4000
  keep_last_k: 30
  use_averaged_model: true
  log_interval: 50
  average_period: 200
  reset_interval: 200
  valid_interval: 1000
  use_fp16: true
  ctc_loss_scale: 0.5
  balance_loss_scale: 0
  # Initial batch count, used to bring ScheduledFloat values to their final
  # value when loading. Use it when a pretrained model is provided.
  initial_batch_count: 0
  checkpoint:
    # Pretrained checkpoint to fine-tune from (path to a .pt file).
    pretrained_model: null
  tensorboard: true
  find_unused_parameters: false

data:
  # Paths to the training and validation data configs.
  train_data_config: configs/train_data_config.yaml
  valid_data_config: configs/valid_data_config.yaml
  enable_spec_aug: true
  # NOTE(review): input_strategy is PrecomputedFeatures while
  # on_the_fly_feats (below) is true; confirm this combination is intended.
  input_strategy: PrecomputedFeatures
  # Sampler settings.
  bucketing_sampler: true
  num_buckets: 30
  max_duration: 48
  on_the_fly_feats: true
  shuffle: true
  drop_last: true
  num_workers: 8
  num_filters: 80
  text_normalization: true