# Model definition: which model to build and where to load it from.
model:
  # Model name
  name: zipformer_adam
  # Model type
  type: ZipformerAsrModel
  # Whether to use a local model (true) or Hugging Face transformers (false)
  local: true
  # Required if `local` is true
  local_path: ./exp/my_local_model
  # Optional: Hugging Face cache directory
  cache_dir: null
  config_type: ZipformerConfig
  # Optional for local models
  config_path: ./configs/zipformer_config.json

# Tokenizer definition; uses the same name/type/local keys as the `model`
# section.
tokenizer:
  name: asr_tokenizer
  type: IcefallBbpeTokenizer
  # Canonical lowercase boolean, consistent with `model.local`.
  local: true
  # NOTE(review): presumably the tokenizer model file used when `local` is
  # true -- confirm against the loader.
  path: data/lang_bbpe_2000/bbpe.model

# Training-loop settings: learning rate, loss scales, checkpointing and
# logging.
trainer:
  base_lr: 0.045
  scheduler: "eden"
  # Disabled: number of epochs that affects how rapidly the learning rate
  # decreases.
  # lr_epochs: 3.5
  # Disabled: number of steps that affects how rapidly the learning rate
  # decreases. We suggest not changing this.
  # lr_batches: 7500
  warmup_batches: 500
  num_epochs: 30
  start_epoch: 1
  start_batch: 0
  # Reference batch duration, used to adjust batch counts when setting the
  # various schedules inside the model.
  ref_duration: 600
  # Prune range for the RNN-T loss, i.e. how many symbols (context) are used
  # to compute the loss.
  prune_range: 5
  # Scale for smoothing the loss with the LM (prediction-network output) part.
  lm_scale: 0.25
  # Scale for smoothing the loss with the AM (encoder-network output) part.
  am_scale: 0
  simple_loss_scale: 0.5
  rnnt_warm_step: 2000
  save_every_n: 4
  keep_last_k: 30
  use_averaged_model: true
  log_interval: 50
  average_period: 200
  reset_interval: 200
  valid_interval: 1000
  # use_fp16: True
  ctc_loss_scale: 0.5
  balance_loss_scale: 0
  specialization_loss_scale: 0
  # Initial batch count, used so that ScheduledFloat values are at their final
  # value when the model is loaded. Use it when a pretrained model is provided.
  initial_batch_count: 0
  checkpoint:
    # Pretrained checkpoint to fine-tune from (path to a .pt file).
    pretrained_model: null
  tensorboard: true

# Dataset selection and data-loading options.
data:
  manifest_dir: data/fbank_language_shuffle
  train_sets:
    - aishell
    - librispeech1
    - librispeech2
    - librispeech3
  train_sets_weights: null
  valid_sets:
    - data/test/aishell/cuts_fbank.jsonl.gz
    - data/test/librispeech/test-clean/cuts_fbank.jsonl.gz
  # NOTE(review): meaning is not evident from this file; presumably controls
  # how the `valid_sets` paths are resolved -- confirm against the data loader.
  valid_data_path_prefix: true
  enable_spec_aug: true
  input_strategy: PrecomputedFeatures
  bucketing_sampler: true
  num_buckets: 30
  max_duration: 600
  on_the_fly_feats: false
  text_normalization: true
  shuffle: true
  drop_last: true
  num_workers: 8
# Path to the DeepSpeed JSON configuration file.
# NOTE(review): the file name suggests a ZeRO stage-1 setup -- confirm.
deepspeed_config: ./configs/ds_config_zero1.json