exp_dir:
hydra:
  run:
    dir: ${exp_dir}/logs/${now:%Y-%m-%d}/${now:%H-%M-%S}  # Force Hydra output (logs, etc.) into your experiment dir

model:
  name: "zipformer-spkveri" # check auto.model_registry.py to see all available models
  id2label_json: "configs/voxceleb2/id2label_voxceleb2.json"
  config_path: # Optional if you have a config.json to load for your model. Otherwise it will use the default value defined by model_type's config dataclass
  config_preset: # 'base', 'large'
  config:

        
trainer:
  optimizer: "scaled_adam"
  base_lr: 0.045
  scheduler: "eden"
  lr_epochs: 3.5 # Number of epochs that affects how rapidly the learning rate decreases.
  lr_batches: 7500 # Number of steps that affects how rapidly the learning rate decreases. We suggest not to change this.
  warmup_batches: 500 # lr warmup steps
  lr_steps_per_epoch: 0 # recommend to adjust this value when you do use_infinite_dataset=True to get exact learning rate schedule as usual. Set it close to your estimated number of steps per epoch
  num_epochs: 40
  start_epoch: 1
  start_batch: 0
  ref_duration: 600 # Reference batch duration for purposes of adjusting batch counts for setting various schedules inside the model
  keep_last_k: 30 # save last_k checkpoints on disk
  use_averaged_model: True
  log_interval: 50
  average_period: 200 # how rapidly the averaged_model is averaged and saved
  reset_interval: 200 # moving average interval for info tracker
  valid_interval: 1000
  save_every_n: 4 # save checkpoint every (n * valid_interval) steps
  use_fp16: False
  initialization:
    checkpoint: ~ # initialized from other pretrained checkpoint (path to a .pt file). We will only use the init_modules
    init_modules: ['encoder_embed', 'encoder'] # these 2 are for audio encoders
  tensorboard: True
  freeze_modules: ~ # name of modules to be frozen during training

data:
  train_data_config: configs/voxceleb2/train_data_config_voxceleb2.yaml
  valid_sets: ['/apdcephfs_cq10/share_1603164/user/mingyuehuo/process_data/voxceleb2_valid_filtered.jsonl.gz']
  valid_data_path_prefix: false
  enable_spec_aug: True
  input_strategy: ~ # PrecomputedFeatures
  enable_musan: False
  musan: /apdcephfs_cq12/share_302080740/data/asr_train_data/manifests/musan/musan_cuts.jsonl.gz # for ASR
  enable_speed_perturb: False
  ge2e_sampler: True
  max_duration: 600
  on_the_fly_feats: True
  shuffle: True
  drop_last: True
  num_workers: 8
  use_infinite_dataset: True
  label_field: "speaker" # supervisions field used as the label 
  speakers_per_batch: 8 # Number of unique speakers per training batch
  utts_per_speaker: 4 # Number of utterances sampled per speaker in each batch
  sample_ratio: 0.1 # Proportion of verification pairs sampled to compute AUC/EER during validation; 
                    # reduces computation when using all pairs is too expensive