# @package __global__

# Hydra defaults list: the `encodec/default` config is composed together with
# the keys declared in this file.
defaults:
  - encodec/default

# Identifier of the compression model described by this config
# (presumably used elsewhere to select the model builder — TODO confirm).
compression_model: speechtokenizer_hier6

# Additional key for the `encodec` section (its remaining keys presumably come
# from `encodec/default` in the defaults list — TODO confirm).
encodec:
  # Interpolated from `semantic_model.dim`, which is not defined in this file.
  semantic_dim: ${semantic_model.dim}

# Top-level options of the `encodec_hier` section.
encodec_hier:
  # These two names match the top-level `seanets` and `rvqs` sections
  # of this file.
  autoencoder: seanets
  quantizer: rvqs
  # Both values are interpolated from top-level keys that are not defined
  # in this file.
  sample_rate: ${sample_rate}
  channels: ${channels}
  causal: false
  renormalize: false
  # Four entries, the same length as `rvqs.n_q` and `seanets.ratios`
  # (presumably one per hierarchy level — TODO confirm).
  target_n_qs:
    - 1
    - 2
    - 2
    - 3

# Values for the `seanet` section.
# NOTE(review): `encodec_hier.autoencoder` names `seanets`, not `seanet`;
# confirm whether this section is still consumed by this model.
seanet:
  # The default ratios are [8, 5, 4, 2].
  ratios: [10, 5, 5, 2]
  n_filters: 64
  bilstm: true

# Values for the `rvq` section.
# NOTE(review): `encodec_hier.quantizer` names `rvqs`, not `rvq`;
# confirm whether this section is still consumed by this model.
rvq:
  # Same value as `rvqs.bins`.
  bins: 1024
  # A single integer here, whereas `rvqs.n_q` is a four-entry list.
  n_q: 8
  q_dropout: false

# Section whose name matches `encodec_hier.autoencoder`.
seanets:
  dimension: 128
  channels: 128
  # Follows the `causal` flag set in `encodec_hier`.
  causal: ${encodec_hier.causal}
  n_filters: 256
  n_residual_layers: 1
  # Four groups, the last one empty (presumably one group per hierarchy
  # level — TODO confirm against the model code).
  ratios:
    - [6, 1]
    - [3, 1]
    - [2, 1]
    - []
  activation: ELU
  activation_params:
    alpha: 1.0
  norm: weight_norm
  norm_params: {}
  kernel_size: 7
  residual_kernel_size: 3
  last_kernel_size: 7
  dilation_base: 2
  pad_mode: constant
  true_skip: true
  compress: 2
  lstm: 2
  bilstm: true
  disable_norm_outer_blocks: 0
  # Encoder-only and decoder-only parameters.
  # Any parameter can also be overridden for just the encoder or just the
  # decoder with Hydra's `+param=` syntax, e.g.
  # `+seanets.decoder.n_filters=64`.
  decoder:
    trim_right_ratio: 1.0
    final_activation: null
    final_activation_params: null
  encoder: {}

# Section whose name matches `encodec_hier.quantizer`.
rvqs:
  # Four entries, the same length as `encodec_hier.target_n_qs` and
  # `seanets.ratios` (presumably one per hierarchy level — TODO confirm).
  n_q:
    - 6
    - 6
    - 4
    - 3
  q_dropout: false
  bins: 1024
  decay: 0.99
  kmeans_init: true
  kmeans_iters: 50
  threshold_ema_dead_code: 2
  orthogonal_reg_weight: 0.0
  orthogonal_reg_active_codes_only: false
