# optimization config
gpu: "3"
batch_size: 2
epoch_num: 1000
encoder_lr: !!float 0.0
head_lr: !!float 0.0
main_lr: !!float 0.002

lr_schedule: plateau
mode: min
patience: 50
factor: 0.5
min_lr: !!float 1e-6

save_epoch: 50
optimizer: Adam

# =========== encoder ==========
# load_encoder: "PATH/TO/TRAINED/ENCODER/encoder_<ID>.pt"
load_encoder: ""

# ========= encoder head =========
# load_encoder_head: "PATH/TO/TRAINED/ENCODER/encoder_head_<ID>.pt"
load_encoder_head: ""
layer_num: 2
out_dim: 0

# ============ fusion method =============

# ----------- tfgridnet as kv fusion ------------
fusion_name: "tfgridnet_kv"
pooling_size: 40
fusion_stride: 40

# # ----------- film fusion ------------
# fusion_name: "tfgridnet_kv"

# ========= main branch =========

# --------- causal -----------
model_name: tfgridnet_causal
n_fft: 128
stride: 64
lstm_hidden_units: 64
emb_dim: 64
emb_ks: 1
n_layers: 3
model_normalize: True
fusion_layer: [0, 1]

# # --------- film fusion -----------
# model_name: tfgridnet_film_causal
# n_fft: 128
# stride: 64
# lstm_hidden_units: 64
# emb_dim: 64
# emb_ks: 1
# n_layers: 3
# model_normalize: False
# fusion_layer: [0, 1]

# # --------- tce -----------
# model_name: tce
# load_encoder_head: ""
# fusion_name: ""

# ===================================================

load_model: ""

# librispeech dataset
train_dataset_dir: "data/LibriSpeech/LibriSpeech/_train_data"
val_dataset_dir: "data/LibriSpeech/LibriSpeech/_val_data"

# # wsj0 dataset
# train_dataset_dir: "data/2/wsj0"
# val_dataset_dir: "data/2/wsj0"

sample_rate: 16000 
wave_length: 48000
pos_example_length: 48000
neg_example_length: 48000
dvec_rate: 50
return_clean_dvec: False
snr_db_range: [-2.5, 2.5]
source_num: 3
min_source_num: 3
active_num: [-1, 1, -1]
reproducable: False
normalize: False
perturb_speeds: 
filling_pattern: repeat
reverb: none
brir_dir: []
binaural: False
zero_degree_pos: False
concat_pos: False
reverb_cond: False
zero_in_tgt: False
noise_dir: "data/wham_noise/"
clean_pos: False
special_spk: ["Partial_Pos", "Partial_Neg"]
partial_range: [0.33, 0.66]
neg_partial_range: [1.0, 1.0]
tgt_snr: -1000000000 # no scaling on tgt intensity in enrollment
same_disturb: False
loss_type: "snr"

SNR_Weight: 10.0
Embedding_Weight: 0.0
