# Task identifier for this run.
# NOTE(review): presumably also the value substituted for `{task}` in
# swanlab_conf.run_name_template — confirm against the consuming code.
task: sft

# Dataset and data-loading settings.
dataset_conf:
  # NOTE(review): the unit is not stated in this file — presumably seconds of
  # audio per sample; confirm against the data loader.
  max_len: 5
  # Presumably the audio sample rate in Hz — confirm.
  sample_rate: 44100
  batch_size: 1
  num_workers: 20
  # Presumably upper bounds on how many samples are used from each file —
  # confirm whether they truncate or randomly subsample.
  max_train_samples: 50000
  max_eval_samples: 5000
  # Bare file names; the directory they are resolved against is not specified
  # in this file.
  train_file: "sft_data.jsonl"
  eval_file: "test_86k.jsonl"

# Encoder training strategy.
# NOTE(review): "lora" presumably selects LoRA adapter fine-tuning; the set of
# accepted values is defined by the consuming code — confirm.
encoder_conf:
  encoder_strategy: "lora"

# Decoder training strategy.
# NOTE(review): "lora" presumably selects LoRA adapter fine-tuning; the set of
# accepted values is defined by the consuming code — confirm.
decoder_conf:
  decoder_strategy: "lora"

# Optimizer settings.
optim_args:
  # Keep the explicit !!float tags: YAML 1.1 loaders such as PyYAML resolve a
  # bare `5e-5` (no decimal point) as a string rather than a float.
  lr: !!float 5e-5
  # NOTE(review): presumably an optimizer identifier understood by the
  # trainer — confirm the accepted names.
  name: "adamw_torch"
  weight_decay: !!float 1e-6

# Top-level training-loop settings.
epochs: 50
# NOTE(review): "radio" looks like a typo for "ratio" (warmup fraction). The
# key is left unchanged because the consuming code presumably looks it up by
# this exact name — confirm before renaming.
warmup_radio: 0.1
# Presumably the number of gradient-accumulation steps — confirm.
acc_grad: 4
# Presumably the gradient-clipping threshold — confirm whether it is a norm
# or a value clip.
clip_grad: 1

# NOTE(review): 0.0 presumably means teacher forcing is never applied —
# confirm how the trainer interprets this ratio.
teacher_forcing_ratio: 0.0

# SwanLab logging settings.
swanlab_conf:
  enabled: true
  project: "LALM_sft2"
  # Use placeholders to define a dynamic run_name template.
  # The value must stay quoted: an unquoted leading `{` would be parsed as a
  # YAML flow mapping instead of a string.
  run_name_template: "{model_name}-{task}-{timestamp}"