# Config composition list. The `_self_` entry suggests this file is loaded
# through Hydra (TODO confirm). Under Hydra's rules entries are merged in
# order, so with `_self_` last the values set in this file take precedence
# over those coming from `qwen3_4B_lora128`.
defaults:
  - qwen3_4B_lora128
  - _self_

# Training settings defined by this file.
training:
  # Presumably the number of samples per device per step (name matches the
  # Hugging Face `TrainingArguments` field) -- verify against the consumer.
  per_device_train_batch_size: 8
  # Presumably 1 means no gradient accumulation -- verify against the consumer.
  gradient_accumulation_steps: 1
  # Written with an explicit decimal point on purpose: YAML 1.1 loaders
  # (e.g. PyYAML `safe_load`) resolve a bare `2e-5` as the string "2e-5",
  # whereas `2.0e-5` is a float under both YAML 1.1 and YAML 1.2.
  learning_rate: 2.0e-5

# Inference settings defined by this file.
inference:
  # Placeholder value -- replace with the real checkpoint directory before
  # running. NOTE(review): the name suggests a checkpoint with adapter
  # weights already merged into the base model -- confirm.
  model_path: /path/to/checkpoint-merged/
  # Presumably the upper bound on tokens generated per request -- verify
  # against the consumer.
  max_new_tokens: 32768