defaults:
  - _self_

mlflow:
  experiment_name: qwen3-4B-car4cast
  tracking_uri: file:/path/to/mlruns
  project: ft_car4cast

model:
  model_name: unsloth/Qwen3-4B-unsloth-bnb-4bit
  # model_name: unsloth/Qwen3-4B
  max_seq_length: 40096
  load_in_4bit: true
  # load_in_4bit: false
  load_in_8bit: false
  full_finetuning: false

peft:
  target_modules: ["q_proj", "k_proj", "v_proj", "o_proj", "gate_proj", "up_proj", "down_proj"]
  lora_dropout: 0
  bias: "none"
  use_gradient_checkpointing: "unsloth"
  use_rslora: false
  loftq_config: null

trainer:
  eval_strategy: epoch
  save_strategy: epoch
  save_steps: null
  output_dir: /path/to/checkpoints

training:
  dataset_text_field: text
  per_device_train_batch_size: 2
  gradient_accumulation_steps: 8
  warmup_ratio: 0.03
  num_train_epochs: 3
  max_steps: -1
  learning_rate: 4e-5
  logging_steps: 10
  optim: adamw_8bit
  weight_decay: 0.1
  lr_scheduler_type: cosine

inference:
  batch_size: 1
  max_new_tokens: 32768
  temperature: 0.7
  top_p: 0.8
  top_k: 20
  model_path: unsloth/Qwen3-4B-unsloth-bnb-4bit
  data_path: /path/to/test.jsonl
  out_dir: /your/out/dir