# Supervised Finetuning (SFT)
#
# Selects the SFT trainer and dataloader and turns the reference model off.

# Identifier of this configuration. It must agree with the SFT trainer and
# dataloader selected below; a mismatched value (e.g. `ppo`) would mislabel
# the run for any consumer that branches on or logs this name.
# NOTE(review): confirm that the consuming code expects the spelling `sft`.
name: sft

# Trainer class name used for this configuration.
# NOTE(review): presumably resolved by name in the training code - confirm.
trainer: SFTTrainer

# Dataloader class name paired with the trainer above.
dataloader: SFTDataLoader

# No reference model is used by this configuration.
use_reference_model: false
