
# DPO pipeline driver: defines a few configuration values, then runs the three
# src.dpo stages in a fixed order.

# NOTE(review): the three variables below are plain (unexported) shell
# variables, and nothing in this visible section passes them to the Python
# modules. If the modules are expected to read them from the environment they
# need `export` (or must be passed as arguments) — confirm against the modules
# before changing, since exporting would alter what the child processes see.
SFT_DATASET="bird_train_full_qwen"

LABELED_FILE="data/labeled/bird_train_pipeline_label.jsonl"

SFT_CONFIG="sft_config"

# Run the stages as a single && chain: each stage starts only if the previous
# one exited with status 0, and the chain's exit status is that of the first
# failing stage (or of the last stage when all succeed). This prevents a later
# stage from running after an earlier one has failed.
# An && chain is used instead of `set -e` so that sourcing this file does not
# change the caller's shell options.
python -m src.dpo.prepare_dpo_data \
  && python -m src.dpo.generate_dpo_pairs \
  && python -m src.dpo.qwen_dpo_train