
"""The Direct Preference Optimization (DPO) algorithm."""

from safe_rlhf.algorithms.dpo.trainer import DPOTrainer


# Names exported by a star-import of this package: only the trainer class
# imported above is part of the declared public API.
__all__ = ['DPOTrainer']
