# @package _global_
# Experiment config for a small DPO test run on the tiny-mistral model config.
# The defaults list replaces the selected option of the `model` config group
# with `tiny-mistral` and of the `loss` config group with `dpo`.
defaults:
  - override /model: tiny-mistral
  - override /loss: dpo

# Dataset identifiers to use for this run.
# NOTE(review): `hh` is resolved by the consuming code; confirm the name there.
datasets:
  - hh

# Local directories used by the run (presumably for outputs/caches; verify
# against the code that reads `local_dirs`).
local_dirs:
  - test_outputs

# Name identifying this experiment run.
exp_name: test_dpo_tiny_mistral_run

# Trainer implementation to use, referenced by name.
trainer: BasicTrainer

# Overrides applied on top of the selected `dpo` loss config.
loss:
  # Presumably the DPO beta coefficient; confirm against the loss code.
  beta: 0.1

# Evaluation and batching settings, kept small for a quick test run.
sample_during_eval: false
gradient_accumulation_steps: 2
batch_size: 10
eval_batch_size: 10

# Weights & Biases integration is switched off for this run.
wandb:
  enabled: false

# NOTE(review): exact effect of this flag is defined by the consuming code;
# presumably it selects a reduced/test variant of the dataset. Confirm.
test_dataset: true
