---
# Configuration for the "dpo-train-claim-rewriter" task.
# NOTE(review): the per-key notes below are inferred from key names and
# values only; confirm them against the code that consumes this file.

# Task identifier; presumably selects which task implementation runs.
type: 'dpo-train-claim-rewriter'

# Directory the task reads from; presumably holds the prepared DPO dataset.
input_dir: 'data/task_outputs/dpo_claim_rewriter_dataset/'

# Keep this in plain decimal notation: some YAML 1.1 loaders (e.g. PyYAML)
# resolve dot-less exponent forms such as 1e-6 to a string, not a float.
learning_rate: 0.000001

# Directory the task writes to; presumably receives the trained model.
output_dir: 'data/task_outputs/dpo_claim_rewriter_model/'

# Base model name; looks like a Hugging Face Hub repository id (TODO confirm).
model_name: 'meta-llama/Meta-Llama-3-8B-Instruct'

# Other configs this one depends on, keyed by role.
dependencies:
  # Presumably the config whose task produces `input_dir` (verify).
  dataset: 'configs/prepare_dpo_claim_rewriter_dataset.yaml'