# Top-level settings: the config's name and its sample limit.
# NOTE(review): `name` presumably identifies the task/benchmark — confirm
# against the code that loads this file.
name: tldr
# NOTE(review): presumably an upper bound on how many examples are used — confirm.
max_samples: 512


# Dataset source and field mapping.
data:
  # Dataset identifier; the `org/name` shape looks like a Hugging Face Hub
  # repo id — TODO confirm with the loader.
  name: 'trl-internal-testing/tldr-preference-sft-trl-style'
  # Explicit null: no subset is selected.
  subset: null
  split: 'test'
  # NOTE(review): the *_field values presumably name columns of the dataset —
  # verify against the consumer.
  question_field: 'prompt'
  # Explicit null: no answer field is configured.
  answer_field: null
  comparator_field: 'summary'

# Length limits for prompts and generated responses.
# NOTE(review): units are presumably tokens — confirm against the consumer.
generation:
  max_response_length: 200
  max_prompt_length: 1024

# List of keys consumed under the name `rstar_keys`; only `correct` is listed.
# NOTE(review): the meaning of these keys is defined by the consumer — confirm.
rstar_keys:
  - correct

# Task description, set to the empty string (not null).
# NOTE(review): the upper-case key differs from the snake_case keys elsewhere
# in this file; it is kept as-is because the consumer presumably looks it up
# by this exact name.
TASK_DESC: ''
