# Identifier for this task configuration.
name: alpaca
# Cap on the number of samples used.
# NOTE(review): -1 is presumably a "no limit" sentinel; confirm in the loader.
max_samples: -1

# Dataset source and the mapping of its fields onto the roles used by the task.
# NOTE(review): `name` looks like a Hugging Face Hub dataset id; confirm
# against the code that loads this section.
data:
  name: tatsu-lab/alpaca_eval
  # Explicit null: no subset is selected.
  subset: null
  split: eval
  # Presumably the record field holding the prompt text; verify in the consumer.
  question_field: instruction
  # Explicit null: no answer field is configured for this task.
  answer_field: null
  # NOTE(review): presumably the record field holding the response that model
  # output is compared against; confirm in the consumer.
  comparator_field: response

# Length limits for the prompt and the generated response.
# NOTE(review): units are presumably tokens; confirm in the consumer.
generation:
  max_response_length: 1024
  max_prompt_length: 1024

# NOTE(review): presumably the names of the metrics reported for this task;
# confirm in the consumer.
rstar_keys:
  - winrate

# Task description string; intentionally set to the empty string here.
# NOTE(review): this key is upper-case, unlike the other keys visible in this
# file. The consumer presumably looks it up by this exact name, so do not
# rename it without checking.
TASK_DESC: ""
