# Task identity and request type.
task: openbookqa_cot
output_type: generate_until

# Dataset source and the split that is evaluated.
# NOTE(review): the prompt template reads `fact1`; presumably that field is
# only available in the `additional` configuration — confirm.
dataset_path: allenai/openbookqa
dataset_name: additional
test_split: test

# Prompt template: shows the supporting fact and the question stem, then asks
# for step-by-step reasoning that ends with a line of the form
# "The answer is: <answer>" (the answer text, not the option letter).
# This is a literal block scalar (`|`): line breaks are kept and every
# character on a line is part of the prompt, so lines must not carry trailing
# whitespace.
doc_to_text: |
  Fact: {{fact1}}
  Question: {{question_stem}}

  Think step by step using relevant facts.
  Finally output the final answer text (not the letter) on its own line like "The answer is: <answer>".

# Gold answer template: walks `choices.label` and emits the entry of
# `choices.text` at the same position (loop.index0) when the label equals
# `answerKey`. The `-` whitespace-control markers on every tag trim the
# newlines and indentation around the tags from the rendered result.
# There is no else branch, so nothing is emitted if no label matches.
doc_to_target: |
  {%- for L in choices.label -%}
  {%- if L == answerKey -%}{{ choices.text[loop.index0] }}{%- endif -%}
  {%- endfor -%}

# Decoding settings: sampling parameters first, then the `until` strings.
generation_kwargs:
  do_sample: true
  temperature: 0.5
  top_p: 0.95
  # Kept in their original order. Entries that contain escape sequences stay
  # double-quoted so that `\n` is a real newline; the others are plain
  # literals and are single-quoted.
  until:
    - "\n\nQ:"
    - '</s>'
    - '<|im_end|>'
    - 'Q:'
    - 'Question: '
    - "\nAnswer:"

# Pass@5 wiring: `repeats` is 5, the same value as `k: 5` in the
# `take_first_five` filter further down, and sampling is switched on in
# generation_kwargs (`do_sample: true`). Keep these settings in step.
# NOTE(review): presumably `repeats` is the number of generations requested
# per document — confirm against the harness.
repeats: 5
num_fewshot: 0

# Disabled scoring variant, kept for reference: a custom `process_results`
# hook together with an `acc_fs4` metric. Do not uncomment its `metric_list`
# while the active one below is present — that would duplicate the key.

# process_results: !function utils.process_results_openbookqa_freeform

# metric_list:
#   - metric: acc_fs4
#     aggregation: mean
#     higher_is_better: true

# Active scoring: the metric is a function referenced through the `!function`
# tag (`utils.fs4_per_gen_list`); its values are aggregated with `mean`, and
# higher is better.
metric_list:
  - metric: !function utils.fs4_per_gen_list
    aggregation: mean
    higher_is_better: true

# Response filter pipeline: one named pipeline containing a single
# `take_first_k` step with k = 5, written as a compact flow mapping.
filter_list:
  - name: take_first_five
    filter:
      - {function: take_first_k, k: 5}
