# Task identity and how model output is obtained (free-form generation).
task: qasc_cot
output_type: generate_until

# Dataset source. Evaluation reads the split named `validation`
# (presumably because the public test split has no answer keys — confirm).
dataset_path: allenai/qasc
dataset_name: default
test_split: validation

# Prompt template (Jinja): lists the two supporting facts and the question,
# then asks for step-by-step reasoning that ends with a line of the form
# "The answer is: <answer>".
# Keep this block free of trailing spaces: inside a literal block scalar they
# become part of the prompt text sent to the model.
doc_to_text: |
  Facts:
  1. {{fact1}}
  2. {{fact2}}

  Question: {{question}}

  Think step by step using relevant facts.
  Finally output the final answer text (not the letter) on its own line like "The answer is: <answer>".


# Gold target (Jinja): walks the choice labels and emits the text of the choice
# whose label equals `answerKey`. The `-` whitespace-control markers strip the
# whitespace around every tag, so only the answer text is rendered.
doc_to_target: |
  {%- for choice_label in choices.label -%}
  {%- if choice_label == answerKey -%}{{ choices.text[loop.index0] }}{%- endif -%}
  {%- endfor -%}

generation_kwargs:
  # Stop strings. Double quotes are used only where "\n" escapes are required;
  # the remaining entries are plain literals and are single-quoted.
  # NOTE(review): 'Question:' also appears in the prompt template; if a model
  # restates it while reasoning, generation would presumably stop early — confirm
  # this is intended.
  until:
    - "\n\nQ:"
    - '</s>'
    - '<|im_end|>'
    - 'Question:'
    - "\nAnswer:"
  # Sampling is enabled (non-greedy decoding).
  do_sample: true
  temperature: 0.5
  top_p: 0.95


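# Disabled alternative scoring configuration, kept for reference only.
# The active metric_list is the uncommented one further down in this file.
# process_results: !function utils.process_results_qasc_freeform

# metric_list:
#   - metric: acc_fs4
#     aggregation: mean
#     higher_is_better: true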
num_fewshot: 0  # no few-shot examples are requested
repeats: 5  # same value as `k` in the take_first_five filter

# Scoring: the metric is referenced through the custom `!function` tag as
# `utils.fs4_per_gen_list` (defined outside this file, not visible here).
# Per-document scores are aggregated with `mean`; higher is better.
metric_list:
  - metric: !function utils.fs4_per_gen_list
    aggregation: mean
    higher_is_better: true

# Response filtering: a single pipeline named `take_first_five` that applies
# `take_first_k` with k=5. k equals `repeats`, so presumably every sampled
# generation is passed on to the metric — confirm against the harness.
filter_list:
  - name: take_first_five
    filter:
      - function: take_first_k
        k: 5
