# Task name and the group label(s) it is listed under.
task: gsm8k_test
group:
  - math_word_problems

# Dataset identifier, its configuration name, and which split plays which role.
dataset_path: gsm8k
dataset_name: main
training_split: train
fewshot_split: train
test_split: test

# The model produces free-form text that is cut off at a stop string
# (see `generation_kwargs.until`).
output_type: generate_until

# Prompt template: an instruction/response wrapper around the document's
# `question` field, ending with a step-by-step cue. Written as a literal block
# scalar with strip chomping (`|-`), so line breaks are kept verbatim and no
# trailing newline is appended.
doc_to_text: |-
  Below is an instruction that describes a task. Write a response that appropriately completes the request.

  ### Instruction:
  {{question}}

  ### Response: Let's think step by step.

# Reference answer: the text after the last '### ' in the `answer` field,
# with trailing whitespace stripped.
doc_to_target: "{{answer.split('### ')[-1].rstrip()}}"
# Scoring: a single exact-match metric, averaged over documents.
metric_list:
  - metric: exact_match
    aggregation: mean
    higher_is_better: true
    # Comparison is case-insensitive; punctuation is NOT stripped wholesale,
    # only the specific patterns listed below are ignored.
    ignore_case: true
    ignore_punctuation: false
    # Regular expressions ignored during comparison. Single-quoted so the
    # backslashes are literal (no YAML escape processing).
    regexes_to_ignore:
      # Any comma (e.g. thousands separators).
      - ','
      # A literal dollar sign.
      - '\$'
      # Everything up to and including the last "#### " (dot matches newlines).
      - '(?s).*#### '
      # A period at the very end of the string.
      - '\.$'
# Decoding settings passed along with each generation request.
generation_kwargs:
  # Stop strings: generation is cut at the first occurrence of any of these.
  # NOTE(review): the prompt in `doc_to_text` uses "### Instruction:" /
  # "### Response:" markers, not a "Q:" prefix -- confirm "Q:" is the intended
  # stop string for this prompt format.
  until:
    - "Q:"
    - "</s>"
    - "<|im_end|>"
  # Sampling is disabled.
  do_sample: false
  # Cap on the number of generated tokens.
  max_gen_toks: 1024
# One generation per document, with no few-shot examples in the prompt.
repeats: 1
num_fewshot: 0

# Post-processing applied to model output before scoring.
filter_list:
  - name: custom-strict-match
    filter:
      # NOTE(review): `get_answer` is not defined in this file; presumably it
      # is a filter registered elsewhere in the project -- confirm it exists.
      - function: get_answer

# Config version marker (kept as a number, not a string).
metadata:
  version: 3.0