# Task "gsm1k": free-form generation over the `test` split of the
# ScaleAI/gsm1k dataset.
task: gsm1k
dataset_path: ScaleAI/gsm1k
output_type: generate_until
test_split: test

# Prompt template: the document's `question` field followed by a
# step-by-step cue. The reference is the document's `answer` field.
doc_to_text: "{{question}} Let's think step by step."
doc_to_target: '{{answer}}'

# Generation settings: sampling is on at temperature 0.1, capped at 1024
# generated tokens, with no stop sequences (`until` is an empty list).
generation_kwargs:
  max_gen_toks: 1024
  do_sample: true
  temperature: 0.1
  until: []

# Four repeats per document and no few-shot examples.
# NOTE(review): no filter step below reduces the repeats to a single
# response, so utils.exact_match presumably handles several responses per
# document itself -- confirm against utils.py.
repeats: 4
num_fewshot: 0

# Answer extraction. The pattern has two alternatives: an optional minus sign
# followed by two or more characters drawn from `$`, digits, `.`, and `,`; or
# an optional minus sign followed by one or more digits.
# NOTE(review): `group_select: -1` presumably picks the last match in the
# generation -- confirm against the regex filter implementation.
filter_list:
  - name: flexible-extract
    filter:
      - function: regex
        group_select: -1
        regex_pattern: '(-?[$0-9.,]{2,})|(-?[0-9]+)'

# Scoring: a project-local exact-match function, averaged over documents.
# The remaining keys are extra settings for that metric; their precise effect
# is defined in utils.exact_match, which is not visible here.
metric_list:
  - metric: !function utils.exact_match
    aggregation: mean
    higher_is_better: true
    ignore_case: true
    ignore_punctuation: false
    # Patterns, in order: a comma; a literal dollar sign; everything up to
    # and including "#### " (with `.` also matching newlines); and a period
    # at the end of the string.
    regexes_to_ignore:
      - ','
      - '\$'
      - '(?s).*#### '
      - '\.$'

metadata:
  version: 3.0
