# Task: MMLU-Pro, prompted through the `only_options` text builder.
task: mmlu_pro_only_options_prompting

# --- Dataset -----------------------------------------------------------------
dataset_path: TIGER-Lab/MMLU-Pro
dataset_kwargs:
  trust_remote_code: true
test_split: test

# --- Prompt / target construction --------------------------------------------
# The `!function` tags point at `utils.process_docs` and `utils.only_options`;
# what those callables do is defined outside this file.
process_docs: !function utils.process_docs
doc_to_text: !function utils.only_options
doc_to_target: answer
repeats: 1

# --- Generation --------------------------------------------------------------
# Sampling is switched off and temperature is pinned to 0.0.
generation_kwargs:
  max_gen_toks: 2048
  do_sample: false
  temperature: 0.0
  until:
    - '</s>'
    - 'Q:'
    - '<|im_end|>'

# --- Answer extraction -------------------------------------------------------
filter_list:
  - name: 'custom-extract'
    filter:
      # Captures a single option letter A-J, optionally wrapped in
      # parentheses, that follows the literal text "answer is".
      # Alternative pattern kept for reference: .*[aA]nswer:\s*([A-J])
      - function: 'regex'
        regex_pattern: 'answer is \(?([ABCDEFGHIJ])\)?'
      - function: 'take_first'

# --- Scoring -----------------------------------------------------------------
metric_list:
  - metric: exact_match
    aggregation: mean
    higher_is_better: true
    ignore_case: true
    ignore_punctuation: true

metadata:
  version: 2.1

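# Inactive reference: a commented-out multiple-choice MMLU configuration.
# Several of its keys (dataset_path, test_split, doc_to_text, doc_to_target,
# metadata, dataset_kwargs) are also set by the active configuration in this
# file, so it cannot be uncommented as-is without creating duplicate keys.
#
# dataset_path: hails/mmlu_no_train # a copy of `cais/mmlu` with no auxiliary_train split
# output_type: multiple_choice
# test_split: test
# fewshot_split: dev
# fewshot_config:
#   sampler: first_n
# doc_to_text: "Question: {{question.strip()}}\nAnswer:"
# doc_to_choice: "{{choices}}"
# doc_to_target: "{{answer}}"
# metadata:
#   version: 1.0
# dataset_kwargs:
#   trust_remote_code: true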
