# Task identity and data source.
# `task` is the name this configuration is registered under.
task: mbpp
# Dataset repository path and the configuration/subset to load from it.
dataset_path: google-research-datasets/mbpp
dataset_name: sanitized
# NOTE(review): presumably an explicit acknowledgement that scoring executes
# model-generated code; confirm against the consuming harness.
unsafe_code: true
# Free-form generation; the stop strings are listed under `generation_kwargs`.
output_type: generate_until
# Split whose documents are evaluated.
test_split: test
# Prompt template (Jinja). Renders the task description from `prompt`, the
# first three entries of `test_list` on separate lines, and a final `[BEGIN]`
# marker followed by a newline. The `|` indicator keeps exactly one trailing
# newline, so the rendered prompt ends with "[BEGIN]\n".
doc_to_text: |
  You are an expert Python programmer, and here is your task: {{prompt}} Your code should pass these tests:

  {{test_list[0]}}
  {{test_list[1]}}
  {{test_list[2]}}
  [BEGIN]
# Target template (Jinja). When `is_fewshot` is defined it renders the
# reference `code` followed by a `[DONE]` line; otherwise it renders the three
# test cases. The `|-` indicator strips the trailing newline.
doc_to_target: |-
  {% if is_fewshot is defined %}{{code}}
  [DONE]{% else %}{{test_list[0]}}
  {{test_list[1]}}
  {{test_list[2]}}{% endif %}
# Empty string.
# NOTE(review): presumably the separator placed between prompt and target;
# the prompt already ends with a newline after `[BEGIN]`.
target_delimiter: ''
# Scoring: one metric, computed by `pass_at_1` from the task's `utils` module
# (resolved through the custom `!function` tag).
metric_list:
  - metric: !function utils.pass_at_1
    # Per-document scores are averaged; larger values are better.
    aggregation: mean
    higher_is_better: true
# Post-processing of model output: a single pipeline named `extract_code`
# with one custom step that delegates to `utils.build_predictions`.
# NOTE(review): presumably this step pulls the code out of the raw
# generation before scoring; confirm in `utils`.
filter_list:
  - name: extract_code
    filter:
      - function: custom
        filter_fn: !function utils.build_predictions
# Generation settings.
generation_kwargs:
  # Stop string: the same `[DONE]` marker that closes each few-shot target in
  # `doc_to_target`. It must stay quoted because a leading `[` would otherwise
  # start a YAML flow sequence.
  until:
    - '[DONE]'
  # Sampling is disabled.
  do_sample: false
# Few-shot setup: three examples are requested.
num_fewshot: 3
fewshot_config:
  # NOTE(review): `first_n` presumably takes the leading entries of the sample
  # list in order rather than sampling randomly; confirm against the harness.
  sampler: first_n
  # Example pool supplied by `list_fewshot_samples` in the task's `utils`
  # module (resolved through the custom `!function` tag).
  samples: !function utils.list_fewshot_samples
# Task metadata.
metadata:
  # Unquoted, so YAML loaders read this as the float 1.0 rather than a string.
  version: 1.0