# Task identity and data source for an instruction-style MBPP evaluation.
# NOTE(review): the "64" suffix in the task name matches neither `repeats` (32)
# nor any `k` value in this file — confirm what it is meant to denote.
task: mbpp_inst64
# Dataset identifier and configuration name (presumably a Hugging Face Hub id).
dataset_path: google-research-datasets/mbpp
dataset_name: full
# NOTE(review): presumably flags that scoring executes model-generated code;
# confirm what opt-in the harness requires before running this task.
unsafe_code: true
# Free-form generation rather than likelihood scoring.
output_type: generate_until
# Split used for evaluation documents.
test_split: test
# Prompt template (Jinja): the task description (`text`) followed by the first
# three entries of `test_list`.
# NOTE(review): indices 0..2 are hard-coded, so this assumes every document
# carries at least three tests — confirm against the dataset.
doc_to_text: "You are an expert Python programmer, and here is your task:\n{{text}}\nYour code should pass these tests:\n{{test_list[0]}}\n{{test_list[1]}}\n{{test_list[2]}}"
# Target template (Jinja): when `is_fewshot` is defined, renders the reference
# `code` followed by a newline and a closing ``` fence; otherwise renders the
# same three test assertions that appear in the prompt.
doc_to_target: "{% if is_fewshot is defined %}{{code}}\n```{% else %}{{test_list[0]}}\n{{test_list[1]}}\n{{test_list[2]}}{% endif %}"
# A newline, an opening ```python fence, and a newline. Presumably prepended to
# the model's response so it continues directly with code; the closing fence in
# the few-shot target above pairs with it.
gen_prefix: "\n```python\n"
# Empty string — presumably nothing is inserted between prompt and target.
target_delimiter: ""
# Scoring: a single metric computed by the project-local helper
# `mbpp_utils.pass_at_k`, aggregated with `mean`; larger values are better.
metric_list:
  - metric: !function mbpp_utils.pass_at_k
    aggregation: mean
    higher_is_better: true
    # Values of k handed to the metric. The largest (32) equals `repeats`.
    k: [1, 4, 8, 16, 32]
# Decoding settings: stochastic sampling at temperature 0.6.
# NOTE(review): no generation-length cap is set in this file, so the limit
# presumably falls back to a harness or model default — confirm.
generation_kwargs:
  # Explicit empty list: no stop strings are configured here.
  until: []
  do_sample: true
  temperature: 0.6
# Number of repeats per document; presumably the pool of samples that pass@k
# is estimated from, which is why it matches the largest `k` (32) — confirm.
repeats: 32
# Number of few-shot examples placed before each evaluated document.
num_fewshot: 3
fewshot_config:
  # Presumably takes the leading examples in order rather than sampling at
  # random — confirm against the harness's sampler definitions.
  sampler: first_n
  # Few-shot examples are supplied by a project-local helper, not by a
  # dataset split.
  samples: !function mbpp_utils.list_fewshot_samples
# Post-processing of raw generations before scoring: one filter pipeline named
# `code_block`, consisting of a single custom step implemented by the
# project-local helper `mbpp_utils.build_predictions`.
filter_list:
  - name: code_block
    filter:
      - function: custom
        filter_fn: !function mbpp_utils.build_predictions
# Task metadata.
metadata:
  # NOTE(review): the unquoted 1.0 loads as a float, not a string. Left as-is
  # on the assumption that the consumer expects a number — confirm.
  version: 1.0