# hotpot_support_sents_only.yaml
task: hotpot_support_only
output_type: generate_until

# Dataset source. "fullwiki" may be used in place of "distractor";
# both configurations contain supporting_facts.
dataset_path: hotpot_qa
dataset_name: distractor

# Split assignment: train is used for both training and few-shot examples,
# validation is used as the test split.
training_split: train
fewshot_split: train
test_split: validation

# Preprocessing hook, intended to keep only the gold supporting sentences
# (the function itself is defined in utils, not in this file).
process_docs: !function utils.hotpot_process_docs

# Prompt template: context (support_text), then the question, then the
# instruction asking for step-by-step reasoning and a final answer line.
doc_to_text: |
  Context:
  {{support_text}}

  Question: {{question}}

  Think step by step. Finally output the final answer on its own line in the format "The answer is: <answer>".
# Target template: the answer field rendered as a string, empty if undefined.
doc_to_target: >-
  {{ answer | default('') | string }}

# process_results: !function utils.process_results_freeform

# metric_list:
#   - metric: acc_fs4
#     aggregation: mean
#     higher_is_better: true

# Scoring: a custom metric function from utils, meant to be pass@5-compatible
# over k generations; results are aggregated with the mean, higher is better.
metric_list:
  - metric: !function utils.fs4_per_gen_list
    higher_is_better: true
    aggregation: mean

generation_kwargs:
  # Sampling is enabled so that repeated generations can differ.
  do_sample: true
  temperature: 0.5
  top_p: 0.95
  # Stop sequences: end-of-sequence markers plus strings that would begin
  # a new question or context section.
  until:
    - "\n\nQ:"
    - '</s>'
    - '<|im_end|>'
    - "\nQuestion:"
    - "\nContext:"

# Pass@5 setup: zero-shot prompts with five repeats per document.
num_fewshot: 0
repeats: 5

# Single filter pipeline applying take_first_k with k matching the repeat
# count above.
filter_list:
  - name: take_first_five
    filter:
      - function: take_first_k
        k: 5
