
# LongBench "hotpotqa" task definition: answer a question from the supplied
# passages and score the generated answer.
task: longbench_hotpotqa
tag:
  - longbench_multi_tasks
  - longbench_tasks

# Dataset source: repository path, subset name, and the split to evaluate on.
dataset_path: Xnhyacinth/LongBench
dataset_name: hotpotqa
test_split: test

# Prompt template. The instruction is stated both before and after the
# passages. `{{context}}` and `{{question}}` are template placeholders
# (presumably filled from same-named dataset fields -- confirm against the
# dataset schema). The `|-` block scalar keeps newlines verbatim and strips the
# final one, so the prompt ends exactly at "Answer:".
doc_to_text: |-
  Answer the question based on the given passages. Only give me the answer and do not output any other words.

  The following are given passages.
  {{context}}

  Answer the question based on the given passages. Only give me the answer and do not output any other words.

  Question: {{question}}
  Answer:
doc_to_target: "{{answers}}"

# Scoring is delegated to a function referenced through the custom `!function`
# tag; it presumably yields the metric names listed in `metric_list` below --
# verify against the `metrics` module.
process_results: !function metrics.get_qa_f1_with_score

generation_kwargs:
  max_gen_toks: 32
  # NOTE(review): `do_sample` is false, so `temperature` presumably has no
  # effect on decoding -- confirm with the model backend before relying on it.
  temperature: 1
  do_sample: false
  # Explicit empty list (not null).
  until: []

# Both metrics are averaged across documents; larger values are better.
metric_list:
  - metric: score
    aggregation: mean
    higher_is_better: true
  - metric: qa_f1_score
    aggregation: mean
    higher_is_better: true

metadata:
  version: 5.0
