# Task identity: registered name plus the tag(s) it is listed under.
task: kobest_hellaswag
tag:
  - kobest

# Dataset location and the configuration (subset) name to load.
dataset_path: skt/kobest_v1
dataset_name: hellaswag

# Split selection for training, validation and test.
training_split: train
validation_split: validation
test_split: test

# Each document is scored as a multiple-choice item.
output_type: multiple_choice

# Documents are first passed through a helper defined in the sibling `utils`
# module. NOTE(review): presumably this helper supplies the `query` and
# `choices` fields referenced below — confirm in utils.
process_docs: !function utils.hellaswag_process_doc

# Prompt, candidate answers and gold answer are taken from the document
# fields `query`, `choices` and `label` respectively.
doc_to_text: "{{query}}"
doc_to_choice: "choices"
doc_to_target: "{{label}}"
# Metrics reported for this task. Every metric is flagged higher-is-better.
# Booleans are written in canonical lowercase form throughout.
metric_list:
  # Accuracy, averaged over documents.
  - metric: acc
    aggregation: mean
    higher_is_better: true
  # acc_norm, averaged over documents.
  - metric: acc_norm
    aggregation: mean
    higher_is_better: true
  # F1, aggregated by a helper defined in the sibling `utils` module rather
  # than by a plain mean.
  # NOTE(review): `average` and `hf_evaluate` are presumably consumed by the
  # evaluation harness when it resolves the f1 metric — confirm against the
  # harness before changing them.
  - metric: f1
    aggregation: !function utils.macro_f1_score
    average: macro
    hf_evaluate: true
    higher_is_better: true
# Task metadata.
metadata:
  # Unquoted, so YAML loads this as the float 1.0 rather than a string.
  version: 1.0
