# Group definition: bundles the per-subject mmlu_pro_* tasks listed below
# under the single group name `mmlu_pro`.
# NOTE(review): the key layout (group / task / aggregate_metric_list) looks
# like an lm-evaluation-harness group config; confirm against the consumer.
group: mmlu_pro
# Member tasks, one per subject (14 entries). Each name presumably refers to
# a task defined in a separate config not visible here; verify they exist.
task:
  - mmlu_pro_biology
  - mmlu_pro_business
  - mmlu_pro_chemistry
  - mmlu_pro_computer_science
  - mmlu_pro_economics
  - mmlu_pro_engineering
  - mmlu_pro_health
  - mmlu_pro_history
  - mmlu_pro_law
  - mmlu_pro_math
  - mmlu_pro_other
  - mmlu_pro_philosophy
  - mmlu_pro_physics
  - mmlu_pro_psychology
# Group-level score definitions; this list has a single entry.
aggregate_metric_list:
  # Requests a `mean` aggregation of the `exact_match` metric.
  - aggregation: mean
    metric: exact_match
    # Presumably weights each member task by its sample count, giving a
    # size-weighted mean rather than a plain mean over tasks. TODO confirm.
    weight_by_size: true
    # Presumably restricts aggregation to results produced under the filter
    # named `custom-extract`, which is not defined in this file. TODO confirm
    # that every member task declares a filter with this exact name.
    filter_list: custom-extract
metadata:
  # Unquoted, so YAML loaders resolve this to the float 2.0, not the string
  # "2.0". NOTE(review): confirm the consumer expects a numeric version.
  version: 2.0
