# Group definition: bundles the English-language AGIEval subtasks listed below
# under the single group name `agieval_en`.
group: agieval_en
# Subtasks that make up this group.
task:
  - agieval_aqua_rat
  # Categorized as EN because the AGIEval codebase lists this task in
  # `english_qa_tasks`.
  - agieval_gaokao_english
  - agieval_logiqa_en
  - agieval_lsat_ar
  - agieval_lsat_lr
  - agieval_lsat_rc
  - agieval_math
  - agieval_sat_en_without_passage
  - agieval_sat_en
  - agieval_sat_math
# Group-level score: the `acc` metric of the subtasks combined with a mean.
# NOTE(review): `weight_by_size: true` presumably weights each subtask by its
# number of examples (micro-average) rather than equally — confirm against the
# consuming harness's documentation.
aggregate_metric_list:
  - metric: acc
    aggregation: mean
    weight_by_size: true
metadata:
  # NOTE(review): unquoted, so this parses as the float 0.0 — confirm the
  # consumer expects a number here rather than a version string.
  version: 0.0
