# Group definition: bundles the eleven `mgsm_native_cot_*` subtasks under the
# single group name `mgsm` and declares how their metrics are rolled up.
group: mgsm

# Member subtasks. The two-letter suffixes look like language codes
# (bn, de, en, ...) — NOTE(review): confirm against the per-task configs.
task:
  - mgsm_native_cot_bn
  - mgsm_native_cot_de
  - mgsm_native_cot_en
  - mgsm_native_cot_es
  - mgsm_native_cot_fr
  - mgsm_native_cot_ja
  - mgsm_native_cot_ru
  - mgsm_native_cot_sw
  - mgsm_native_cot_te
  - mgsm_native_cot_th
  - mgsm_native_cot_zh

# Group-level aggregation: each listed metric is combined with `mean`.
# `weight_by_size: true` presumably weights each subtask by its example count
# rather than averaging subtasks equally — verify against the consumer.
aggregate_metric_list:
  - metric: accuracy
    aggregation: mean
    weight_by_size: true
  - metric: answer_accuracy
    aggregation: mean
    weight_by_size: true
  - metric: language_accuracy
    aggregation: mean
    weight_by_size: true

metadata:
  # Unquoted, so this loads as the float 2.0 (not a string); kept as-is so the
  # loaded type does not change for whatever reads it.
  version: 2.0
