# Group definition for `mmlu_continuation`, shown under the alias
# "mmlu (continuation)".
#
# Layout: four nested sub-groups (stem, other, social sciences, humanities),
# each wrapping a single `mmlu_continuation_*` entry. Every level, including
# the top-level group, aggregates `acc` and `acc_norm` with `weight_by_size`
# enabled.
# NOTE(review): `weight_by_size` presumably weights each member's score by its
# sample count when averaging -- confirm against the harness documentation.
#
# `acc_mutual_info` is left disabled at every level. Deleting the leading "# "
# from both lines of a disabled entry yields correctly indented YAML.
group: mmlu_continuation
group_alias: mmlu (continuation)
task:
  # Sub-group: stem
  - group: stem
    task:
      - mmlu_continuation_stem
    aggregate_metric_list:
      - metric: acc
        weight_by_size: true
      - metric: acc_norm
        weight_by_size: true
      # - metric: acc_mutual_info
        # weight_by_size: true
  # Sub-group: other
  - group: other
    task:
      - mmlu_continuation_other
    aggregate_metric_list:
      - metric: acc
        weight_by_size: true
      - metric: acc_norm
        weight_by_size: true
      # - metric: acc_mutual_info
        # weight_by_size: true
  # Sub-group: social sciences (the group name contains a space; the wrapped
  # entry name uses an underscore instead)
  - group: social sciences
    task:
      - mmlu_continuation_social_sciences
    aggregate_metric_list:
      - metric: acc
        weight_by_size: true
      - metric: acc_norm
        weight_by_size: true
      # - metric: acc_mutual_info
        # weight_by_size: true
  # Sub-group: humanities
  - group: humanities
    task:
      - mmlu_continuation_humanities
    aggregate_metric_list:
      - metric: acc
        weight_by_size: true
      - metric: acc_norm
        weight_by_size: true
      # - metric: acc_mutual_info
        # weight_by_size: true
# Aggregation for the top-level `mmlu_continuation` group itself; lists the
# same metrics as each sub-group above.
aggregate_metric_list:
  - metric: acc
    weight_by_size: true
  - metric: acc_norm
    weight_by_size: true
  # - metric: acc_mutual_info
    # weight_by_size: true
# Version tag of this configuration.
metadata:
  version: 2
