---
# Task group `flan_held_out`.
#
# Bundles the BBH and MMLU task variants listed under `task` so that they can
# be referred to collectively by the single group name above.
# NOTE(review): every entry is presumably the name of a task (or sub-group)
# defined elsewhere in the project -- confirm that each one resolves.
group: flan_held_out
task:
  # BBH variants: zero-shot and few-shot, plus the `cot` counterparts
  # (`cot` presumably stands for chain-of-thought -- confirm).
  - bbh_zeroshot
  - bbh_fewshot
  - bbh_cot_fewshot
  - bbh_cot_zeroshot
  # MMLU variants: the base `mmlu` entry followed by the `mmlu_flan_*`
  # n-shot (generative / loglikelihood) and `cot` entries.
  - mmlu
  - mmlu_flan_n_shot_generative
  - mmlu_flan_n_shot_loglikelihood
  - mmlu_flan_cot_zeroshot
  - mmlu_flan_cot_fewshot
