{
  "baselines": {
    "keyword_heuristic": {
      "accuracy": 0.18057455540355677,
      "macro_f1": 0.019529379114384876,
      "top1_accuracy": 0.18057455540355677,
      "top3_accuracy": 0.46511627906976744,
      "top5_accuracy": 0.6046511627906976
    },
    "majority_class": {
      "accuracy": 0.17510259917920656,
      "macro_f1": 0.005518906566636485,
      "top1_accuracy": 0.17510259917920656,
      "top3_accuracy": 0.493844049247606,
      "top5_accuracy": 0.6046511627906976
    },
    "text_naive_bayes": {
      "accuracy": 0.35567715458276333,
      "macro_f1": 0.04563250656689107,
      "top1_accuracy": 0.35567715458276333,
      "top3_accuracy": 0.5868673050615595,
      "top5_accuracy": 0.66484268125855
    },
    "tfidf_linear_svm": {
      "accuracy": 0.33652530779753764,
      "macro_f1": 0.13257033663091922,
      "top1_accuracy": 0.33652530779753764,
      "top3_accuracy": 0.5430916552667578,
      "top5_accuracy": 0.6306429548563611
    },
    "tfidf_logistic_regression": {
      "accuracy": 0.18741450068399454,
      "macro_f1": 0.11436214894109277,
      "top1_accuracy": 0.18741450068399454,
      "top3_accuracy": 0.32558139534883723,
      "top5_accuracy": 0.46238030095759236
    }
  },
  "label_distribution": {
    "ac_rfl": 19,
    "aesop": 67,
    "all_goals": 2,
    "apply": 31,
    "by_cases": 12,
    "by_cases!": 1,
    "by_contra": 5,
    "by_contra!": 2,
    "calc": 8,
    "cases": 17,
    "choose": 1,
    "classical": 5,
    "congr": 3,
    "constructor": 17,
    "contradiction": 1,
    "contrapose!": 5,
    "conv_lhs": 5,
    "conv_rhs": 4,
    "convert": 13,
    "decide": 23,
    "dsimp": 2,
    "exact": 207,
    "exacts": 2,
    "exists": 2,
    "ext": 31,
    "ext1": 1,
    "fun_prop": 1,
    "gcongr": 3,
    "grind": 182,
    "grw": 5,
    "have": 61,
    "if": 13,
    "induction": 24,
    "injection": 1,
    "intro": 31,
    "let": 10,
    "letI": 1,
    "lia": 18,
    "linarith": 1,
    "norm_cast": 2,
    "nth_rw": 3,
    "obtain": 47,
    "positivity": 3,
    "push": 1,
    "push_neg": 1,
    "rcases": 47,
    "refine": 64,
    "replace": 2,
    "revert": 1,
    "rfl": 14,
    "right": 2,
    "ring": 1,
    "rintro": 41,
    "rw": 487,
    "rw!": 2,
    "rwa": 30,
    "set": 2,
    "show": 2,
    "simp": 423,
    "simp_all": 14,
    "simp_all!": 3,
    "simp_rw": 40,
    "simpa": 84,
    "specialize": 1,
    "split_ifs": 5,
    "subst": 9,
    "suffices": 6,
    "symm": 2,
    "tauto": 2,
    "unfold": 8,
    "use": 12,
    "zify": 1
  },
  "representation": "premise",
  "split": {
    "n_rows": 2199,
    "n_test": 731,
    "n_test_theorems": 307,
    "n_train": 1468,
    "n_train_theorems": 715,
    "seed": 3,
    "strategy": "theorem-level random split",
    "test_ratio": 0.3,
    "test_theorems": [
      "AddCommGroup.Int.ModEq.ModEq.add",
      "AddCommGroup.Int.ModEq.ModEq.add_modEq_left",
      "AddCommGroup.Int.ModEq.ModEq.add_modulus_modEq_iff",
      "AddCommGroup.Int.ModEq.ModEq.add_mul_modulus_modEq_iff",
      "AddCommGroup.Int.ModEq.ModEq.add_right_cancel",
      "AddCommGroup.Int.ModEq.ModEq.cancel_left_div_gcd",
      "AddCommGroup.Int.ModEq.ModEq.dvd_iff",
      "AddCommGroup.Int.ModEq.ModEq.left_modEq_add_iff",
      "AddCommGroup.Int.ModEq.ModEq.modEq_abs",
      "AddCommGroup.Int.ModEq.ModEq.modEq_add_fac_self",
      "AddCommGroup.Int.ModEq.ModEq.modEq_iff_eq_of_div_eq",
      "AddCommGroup.Int.ModEq.ModEq.mul_left'",
      "AddCommGroup.Int.ModEq.ModEq.mul_modulus_add_modEq_iff",
      "AddCommGroup.Int.ModEq.ModEq.mul_right'",
      "AddCommGroup.Int.ModEq.ModEq.mul_right_cancel'",
      "AddCommGroup.Int.ModEq.ModEq.sub",
      "AddCommGroup.Int.ModEq.modEq_neg",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.add_div_eq_of_le_mod_add_mod",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.add_mod_of_add_mod_lt",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.chineseRemainder'_lt_lcm",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.dvd_iff",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.le_mod_add_mod_of_dvd_add_of_not_dvd",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.modEq_iff_eq_of_div_eq",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.odd_mod_four_iff",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.odd_mul_odd",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.odd_mul_odd_div_two",
      "AddCommGroup.Nat.ModEq.ModEq.add_modEq_left",
      "AddCommGroup.Nat.ModEq.ModEq.add_right_cancel",
      "AddCommGroup.Nat.ModEq.ModEq.modEq_add_mul_modulus_iff",
      "AddCommGroup.Nat.ModEq.ModEq.modEq_modulus_mul_add_iff",
      "AddCommGroup.Nat.ModEq.ModEq.modulus_add_modEq_iff",
      "AddCommGroup.Nat.ModEq.ModEq.mul_left'",
      "AddCommGroup.Nat.ModEq.ModEq.mul_left_cancel'",
      "AddCommGroup.Nat.ModEq.ModEq.mul_modulus_add_modEq_iff",
      "AddCommGroup.Nat.ModEq.ModEq.mul_right",
      "AddCommGroup.Nat.ModEq.ModEq.of_mul_left",
      "Bool.coe_false",
      "Bool.coe_sort_false",
      "Bool.coe_sort_true",
      "Bool.coe_true",
      "Bool.decide_iff",
      "Bool.dichotomy",
      "Bool.injective_iff",
      "Bool.le_iff_imp",
      "Bool.not_eq_iff",
      "Bool.not_ne_self",
      "Bool.or_eq_false_eq_eq_false_and_eq_false",
      "Bool.or_inl",
      "Bool.self_ne_not",
      "Bool.toNat_beq_zero",
      "Bool.toNat_bne_one",
      "Bool.toNat_bne_zero",
      "Bool.toNat_le_toNat",
      "Even.mul_left",
      "Even.mul_right",
      "Even.pow_of_ne_zero",
      "Finset.Multiset.List.Finset.Equiv.Finset.union_symm_left",
      "Finset.Multiset.List.Finset.Equiv.Finset.union_symm_right",
      "Finset.Multiset.List.Finset.Equiv.Multiset.Finset.univ_finset_of_isEmpty",
      "Finset.Multiset.List.Finset.Equiv.Multiset.toFinset_replicate",
      "Finset.Multiset.List.Finset.Equiv.piFinsetUnion_left",
      "Finset.Multiset.List.Finset.empty_toList",
      "Finset.Multiset.List.toFinset_cons",
      "Finset.Multiset.List.toFinset_eq_empty_iff",
      "Finset.Multiset.List.toFinset_filter",
      "Finset.Multiset.List.toFinset_inter",
      "Finset.Multiset.List.toFinset_nonempty_iff",
      "Finset.Multiset.List.toFinset_replicate_of_ne_zero",
      "Finset.Multiset.toFinset_add",
      "Finset.Multiset.toFinset_filter",
      "Finset.Multiset.toFinset_union",
      "Finset.Nonempty.cons_induction",
      "Finset.Nonempty.of_disjSups_left",
      "Finset.Nonempty.of_disjSups_right",
      "Finset.attach_nonempty_iff",
      "Finset.coe_eq_pair",
      "Finset.coe_subset_singleton",
      "Finset.compls_compls",
      "Finset.compls_infs",
      "Finset.compls_subset_iff",
      "Finset.cons_induction",
      "Finset.disjSups_assoc",
      "Finset.disjSups_disjSups_disjSups_comm",
      "Finset.disjSups_empty_right",
      "Finset.disjSups_left_comm",
      "Finset.disjSups_subset_sups",
      "Finset.disjSups_union_right",
      "Finset.disjUnion_eq_union",
      "Finset.disjoint_erase_insert",
      "Finset.disjoint_filter",
      "Finset.disjoint_or_nonempty_inter",
      "Finset.erase_cons_of_ne",
      "Finset.erase_eq_iff_eq_insert",
      "Finset.erase_injOn'",
      "Finset.erase_inter_comm",
      "Finset.erase_nonempty",
      "Finset.erase_sdiff_distrib",
      "Finset.erase_singleton",
      "Finset.erase_union_distrib",
      "Finset.filter_and",
      "Finset.filter_and_not",
      "Finset.filter_cons",
      "Finset.filter_inter",
      "Finset.filter_ne",
      "Finset.filter_ne'",
      "Finset.filter_not",
      "Finset.filter_notMem_eq_sdiff",
      "Finset.filter_or",
      "Finset.filter_union",
      "Finset.image_compl",
      "Finset.infs_compls_eq_diffs",
      "Finset.insert_eq_self",
      "Finset.inter_erase",
      "Finset.mem_diffs",
      "Finset.nonempty_mk",
      "Finset.not_disjoint_iff_nonempty_inter",
      "Finset.pairwiseDisjoint_iff",
      "Finset.powerset_infs_powerset_self",
      "Finset.range_inter_range",
      "Finset.range_union_range",
      "Finset.sdiff_eq_filter",
      "Finset.sdiff_singleton_eq_erase",
      "Finset.ssubset_singleton_iff",
      "Finset.univ_infs_univ",
      "Fintype.card_eq_card_units_add_one",
      "Fintype.card_units",
      "HasSubset.Subset.diff_ssubset_of_nonempty",
      "Int.Prime.dvd_natAbs_of_coe_dvd_sq",
      "Int.nonneg_or_nonpos_of_mul_nonneg",
      "Int.sqrt_eq",
      "List.IsRotated.cons_append_singleton",
      "List.IsRotated.cyclicPermutations",
      "List.IsRotated.dropLast_tail",
      "List.IsRotated.symm",
      "List.IsRotated.trans",
      "List.Nodup.cyclicPermutations",
      "List.Nodup.rotate_congr",
      "List.Nodup.rotate_congr_iff",
      "List.count_diff",
      "List.getElem?_iterate",
      "List.getElem_cyclicPermutations",
      "List.isRotated_nil_iff",
      "List.isRotated_reverse_comm_iff",
      "List.isRotated_reverse_iff",
      "List.isRotated_singleton_iff'",
      "List.length_cyclicPermutations_of_ne_nil",
      "List.length_iterate",
      "List.length_rotate'",
      "List.map_rotate",
      "List.mem_cyclicPermutations_iff",
      "List.mem_iterate",
      "List.nil_eq_rotate_iff",
      "List.range_map_iterate",
      "List.reverse_rotate",
      "List.rotate'_eq_drop_append_take",
      "List.rotate'_length",
      "List.rotate'_length_mul",
      "List.rotate_append_length_eq",
      "List.rotate_eq_self_iff_eq_replicate",
      "List.rotate_length",
      "List.rotate_rotate",
      "List.rotate_zero",
      "List.take_iterate",
      "List.zipWith_rotate_one",
      "Multiset.sum_map_div",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.NNReal.Real.sum_mul_le_sqrt_mul_sqrt",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.lt_sq_of_sqrt_lt",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.nat_sqrt_le_real_sqrt",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.sq_lt",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.sqrt_div_self'",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.sqrt_prod",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.sqrt_two_lt_three_halves",
      "NNReal.Real.comap_sqrt_atTop",
      "NNReal.Real.sq_le",
      "NNReal.Real.sqrt_eq_iff_mul_self_eq_of_pos",
      "NNReal.Real.sqrt_eq_zero'",
      "NNReal.Real.sqrt_inj",
      "NNReal.Real.sqrt_lt",
      "NNReal.Real.sqrt_mul_self_eq_abs",
      "NNReal.Real.sqrt_one",
      "NNReal.Real.sqrt_zero",
      "NNReal.sqrt_eq_one",
      "NNReal.sqrt_mul",
      "NNReal.sqrt_zero",
      "Nat.Even.sub_odd",
      "Nat.Function.Involutive.Even.neg_zpow",
      "Nat.Function.Involutive.iterate_eq_id",
      "Nat.Function.Involutive.iterate_eq_self",
      "Nat.Function.Involutive.iterate_even",
      "Nat.Function.Involutive.natCast_eq_zero_or_one_of_two_eq_zero",
      "Nat.Function.Involutive.neg_one_pow_eq_ite",
      "Nat.Ico_filter_pow_dvd_eq",
      "Nat.Odd.sub_odd",
      "Nat.Prime.coprime_choose_of_lt",
      "Nat.Prime.dvd_iff_eq",
      "Nat.Prime.factorization_self",
      "Nat.Prime.pow_inj",
      "Nat.card_multiples'",
      "Nat.coprime_fintype_prod_right_iff",
      "Nat.coprime_multiset_prod_left_iff",
      "Nat.descFactorial_eq_prod_range",
      "Nat.div_two_mul_two_add_one_of_odd",
      "Nat.eq_iff_prime_padicValNat_eq",
      "Nat.even_xor_odd'",
      "Nat.exists_eq_pow_of_exponent_coprime_of_pow_eq_pow",
      "Nat.factorization_eq_card_pow_dvd",
      "Nat.factorization_eq_card_pow_dvd_of_lt",
      "Nat.factorization_eq_of_coprime_left",
      "Nat.factorization_gcd",
      "Nat.factorization_le_of_le_pow",
      "Nat.factorization_prod_apply",
      "Nat.mod_two_add_succ_mod_two",
      "Nat.ne_one_iff_exists_prime_dvd",
      "Nat.not_dvd_ordCompl",
      "Nat.not_even_two_mul_add_one",
      "Nat.not_odd_iff",
      "Nat.not_prime_iff_exists_mul_eq",
      "Nat.not_prime_mul",
      "Nat.odd_pow_iff",
      "Nat.ordCompl_eq_self_iff_zero_or_not_dvd",
      "Nat.ordCompl_mul",
      "Nat.ordCompl_pos",
      "Nat.ordCompl_self_pow_mul",
      "Nat.ordProj_of_not_prime",
      "Nat.ordProj_pos",
      "Nat.pairwise_coprime_pow_primeFactors_factorization",
      "Nat.prime_iff_prime_int",
      "Nat.prime_mul_iff",
      "Nat.prod_factorial_dvd_factorial_sum",
      "Nat.prod_pow_primeFactors_factorization",
      "Nat.prod_primeFactors_dvd",
      "Nat.psub'_eq_psub",
      "Nat.psub_eq_some",
      "Nat.setOf_pow_dvd_eq_Icc_factorization",
      "Nat.sub_eq_psub",
      "Odd.neg_one_pow",
      "Odd.pow_add_pow_eq_zero",
      "Set.Icc_union_Ici",
      "Set.Ici_diff_Ici",
      "Set.Ico_eq_Ico_iff",
      "Set.Ico_inter_Ico",
      "Set.Ico_union_Ici'",
      "Set.Iic_union_Ioc",
      "Set.Iic_union_Ioc'",
      "Set.Iio_union_Ioo'",
      "Set.Ioc_diff_Ioi",
      "Set.Ioc_inter_Ioc",
      "Set.Ioc_inter_Ioi",
      "Set.Ioc_inter_Ioo_of_left_lt",
      "Set.Ioc_subset_Ioc_iff",
      "Set.Ioc_union_Ioc_right",
      "Set.Ioi_diff_Ioi",
      "Set.Ioi_subset_Ioi_iff",
      "Set.Ioo_inter_Ioo",
      "Set.Ioo_union_Ioi",
      "Set.Ioo_union_Ioi'",
      "Set.diff_singleton_eq_self",
      "Set.inl_compl_union_inr_compl",
      "Set.insert_diff_insert",
      "Set.insert_diff_of_notMem",
      "Set.insert_diff_self_of_mem",
      "Set.insert_diff_self_of_notMem",
      "Set.insert_diff_singleton",
      "Set.ite_empty_left",
      "Set.ite_empty_right",
      "Set.ite_inter_inter",
      "Set.ncard_Iic_nat",
      "Set.subset_insert_diff_singleton",
      "Set.subset_inter_union_compl_left",
      "Set.subset_ite",
      "Set.symmDiff_union_subset",
      "Set.union_inter_compl_left_subset",
      "SetRel.Function.SetRel.exists_graph_eq_iff",
      "SetRel.Function.graph_id",
      "SetRel.cod_univ",
      "SetRel.comp_assoc",
      "SetRel.core_inter",
      "SetRel.dom_empty",
      "SetRel.dom_univ",
      "SetRel.image_eq_biUnion",
      "SetRel.image_union",
      "SetRel.inv_eq_self_iff",
      "SetRel.left_subset_comp",
      "SetRel.preimage_empty_right",
      "SetRel.preimage_iUnion",
      "SetRel.preimage_id",
      "SetRel.preimage_union",
      "compl_le_of_compl_le",
      "compl_sdiff",
      "compl_sup_eq_top",
      "disjoint_sdiff_comm",
      "disjoint_sdiff_iff_le",
      "even_iff_exists_two_mul",
      "even_sub_two",
      "inf_sdiff",
      "inf_sdiff_eq_bot_iff",
      "inf_sdiff_left_comm",
      "le_iff_eq_sup_sdiff",
      "odd_sub_one",
      "sdiff_eq_symm",
      "sdiff_lt_left",
      "sdiff_sdiff_right",
      "sdiff_sdiff_sdiff_cancel_right",
      "sdiff_sup",
      "sdiff_sup_self'",
      "star_finsuppSum",
      "sup_eq_sdiff_sup_sdiff_sup_inf"
    ]
  }
}