{
  "baselines": {
    "keyword_heuristic": {
      "accuracy": 0.1752738654147105,
      "macro_f1": 0.02297342456591411,
      "top1_accuracy": 0.1752738654147105,
      "top3_accuracy": 0.47417840375586856,
      "top5_accuracy": 0.6494522691705791
    },
    "majority_class": {
      "accuracy": 0.2347417840375587,
      "macro_f1": 0.007455453664355476,
      "top1_accuracy": 0.2347417840375587,
      "top3_accuracy": 0.5179968701095462,
      "top5_accuracy": 0.6557120500782473
    },
    "text_naive_bayes": {
      "accuracy": 0.325508607198748,
      "macro_f1": 0.051968737861647345,
      "top1_accuracy": 0.325508607198748,
      "top3_accuracy": 0.6009389671361502,
      "top5_accuracy": 0.7183098591549296
    },
    "tfidf_linear_svm": {
      "accuracy": 0.15023474178403756,
      "macro_f1": 0.06862254878686994,
      "top1_accuracy": 0.15023474178403756,
      "top3_accuracy": 0.3082942097026604,
      "top5_accuracy": 0.48200312989045385
    },
    "tfidf_logistic_regression": {
      "accuracy": 0.0892018779342723,
      "macro_f1": 0.051073000596877555,
      "top1_accuracy": 0.0892018779342723,
      "top3_accuracy": 0.2222222222222222,
      "top5_accuracy": 0.3489827856025039
    }
  },
  "label_distribution": {
    "ac_rfl": 19,
    "aesop": 67,
    "all_goals": 2,
    "apply": 31,
    "by_cases": 12,
    "by_cases!": 1,
    "by_contra": 5,
    "by_contra!": 2,
    "calc": 8,
    "cases": 17,
    "choose": 1,
    "classical": 5,
    "congr": 3,
    "constructor": 17,
    "contradiction": 1,
    "contrapose!": 5,
    "conv_lhs": 5,
    "conv_rhs": 4,
    "convert": 13,
    "decide": 23,
    "dsimp": 2,
    "exact": 207,
    "exacts": 2,
    "exists": 2,
    "ext": 31,
    "ext1": 1,
    "fun_prop": 1,
    "gcongr": 3,
    "grind": 182,
    "grw": 5,
    "have": 61,
    "if": 13,
    "induction": 24,
    "injection": 1,
    "intro": 31,
    "let": 10,
    "letI": 1,
    "lia": 18,
    "linarith": 1,
    "norm_cast": 2,
    "nth_rw": 3,
    "obtain": 47,
    "positivity": 3,
    "push": 1,
    "push_neg": 1,
    "rcases": 47,
    "refine": 64,
    "replace": 2,
    "revert": 1,
    "rfl": 14,
    "right": 2,
    "ring": 1,
    "rintro": 41,
    "rw": 487,
    "rw!": 2,
    "rwa": 30,
    "set": 2,
    "show": 2,
    "simp": 423,
    "simp_all": 14,
    "simp_all!": 3,
    "simp_rw": 40,
    "simpa": 84,
    "specialize": 1,
    "split_ifs": 5,
    "subst": 9,
    "suffices": 6,
    "symm": 2,
    "tauto": 2,
    "unfold": 8,
    "use": 12,
    "zify": 1
  },
  "representation": "structured",
  "split": {
    "n_rows": 2199,
    "n_test": 639,
    "n_test_theorems": 307,
    "n_train": 1560,
    "n_train_theorems": 715,
    "seed": 42,
    "strategy": "theorem-level random split",
    "test_ratio": 0.3,
    "test_theorems": [
      "AddCommGroup.Int.ModEq.ModEq.add_left_cancel",
      "AddCommGroup.Int.ModEq.ModEq.add_modEq_right",
      "AddCommGroup.Int.ModEq.ModEq.add_modEq_right_iff",
      "AddCommGroup.Int.ModEq.ModEq.existsUnique_equiv",
      "AddCommGroup.Int.ModEq.ModEq.existsUnique_equiv_nat",
      "AddCommGroup.Int.ModEq.ModEq.left_modEq_add_iff",
      "AddCommGroup.Int.ModEq.ModEq.modEq_abs",
      "AddCommGroup.Int.ModEq.ModEq.modEq_add_fac",
      "AddCommGroup.Int.ModEq.ModEq.modEq_add_modulus_iff",
      "AddCommGroup.Int.ModEq.ModEq.modEq_modulus_add_iff",
      "AddCommGroup.Int.ModEq.ModEq.modEq_natAbs",
      "AddCommGroup.Int.ModEq.ModEq.modEq_zero_iff",
      "AddCommGroup.Int.ModEq.ModEq.mod_coprime",
      "AddCommGroup.Int.ModEq.ModEq.mul_left'",
      "AddCommGroup.Int.ModEq.ModEq.sub_modulus_modEq_iff",
      "AddCommGroup.Int.ModEq.ModEq.sub_modulus_mul_modEq_iff",
      "AddCommGroup.Int.ModEq.modEq_neg",
      "AddCommGroup.Int.ModEq.neg_modEq_neg",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.add_div_of_dvd_left",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.add_mod_add_ite",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.add_mod_of_add_mod_lt",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.gcd_eq",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.modEq_and_modEq_iff_modEq_mul",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.odd_mul_odd_div_two",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.odd_of_mod_four_eq_one",
      "AddCommGroup.Nat.ModEq.ModEq.add_left_cancel",
      "AddCommGroup.Nat.ModEq.ModEq.add_modEq_right",
      "AddCommGroup.Nat.ModEq.ModEq.add_modEq_right_iff",
      "AddCommGroup.Nat.ModEq.ModEq.mul_left_cancel'",
      "AddCommGroup.Nat.ModEq.ModEq.mul_right'",
      "AddCommGroup.Nat.ModEq.ModEq.of_mul_left",
      "AddCommGroup.Nat.ModEq.ModEq.right_modEq_add_iff",
      "AddCommGroup.modEq_iff_natModEq",
      "Bool.and_intro",
      "Bool.and_le_right",
      "Bool.coe_sort_true",
      "Bool.decide_iff",
      "Bool.dichotomy",
      "Bool.eq_false_eq_not_eq_true",
      "Bool.eq_false_of_not_eq_true'",
      "Bool.le_and",
      "Bool.or_le",
      "Bool.right_le_or",
      "Bool.self_ne_not",
      "Bool.toNat_bne_one",
      "Bool.toNat_bne_zero",
      "Bool.toNat_le_toNat",
      "Even.add_odd",
      "Even.mul_left",
      "Even.neg_pow",
      "Even.of_isUnit_two",
      "Even.sub_odd",
      "Finset.Multiset.List.Finset.Equiv.Finset.union_symm_left",
      "Finset.Multiset.List.Finset.Equiv.Finset.union_symm_right",
      "Finset.Multiset.List.Finset.Equiv.Multiset.Finset.mem_union_of_disjoint",
      "Finset.Multiset.List.Finset.Equiv.Multiset.toFinset_replicate",
      "Finset.Multiset.List.Finset.Equiv.piFinsetUnion_right",
      "Finset.Multiset.List.Finset.empty_toList",
      "Finset.Multiset.List.Finset.pairwise_cons'",
      "Finset.Multiset.List.toFinset_replicate_of_ne_zero",
      "Finset.Multiset.List.toFinset_union",
      "Finset.Multiset.toFinset_filter",
      "Finset.Nontrivial.erase_nonempty",
      "Finset.coe_eq_singleton",
      "Finset.coe_pair",
      "Finset.coe_singleton",
      "Finset.compls_infs",
      "Finset.compls_sups",
      "Finset.cons_eq_insert",
      "Finset.dens_eq_sum_dens_fiberwise",
      "Finset.disjSups_assoc",
      "Finset.disjSups_disjSups_disjSups_comm",
      "Finset.disjSups_left_comm",
      "Finset.disjSups_union_left",
      "Finset.disjUnion_eq_union",
      "Finset.disjoint_disjUnion_right",
      "Finset.disjoint_or_nonempty_inter",
      "Finset.erase_cons_of_ne",
      "Finset.erase_injOn'",
      "Finset.erase_inter_comm",
      "Finset.erase_sdiff_comm",
      "Finset.erase_sdiff_distrib",
      "Finset.erase_ssubset",
      "Finset.even_sum_iff_even_card_odd",
      "Finset.filter_and",
      "Finset.filter_and_not",
      "Finset.filter_insert",
      "Finset.filter_mem_eq_inter",
      "Finset.filter_or",
      "Finset.filter_sups_le",
      "Finset.infs_compls_eq_diffs",
      "Finset.insert_comm",
      "Finset.insert_eq_self",
      "Finset.insert_erase",
      "Finset.insert_idem",
      "Finset.insert_subset_insert",
      "Finset.insert_subset_insert_iff",
      "Finset.mem_diffs",
      "Finset.nonempty_mk",
      "Finset.not_nontrivial_singleton",
      "Finset.odd_sum_iff_odd_card_odd",
      "Finset.pairwiseDisjoint_iff",
      "Finset.prod_eraseNone",
      "Finset.prod_insertNone",
      "Finset.range_union_range",
      "Finset.sdiff_eq_filter",
      "Finset.sdiff_insert_insert_of_mem_of_notMem",
      "Finset.singleton_iff_unique_mem",
      "Finset.singleton_subset_set_iff",
      "Finset.singleton_subset_singleton",
      "Finset.subset_insert_iff",
      "Finset.subset_insert_iff_of_notMem",
      "Finset.sups_eq_self",
      "Finset.union_erase_of_mem",
      "HasSubset.Subset.diff_ssubset_of_nonempty",
      "Int.exists_mul_self",
      "Int.mul_ediv_le_mul_ediv_assoc",
      "Int.natAbs_lt_iff_mul_self_lt",
      "Int.nonneg_or_nonpos_of_mul_nonneg",
      "Int.sqrt_natCast",
      "Int.succ_dvd_or_succ_dvd_of_succ_sum_dvd_mul",
      "List.Nodup.cyclicPermutations",
      "List.Nodup.rotate_congr",
      "List.Nodup.rotate_eq_self_iff",
      "List.countP_diff",
      "List.countP_erase",
      "List.count_map_of_injective",
      "List.cyclicPermutations_ne_nil",
      "List.forall_mem_zipIdx'",
      "List.getElem_eq_getElem_rotate",
      "List.head?_rotate",
      "List.head_cyclicPermutations",
      "List.isRotated_append",
      "List.isRotated_cyclicPermutations_iff",
      "List.isRotated_iff_mem_map_range",
      "List.isRotated_nil_iff",
      "List.isRotated_reverse_comm_iff",
      "List.isRotated_singleton_iff'",
      "List.iterate_eq_nil",
      "List.length_cyclicPermutations_cons",
      "List.length_cyclicPermutations_of_ne_nil",
      "List.length_rotate",
      "List.mem_iterate",
      "List.rotate'_mod",
      "List.rotate'_nil",
      "List.rotate'_rotate'",
      "List.rotate_eq_drop_append_take_mod",
      "List.rotate_eq_iff",
      "List.rotate_eq_singleton_iff",
      "List.rotate_length",
      "List.rotate_length_mul",
      "List.rotate_mod",
      "List.rotate_perm",
      "List.rotate_replicate",
      "List.zipWith_rotate_one",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.NNReal.Real.sum_mul_le_sqrt_mul_sqrt",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.NNReal.sum_sqrt_mul_sqrt_le",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.div_sqrt",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.floor_real_sqrt_eq_nat_sqrt",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.inv_sqrt_two_sub_one",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.lt_sq_of_sqrt_lt",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.sq_lt",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.sqrt_mul",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.sqrt_one_add_le",
      "NNReal.Real.coe_sqrt",
      "NNReal.Real.map_sqrt_atTop",
      "NNReal.Real.mul_self_sqrt",
      "NNReal.Real.sqrt_eq_cases",
      "NNReal.Real.sqrt_eq_iff_eq_sq",
      "NNReal.Real.sqrt_eq_iff_mul_self_eq",
      "NNReal.Real.sqrt_eq_zero_of_nonpos",
      "NNReal.Real.sqrt_le_one",
      "NNReal.Real.sqrt_lt_sqrt_iff_of_pos",
      "NNReal.Real.sqrt_ne_zero'",
      "NNReal.Real.sqrt_sq",
      "NNReal.sqrt_le_one",
      "NNReal.sqrt_one",
      "NNReal.sqrt_pos",
      "NNReal.sqrt_zero",
      "Nat.Function.Involutive.iterate_even",
      "Nat.Function.Involutive.iterate_two_mul",
      "Nat.Function.Involutive.neg_one_pow_eq_one_iff_even",
      "Nat.Function.Involutive.neg_one_zpow_eq_ite",
      "Nat.Odd.sub_odd",
      "Nat.Prime.coprime_choose_of_lt",
      "Nat.Prime.dvd_choose_add",
      "Nat.Prime.dvd_factorial",
      "Nat.Prime.dvd_iff_eq",
      "Nat.Prime.factorization_self",
      "Nat.Prime.pow_inj'",
      "Nat.card_multiples",
      "Nat.card_units",
      "Nat.cast_div_charZero",
      "Nat.cast_div_div_div_cancel_right",
      "Nat.coprime_fintype_prod_right_iff",
      "Nat.coprime_multiset_prod_right_iff",
      "Nat.coprime_prod_left_iff",
      "Nat.coprime_prod_right_iff",
      "Nat.coprime_two_left",
      "Nat.dvd_iff_prime_pow_dvd_dvd",
      "Nat.dvd_prime_pow",
      "Nat.eq_factorization_iff",
      "Nat.eq_one_iff_not_exists_prime_dvd",
      "Nat.eq_prime_pow_of_dvd_least_prime_pow",
      "Nat.even_or_odd'",
      "Nat.exists_eq_pow_of_pow_eq_pow",
      "Nat.factorization_eq_zero_iff'",
      "Nat.factorization_le_of_le_pow",
      "Nat.factorization_lt",
      "Nat.mod_two_add_add_odd_mod_two",
      "Nat.mod_two_add_succ_mod_two",
      "Nat.not_odd_zero",
      "Nat.odd_iff",
      "Nat.ordCompl_dvd_ordCompl_iff_dvd",
      "Nat.ordCompl_self_pow_mul",
      "Nat.ordProj_dvd_ordProj_of_dvd",
      "Nat.pred_eq_ppred",
      "Nat.prod_pow_primeFactors_factorization",
      "Nat.prod_primeFactors_gcd_mul_prod_primeFactors_mul",
      "Nat.psub_eq_none",
      "Nat.sub_eq_psub",
      "Odd.not_two_dvd_nat",
      "Odd.pow_add_pow_eq_zero",
      "Odd.sub_odd",
      "Rat.exists_mul_self",
      "Rat.sqrt_natCast",
      "Set.Ico_eq_Ico_iff",
      "Set.Ico_union_Ici",
      "Set.Ico_union_Ico",
      "Set.Iic_diff_Ioc",
      "Set.Iio_diff_Iic",
      "Set.Iio_subset_Iic_iff",
      "Set.Iio_union_Ico'",
      "Set.Iio_union_Ioo",
      "Set.Iio_union_Ioo'",
      "Set.Ioc_inter_Ioi",
      "Set.Ioc_inter_Ioo_of_left_lt",
      "Set.Ioc_subset_Ioc_iff",
      "Set.Ioc_union_Ioc_left",
      "Set.Ioc_union_Ioc_right",
      "Set.Ioc_union_Ioi'",
      "Set.Ioo_inter_Ioc_of_right_lt",
      "Set.Ioo_inter_Ioi",
      "Set.Ioo_subset_Ioo_iff",
      "Set.Ioo_union_Ioi",
      "Set.Ioo_union_Ioo'",
      "Set.diff_eq_compl_inter",
      "Set.diff_insert_of_notMem",
      "Set.diff_singleton_eq_self",
      "Set.diff_union_inter",
      "Set.insert_diff_of_mem",
      "Set.insert_diff_of_notMem",
      "Set.insert_diff_singleton",
      "Set.inter_compl_nonempty_iff",
      "Set.ite_empty",
      "Set.ite_eq_of_subset_right",
      "Set.ite_inter_compl_self",
      "Set.ite_univ",
      "Set.ncard_Ioc_nat",
      "Set.ncard_Ioo_nat",
      "Set.ncard_uIcc_nat",
      "Set.pair_diff_left",
      "Set.pair_diff_right",
      "Set.subset_insert_iff",
      "Set.union_symmDiff_subset",
      "SetRel.Function.graph_id",
      "SetRel.cod_empty",
      "SetRel.comp_empty",
      "SetRel.comp_sUnion",
      "SetRel.comp_univ",
      "SetRel.dom_univ",
      "SetRel.empty_comp",
      "SetRel.iUnion_comp",
      "SetRel.id_comp",
      "SetRel.id_subset",
      "SetRel.image_empty_left",
      "SetRel.image_eq_biUnion",
      "SetRel.image_univ_right",
      "SetRel.inter_dom_subset_preimage_image",
      "SetRel.inv_eq_self",
      "SetRel.preimage_empty_left",
      "SetRel.preimage_eq_image",
      "SetRel.preimage_inter_cod",
      "SetRel.preimage_sUnion",
      "SetRel.preimage_union",
      "SetRel.prod_comp_prod",
      "SetRel.right_subset_comp",
      "compl_eq_comm",
      "compl_le_self",
      "even_neg_two",
      "even_two",
      "himp_eq_left",
      "inf_sdiff_eq_bot_iff",
      "inf_sdiff_left_comm",
      "isUnit_two_iff_forall_even",
      "le_sdiff",
      "odd_add_one_self",
      "odd_add_self_one'",
      "sdiff_eq_right",
      "sdiff_inf_right_comm",
      "sdiff_inf_sdiff",
      "sdiff_sdiff_eq_self",
      "sdiff_sdiff_right'",
      "sdiff_sdiff_sup_sdiff",
      "sdiff_unique",
      "sup_inf_inf_compl",
      "sup_inf_inf_sdiff"
    ]
  }
}