{
  "baselines": {
    "keyword_heuristic": {
      "accuracy": 0.16923076923076924,
      "macro_f1": 0.01763611891757059,
      "top1_accuracy": 0.16923076923076924,
      "top3_accuracy": 0.4671328671328671,
      "top5_accuracy": 0.6041958041958042
    },
    "majority_class": {
      "accuracy": 0.2055944055944056,
      "macro_f1": 0.0069605568445475635,
      "top1_accuracy": 0.2055944055944056,
      "top3_accuracy": 0.48951048951048953,
      "top5_accuracy": 0.6
    },
    "text_naive_bayes": {
      "accuracy": 0.2853146853146853,
      "macro_f1": 0.03806421638782837,
      "top1_accuracy": 0.2853146853146853,
      "top3_accuracy": 0.5650349650349651,
      "top5_accuracy": 0.6531468531468532
    },
    "tfidf_linear_svm": {
      "accuracy": 0.16643356643356644,
      "macro_f1": 0.0816352331087155,
      "top1_accuracy": 0.16643356643356644,
      "top3_accuracy": 0.3412587412587413,
      "top5_accuracy": 0.4979020979020979
    },
    "tfidf_logistic_regression": {
      "accuracy": 0.1020979020979021,
      "macro_f1": 0.05514314414808752,
      "top1_accuracy": 0.1020979020979021,
      "top3_accuracy": 0.22237762237762237,
      "top5_accuracy": 0.3356643356643357
    }
  },
  "label_distribution": {
    "ac_rfl": 19,
    "aesop": 67,
    "all_goals": 2,
    "apply": 31,
    "by_cases": 12,
    "by_cases!": 1,
    "by_contra": 5,
    "by_contra!": 2,
    "calc": 8,
    "cases": 17,
    "choose": 1,
    "classical": 5,
    "congr": 3,
    "constructor": 17,
    "contradiction": 1,
    "contrapose!": 5,
    "conv_lhs": 5,
    "conv_rhs": 4,
    "convert": 13,
    "decide": 23,
    "dsimp": 2,
    "exact": 207,
    "exacts": 2,
    "exists": 2,
    "ext": 31,
    "ext1": 1,
    "fun_prop": 1,
    "gcongr": 3,
    "grind": 182,
    "grw": 5,
    "have": 61,
    "if": 13,
    "induction": 24,
    "injection": 1,
    "intro": 31,
    "let": 10,
    "letI": 1,
    "lia": 18,
    "linarith": 1,
    "norm_cast": 2,
    "nth_rw": 3,
    "obtain": 47,
    "positivity": 3,
    "push": 1,
    "push_neg": 1,
    "rcases": 47,
    "refine": 64,
    "replace": 2,
    "revert": 1,
    "rfl": 14,
    "right": 2,
    "ring": 1,
    "rintro": 41,
    "rw": 487,
    "rw!": 2,
    "rwa": 30,
    "set": 2,
    "show": 2,
    "simp": 423,
    "simp_all": 14,
    "simp_all!": 3,
    "simp_rw": 40,
    "simpa": 84,
    "specialize": 1,
    "split_ifs": 5,
    "subst": 9,
    "suffices": 6,
    "symm": 2,
    "tauto": 2,
    "unfold": 8,
    "use": 12,
    "zify": 1
  },
  "representation": "structured",
  "split": {
    "n_rows": 2199,
    "n_test": 715,
    "n_test_theorems": 307,
    "n_train": 1484,
    "n_train_theorems": 715,
    "seed": 1,
    "strategy": "theorem-level random split",
    "test_ratio": 0.3,
    "test_theorems": [
      "AddCommGroup.Int.ModEq.ModEq.add",
      "AddCommGroup.Int.ModEq.ModEq.add_modEq_right",
      "AddCommGroup.Int.ModEq.ModEq.add_modulus_modEq_iff",
      "AddCommGroup.Int.ModEq.ModEq.add_modulus_mul_modEq_iff",
      "AddCommGroup.Int.ModEq.ModEq.cancel_right_div_gcd",
      "AddCommGroup.Int.ModEq.ModEq.existsUnique_equiv",
      "AddCommGroup.Int.ModEq.ModEq.modEq_add_fac_self",
      "AddCommGroup.Int.ModEq.ModEq.modEq_and_modEq_iff_modEq_lcm",
      "AddCommGroup.Int.ModEq.ModEq.modEq_iff_eq_of_div_eq",
      "AddCommGroup.Int.ModEq.ModEq.mod_coprime",
      "AddCommGroup.Int.ModEq.ModEq.modulus_mul_add_modEq_iff",
      "AddCommGroup.Int.ModEq.ModEq.mul_left_cancel'",
      "AddCommGroup.Int.ModEq.ModEq.right_modEq_add_iff",
      "AddCommGroup.Int.ModEq.ModEq.sub_modulus_modEq_iff",
      "AddCommGroup.Int.ModEq.ModEq.sub_modulus_mul_modEq_iff",
      "AddCommGroup.Int.ModEq.modEq_iff_dvd",
      "AddCommGroup.Int.ModEq.modEq_neg",
      "AddCommGroup.Int.ModEq.modEq_zero_iff_dvd",
      "AddCommGroup.Int.ModEq.natCast_modEq_iff",
      "AddCommGroup.Int.ModEq.neg_modEq_neg",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.add_div_eq_of_add_mod_lt",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.add_div_eq_of_le_mod_add_mod",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.add_div_of_dvd_right",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.cancel_left_div_gcd",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.cancel_left_of_coprime",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.cancel_right_div_gcd",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.coprime_of_mul_modEq_one",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.le_mod_add_mod_of_dvd_add_of_not_dvd",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.odd_mod_four_iff",
      "AddCommGroup.Nat.ModEq.ModEq.add_modEq_left",
      "AddCommGroup.Nat.ModEq.ModEq.add_mul_modulus_modEq_iff",
      "AddCommGroup.Nat.ModEq.ModEq.modEq_add_modulus_mul_iff",
      "AddCommGroup.Nat.ModEq.ModEq.modEq_add_mul_modulus_iff",
      "AddCommGroup.Nat.ModEq.ModEq.modEq_zero_iff",
      "AddCommGroup.Nat.ModEq.ModEq.mul_left_cancel'",
      "AddCommGroup.Nat.ModEq.ModEq.right_modEq_add_iff",
      "AddCommGroup.Nat.ModEq.modEq_iff_dvd'",
      "Associated.neg_left",
      "Bool.and_eq_false_eq_eq_false_or_eq_false",
      "Bool.and_eq_true_eq_eq_true_and_eq_true",
      "Bool.coe_sort_false",
      "Bool.coe_xor_iff",
      "Bool.decide_iff",
      "Bool.dichotomy",
      "Bool.eq_true_of_not_eq_false'",
      "Bool.false_eq_true_eq_False",
      "Bool.injective_iff",
      "Bool.le_iff_imp",
      "Bool.or_eq_false_eq_eq_false_and_eq_false",
      "Bool.or_eq_true_eq_eq_true_or_eq_true",
      "Bool.toNat_beq_zero",
      "Bool.toNat_le_toNat",
      "Bool.true_eq_false_eq_False",
      "Disjoint.sdiff_eq_of_sup_eq",
      "Even.add_odd",
      "Even.mul_right",
      "Finset.Multiset.List.Finset.Equiv.Multiset.Finset.univ_finset_of_isEmpty",
      "Finset.Multiset.List.Finset.Equiv.piFinsetUnion_left",
      "Finset.Multiset.List.Finset.Equiv.piFinsetUnion_right",
      "Finset.Multiset.List.toFinset_eq_empty_iff",
      "Finset.Multiset.List.toFinset_filter",
      "Finset.Multiset.List.toFinset_inter",
      "Finset.Multiset.toFinset_nonempty",
      "Finset.Multiset.toFinset_singleton",
      "Finset.Nonempty.of_disjSups_left",
      "Finset.Nontrivial.ne_singleton",
      "Finset.card_preimage_eq_sum_card_image_eq",
      "Finset.coe_pair",
      "Finset.coe_subset_singleton",
      "Finset.compls_sups",
      "Finset.cons_eq_insert",
      "Finset.cons_induction",
      "Finset.cons_subset_cons",
      "Finset.dens_biUnion",
      "Finset.dens_disjiUnion",
      "Finset.disjSups_inter_subset_left",
      "Finset.disjSups_right_comm",
      "Finset.disjSups_union_left",
      "Finset.disjUnion_eq_union",
      "Finset.disjoint_erase_insert",
      "Finset.disjoint_filter",
      "Finset.disjoint_insert_erase",
      "Finset.disjoint_of_erase_right",
      "Finset.eq_singleton_iff_unique_mem",
      "Finset.erase_eq_empty_iff",
      "Finset.erase_insert_eq_erase",
      "Finset.erase_insert_of_ne",
      "Finset.erase_sdiff_comm",
      "Finset.erase_ssubset",
      "Finset.erase_ssubset_insert",
      "Finset.erase_subset_iff_of_mem",
      "Finset.filter_erase",
      "Finset.filter_insert",
      "Finset.filter_inter",
      "Finset.filter_mem_eq_inter",
      "Finset.filter_or",
      "Finset.forall_mem_insert",
      "Finset.insert_inter_distrib",
      "Finset.insert_val_of_notMem",
      "Finset.inter_filter",
      "Finset.mem_disjSups",
      "Finset.mem_insert_coe",
      "Finset.nonempty_mk",
      "Finset.powerset_infs_powerset_self",
      "Finset.powerset_inter",
      "Finset.powerset_sups_powerset_self",
      "Finset.prod_eraseNone",
      "Finset.range_filter_eq",
      "Finset.range_inter_range",
      "Finset.sdiff_erase",
      "Finset.sdiff_singleton_eq_erase",
      "Finset.sdiff_union_erase_cancel",
      "Finset.subset_insert_iff",
      "Finset.sups_eq_self",
      "Finset.union_erase_of_mem",
      "Int.Prime.dvd_natAbs_of_coe_dvd_sq",
      "Int.abs_le_sqrt",
      "Int.fdiv_fdiv_eq_fdiv_mul",
      "Int.mul_ediv_le_mul_ediv_assoc",
      "Int.nonneg_or_nonpos_of_mul_nonneg",
      "List.IsRotated.cyclicPermutations",
      "List.IsRotated.map",
      "List.IsRotated.symm",
      "List.Nodup.rotate_eq_self_iff",
      "List.countP_erase",
      "List.cyclicPermutations_rotate",
      "List.getElem_rotate",
      "List.get_cyclicPermutations",
      "List.isRotated_append",
      "List.isRotated_cyclicPermutations_iff",
      "List.isRotated_iff_mem_map_range",
      "List.isRotated_reverse_iff",
      "List.isRotated_singleton_iff'",
      "List.iterate_add",
      "List.length_cyclicPermutations_cons",
      "List.length_iterate",
      "List.mem_rotate",
      "List.rotate'_length_mul",
      "List.rotate'_nil",
      "List.rotate'_rotate'",
      "List.rotate'_zero",
      "List.rotate_append_length_eq",
      "List.rotate_eq_drop_append_take",
      "List.rotate_eq_drop_append_take_mod",
      "List.rotate_eq_nil_iff",
      "List.rotate_eq_singleton_iff",
      "List.rotate_one_eq_self_iff_eq_replicate",
      "List.rotate_perm",
      "List.rotate_replicate",
      "List.rotate_rotate",
      "List.rotate_zero",
      "Multiset.sum_map_div",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.NNReal.sum_sqrt_mul_sqrt_le",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.inv_sqrt_two_sub_one",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.lt_sq_of_sqrt_lt",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.sqrt_mul'",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.sqrt_prod",
      "NNReal.Real.abs_le_sqrt",
      "NNReal.Real.comap_sqrt_atTop",
      "NNReal.Real.mul_self_sqrt",
      "NNReal.Real.sq_le",
      "NNReal.Real.sq_sqrt",
      "NNReal.Real.sqrt_eq_iff_mul_self_eq",
      "NNReal.Real.sqrt_eq_one",
      "NNReal.Real.sqrt_eq_zero_of_nonpos",
      "NNReal.Real.sqrt_le_iff",
      "NNReal.Real.sqrt_le_sqrt_iff",
      "NNReal.Real.sqrt_nonneg",
      "NNReal.one_le_sqrt",
      "NNReal.sqrt_pos",
      "Nat.Function.Involutive.Even.neg_one_zpow",
      "Nat.Function.Involutive.iterate_odd",
      "Nat.Function.Involutive.neg_one_pow_congr",
      "Nat.Function.Involutive.neg_one_pow_eq_ite",
      "Nat.Odd.sub_odd",
      "Nat.Prime.coprime_choose_of_lt",
      "Nat.Prime.dvd_choose_add",
      "Nat.Prime.dvd_iff_one_le_factorization",
      "Nat.Prime.mod_two_eq_one_iff_ne_two",
      "Nat.Prime.mul_eq_prime_sq_iff",
      "Nat.Prime.not_coprime_iff_dvd",
      "Nat.Prime.not_dvd_mul",
      "Nat.Prime.pow_inj",
      "Nat.card_multiples'",
      "Nat.coprime_of_lt_minFac",
      "Nat.dvd_iff_div_factorization_eq_tsub",
      "Nat.dvd_of_forall_prime_mul_dvd",
      "Nat.dvd_ordCompl_of_dvd_not_dvd",
      "Nat.eq_one_iff_not_exists_prime_dvd",
      "Nat.eq_pow_of_factorization_eq_single",
      "Nat.eq_prime_pow_of_dvd_least_prime_pow",
      "Nat.even_div",
      "Nat.even_sub'",
      "Nat.even_xor_odd",
      "Nat.exists_factorization_lt_of_lt",
      "Nat.factorization_le_factorization_mul_left",
      "Nat.factorization_lt",
      "Nat.factorization_ordCompl",
      "Nat.factorization_prime_le_iff_dvd",
      "Nat.mod_two_add_add_odd_mod_two",
      "Nat.not_even_two_mul_add_one",
      "Nat.odd_sub",
      "Nat.odd_sub'",
      "Nat.one_add_div_two_mul_two_of_odd",
      "Nat.ordCompl_dvd_ordCompl_of_dvd",
      "Nat.ordCompl_mul",
      "Nat.ordCompl_of_not_prime",
      "Nat.ordCompl_pos",
      "Nat.ordProj_dvd_ordProj_of_dvd",
      "Nat.ordProj_mul",
      "Nat.ordProj_of_not_prime",
      "Nat.ppred_eq_none",
      "Nat.ppred_eq_some",
      "Nat.prime_mul_iff",
      "Nat.prod_primeFactors_dvd",
      "Nat.psub'_eq_psub",
      "Nat.psub_add",
      "Nat.sub_eq_psub",
      "Nat.succ_dvd_or_succ_dvd_of_succ_sum_dvd_mul",
      "Odd.add_odd",
      "Odd.map",
      "Odd.not_two_dvd_nat",
      "Rat.exists_mul_self",
      "Set.Icc_union_Ici",
      "Set.Ici_diff_Ici",
      "Set.Ici_diff_Ioi",
      "Set.Ico_diff_Iio",
      "Set.Ico_inter_Iio",
      "Set.Ico_union_Ici",
      "Set.Ico_union_Ici'",
      "Set.Ico_union_Ico",
      "Set.Ico_union_Ico'",
      "Set.Iic_diff_Iic",
      "Set.Iic_diff_Iio",
      "Set.Iic_union_Icc",
      "Set.Iio_diff_Iic",
      "Set.Iio_union_Ico",
      "Set.Ioc_inter_Ioc",
      "Set.Ioc_inter_Ioo_of_left_lt",
      "Set.Ioc_subset_Ioc_iff",
      "Set.Ioi_diff_Ici",
      "Set.Ioi_subset_Ioi_iff",
      "Set.Ioo_inter_Ioc_of_left_le",
      "Set.Ioo_inter_Ioi",
      "Set.Ioo_inter_Ioo",
      "Set.Ioo_union_Ioo",
      "Set.compl_union_self",
      "Set.diff_eq_compl_inter",
      "Set.diff_singleton_eq_self",
      "Set.diff_singleton_ssubset",
      "Set.diff_singleton_subset_iff",
      "Set.diff_union_inter",
      "Set.insert_diff_of_mem",
      "Set.inter_diff_right_comm",
      "Set.ite_eq_of_subset_left",
      "Set.ite_inter_of_inter_eq",
      "Set.ite_left",
      "Set.ite_right",
      "Set.ncard_Ioo_nat",
      "Set.ssubset_iff_sdiff_singleton",
      "Set.subset_insert_diff_singleton",
      "Set.subset_insert_iff",
      "SetRel.Function.Set.preimage_eq",
      "SetRel.Function.SetRel.exists_graph_eq_iff",
      "SetRel.Function.graph_comp",
      "SetRel.Function.graph_id",
      "SetRel.cod_empty",
      "SetRel.comp_assoc",
      "SetRel.comp_iUnion",
      "SetRel.comp_sUnion",
      "SetRel.comp_univ",
      "SetRel.core_comp",
      "SetRel.core_id",
      "SetRel.core_inter",
      "SetRel.dom_eq_empty_iff",
      "SetRel.dom_univ",
      "SetRel.exists_eq_singleton_of_prod_subset_id",
      "SetRel.id_comp",
      "SetRel.image_inter_dom",
      "SetRel.inv_eq_self",
      "SetRel.inv_id",
      "SetRel.preimage_comp",
      "SetRel.preimage_eq_image",
      "SetRel.preimage_id",
      "SetRel.preimage_union",
      "SetRel.preimage_univ_left",
      "SetRel.prod_comp_prod_of_inter_nonempty",
      "SetRel.prod_subset_comm",
      "compl_eq_iff_isCompl",
      "eq_compl_comm",
      "even_add_one",
      "even_iff_two_dvd",
      "even_sub_one",
      "even_sub_two",
      "even_two",
      "inf_sdiff_distrib_right",
      "le_iff_eq_sup_sdiff",
      "odd_sub_one",
      "odd_sub_two",
      "sdiff_inf_right_comm",
      "sdiff_sdiff_left'",
      "sdiff_sdiff_right",
      "sdiff_sdiff_sup_sdiff",
      "star_finsuppProd",
      "sup_lt_of_lt_sdiff_left",
      "sup_lt_of_lt_sdiff_right",
      "sup_sdiff_inf"
    ]
  }
}