{
  "baselines": {
    "keyword_heuristic": {
      "accuracy": 0.19224806201550387,
      "macro_f1": 0.031240450480646564,
      "top1_accuracy": 0.19224806201550387,
      "top3_accuracy": 0.4790697674418605,
      "top5_accuracy": 0.6465116279069767
    },
    "majority_class": {
      "accuracy": 0.22790697674418606,
      "macro_f1": 0.0084366391184573,
      "top1_accuracy": 0.22790697674418606,
      "top3_accuracy": 0.5116279069767442,
      "top5_accuracy": 0.6403100775193798
    },
    "text_naive_bayes": {
      "accuracy": 0.2806201550387597,
      "macro_f1": 0.05681881933899414,
      "top1_accuracy": 0.2806201550387597,
      "top3_accuracy": 0.5751937984496124,
      "top5_accuracy": 0.6759689922480621
    },
    "tfidf_linear_svm": {
      "accuracy": 0.16899224806201552,
      "macro_f1": 0.07665795590755173,
      "top1_accuracy": 0.16899224806201552,
      "top3_accuracy": 0.34418604651162793,
      "top5_accuracy": 0.4992248062015504
    },
    "tfidf_logistic_regression": {
      "accuracy": 0.08837209302325581,
      "macro_f1": 0.05289446754647466,
      "top1_accuracy": 0.08837209302325581,
      "top3_accuracy": 0.21705426356589147,
      "top5_accuracy": 0.34108527131782945
    }
  },
  "label_distribution": {
    "ac_rfl": 19,
    "aesop": 67,
    "all_goals": 2,
    "apply": 31,
    "by_cases": 12,
    "by_cases!": 1,
    "by_contra": 5,
    "by_contra!": 2,
    "calc": 8,
    "cases": 17,
    "choose": 1,
    "classical": 5,
    "congr": 3,
    "constructor": 17,
    "contradiction": 1,
    "contrapose!": 5,
    "conv_lhs": 5,
    "conv_rhs": 4,
    "convert": 13,
    "decide": 23,
    "dsimp": 2,
    "exact": 207,
    "exacts": 2,
    "exists": 2,
    "ext": 31,
    "ext1": 1,
    "fun_prop": 1,
    "gcongr": 3,
    "grind": 182,
    "grw": 5,
    "have": 61,
    "if": 13,
    "induction": 24,
    "injection": 1,
    "intro": 31,
    "let": 10,
    "letI": 1,
    "lia": 18,
    "linarith": 1,
    "norm_cast": 2,
    "nth_rw": 3,
    "obtain": 47,
    "positivity": 3,
    "push": 1,
    "push_neg": 1,
    "rcases": 47,
    "refine": 64,
    "replace": 2,
    "revert": 1,
    "rfl": 14,
    "right": 2,
    "ring": 1,
    "rintro": 41,
    "rw": 487,
    "rw!": 2,
    "rwa": 30,
    "set": 2,
    "show": 2,
    "simp": 423,
    "simp_all": 14,
    "simp_all!": 3,
    "simp_rw": 40,
    "simpa": 84,
    "specialize": 1,
    "split_ifs": 5,
    "subst": 9,
    "suffices": 6,
    "symm": 2,
    "tauto": 2,
    "unfold": 8,
    "use": 12,
    "zify": 1
  },
  "representation": "structured",
  "split": {
    "n_rows": 2199,
    "n_test": 645,
    "n_test_theorems": 307,
    "n_train": 1554,
    "n_train_theorems": 715,
    "seed": 2,
    "strategy": "theorem-level random split",
    "test_ratio": 0.3,
    "test_theorems": [
      "AddCommGroup.Int.ModEq.ModEq.add_modEq_left",
      "AddCommGroup.Int.ModEq.ModEq.add_modulus_modEq_iff",
      "AddCommGroup.Int.ModEq.ModEq.add_modulus_mul_modEq_iff",
      "AddCommGroup.Int.ModEq.ModEq.add_right_cancel",
      "AddCommGroup.Int.ModEq.ModEq.cancel_left_div_gcd",
      "AddCommGroup.Int.ModEq.ModEq.dvd_iff",
      "AddCommGroup.Int.ModEq.ModEq.existsUnique_equiv",
      "AddCommGroup.Int.ModEq.ModEq.gcd_a_modEq",
      "AddCommGroup.Int.ModEq.ModEq.modEq_add_mul_modulus_iff",
      "AddCommGroup.Int.ModEq.ModEq.modEq_modulus_add_iff",
      "AddCommGroup.Int.ModEq.ModEq.modEq_natAbs",
      "AddCommGroup.Int.ModEq.ModEq.modEq_zero_iff",
      "AddCommGroup.Int.ModEq.ModEq.modulus_add_modEq_iff",
      "AddCommGroup.Int.ModEq.ModEq.mul_modulus_add_modEq_iff",
      "AddCommGroup.Int.ModEq.ModEq.mul_right_cancel'",
      "AddCommGroup.Int.ModEq.ModEq.neg",
      "AddCommGroup.Int.ModEq.ModEq.sub_modulus_modEq_iff",
      "AddCommGroup.Int.ModEq.modEq_iff_add_fac",
      "AddCommGroup.Int.ModEq.natCast_modEq_iff",
      "AddCommGroup.Int.ModEq.neg_modEq_neg",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.add_div_eq_of_le_mod_add_mod",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.add_div_of_dvd_right",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.add_le_of_lt",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.add_mod_add_ite",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.add_mod_of_add_mod_lt",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.cancel_right_of_coprime",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.coprime_of_mul_modEq_one",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.modEq_iff_eq_of_div_eq",
      "AddCommGroup.Nat.ModEq.ModEq.add",
      "AddCommGroup.Nat.ModEq.ModEq.add_modEq_left_iff",
      "AddCommGroup.Nat.ModEq.ModEq.add_modEq_right",
      "AddCommGroup.Nat.ModEq.ModEq.add_modEq_right_iff",
      "AddCommGroup.Nat.ModEq.ModEq.modEq_add_modulus_mul_iff",
      "AddCommGroup.Nat.ModEq.ModEq.modEq_add_mul_modulus_iff",
      "AddCommGroup.Nat.ModEq.ModEq.modEq_iff_exists_eq_add",
      "AddCommGroup.Nat.ModEq.ModEq.modEq_sub",
      "AddCommGroup.Nat.ModEq.ModEq.modEq_sub_modulus_iff",
      "AddCommGroup.Nat.ModEq.ModEq.modulus_mul_add_modEq_iff",
      "AddCommGroup.Nat.ModEq.ModEq.mul_left'",
      "AddCommGroup.Nat.ModEq.ModEq.mul_right'",
      "AddCommGroup.Nat.ModEq.ModEq.pow",
      "AddCommGroup.Nat.ModEq.ModEq.sub_modulus_modEq_iff",
      "AddCommGroup.intCast_modEq_intCast'",
      "AddCommGroup.modEq_iff_natModEq",
      "Bool.and_elim_right",
      "Bool.and_eq_true_eq_eq_true_and_eq_true",
      "Bool.and_intro",
      "Bool.and_le_right",
      "Bool.bne_eq_xor",
      "Bool.coe_xor_iff",
      "Bool.eq_not_iff",
      "Bool.eq_or_eq_not",
      "Bool.eq_true_eq_not_eq_false",
      "Bool.injective_iff",
      "Bool.le_iff_imp",
      "Bool.ofNat_le_ofNat",
      "Bool.toNat_bne_zero",
      "Even.of_isUnit_two",
      "Finset.Multiset.List.Finset.Equiv.Multiset.Finset.univ_finset_of_isEmpty",
      "Finset.Multiset.List.Finset.Equiv.Multiset.toFinset_replicate",
      "Finset.Multiset.List.toFinset_cons",
      "Finset.Multiset.List.toFinset_eq_empty_iff",
      "Finset.Multiset.List.toFinset_inter",
      "Finset.Multiset.List.toFinset_replicate_of_ne_zero",
      "Finset.Multiset.List.toFinset_union",
      "Finset.Multiset.toFinset_inter",
      "Finset.Multiset.toFinset_singleton",
      "Finset.Nonempty.cons_induction",
      "Finset.Nonempty.of_disjSups_left",
      "Finset.coe_eq_pair",
      "Finset.coe_eq_singleton",
      "Finset.coe_pair",
      "Finset.compls_compls",
      "Finset.cons_induction",
      "Finset.cons_subset_cons",
      "Finset.dens_biUnion_le",
      "Finset.diffs_compls_eq_infs",
      "Finset.disjSups_assoc",
      "Finset.disjSups_disjSups_disjSups_comm",
      "Finset.disjoint_disjUnion_right",
      "Finset.disjoint_erase_insert",
      "Finset.disjoint_insert_erase",
      "Finset.eq_singleton_iff_unique_mem",
      "Finset.erase_cons",
      "Finset.erase_injOn'",
      "Finset.erase_insert",
      "Finset.erase_insert_eq_erase",
      "Finset.erase_inter",
      "Finset.erase_sdiff_comm",
      "Finset.erase_sdiff_distrib",
      "Finset.erase_ssubset_insert",
      "Finset.erase_subset_iff_of_mem",
      "Finset.even_sum_iff_even_card_odd",
      "Finset.exists_compls_iff",
      "Finset.exists_mem_insert",
      "Finset.filter_and",
      "Finset.filter_and_not",
      "Finset.filter_erase",
      "Finset.filter_infs_le",
      "Finset.filter_insert",
      "Finset.filter_inter",
      "Finset.filter_mem_eq_inter",
      "Finset.filter_ne",
      "Finset.forall_mem_cons",
      "Finset.infs_compls_eq_diffs",
      "Finset.insert_inter_distrib",
      "Finset.map_infs",
      "Finset.map_sups",
      "Finset.mem_compls",
      "Finset.mem_infs",
      "Finset.ne_insert_of_notMem",
      "Finset.not_disjoint_iff_nonempty_inter",
      "Finset.odd_sum_iff_odd_card_odd",
      "Finset.pairwiseDisjoint_iff",
      "Finset.powerset_infs_powerset_self",
      "Finset.powerset_inter",
      "Finset.prod_insertNone",
      "Finset.range_inter_range",
      "Finset.sized_compls",
      "Finset.ssubset_iff_exists_subset_erase",
      "Finset.ssubset_singleton_iff",
      "Finset.univ_infs_univ",
      "Fintype.card_eq_card_units_add_one",
      "Int.mul_ediv_le_mul_ediv_assoc",
      "Int.natAbs_eq_iff_mul_self_eq",
      "List.IsRotated.cons_append_singleton",
      "List.IsRotated.cons_getLast_dropLast",
      "List.Nodup.rotate_eq_self_iff",
      "List.count_map_of_injective",
      "List.cyclicPermutations_rotate",
      "List.getElem?_iterate",
      "List.getElem_iterate",
      "List.get_cyclicPermutations",
      "List.get_eq_get_rotate",
      "List.head_cyclicPermutations",
      "List.isRotated_cyclicPermutations_iff",
      "List.isRotated_iff_mem_map_range",
      "List.isRotated_nil_iff'",
      "List.isRotated_reverse_iff",
      "List.isRotated_singleton_iff",
      "List.length_cyclicPermutations_cons",
      "List.rotate_append_length_eq",
      "List.rotate_eq_drop_append_take_mod",
      "List.rotate_eq_rotate'",
      "List.rotate_eq_self_iff_eq_replicate",
      "List.rotate_eq_singleton_iff",
      "List.rotate_nil",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.NNReal.Real.sum_mul_le_sqrt_mul_sqrt",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.NNReal.Real.sum_sqrt_mul_sqrt_le",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.NNReal.sum_sqrt_mul_sqrt_le",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.div_sqrt",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.floor_real_sqrt_eq_nat_sqrt",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.nat_sqrt_le_real_sqrt",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.real_sqrt_lt_nat_sqrt_succ",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.sqrt_div",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.sqrt_div'",
      "NNReal.Real.comap_sqrt_atTop",
      "NNReal.Real.mul_self_sqrt",
      "NNReal.Real.sqrt_eq_iff_mul_self_eq",
      "NNReal.Real.sqrt_eq_one",
      "NNReal.Real.sqrt_eq_zero",
      "NNReal.Real.sqrt_le_sqrt_iff",
      "NNReal.Real.sqrt_le_sqrt_iff'",
      "NNReal.Real.sqrt_mul_self_eq_abs",
      "NNReal.Real.sqrt_one",
      "NNReal.one_le_sqrt",
      "NNReal.sqrt_eq_one",
      "NNReal.sqrt_eq_zero",
      "NNReal.sqrt_mul",
      "Nat.Function.Involutive.iterate_even",
      "Nat.Function.Involutive.iterate_odd",
      "Nat.Function.Involutive.natCast_eq_zero_or_one_of_two_eq_zero",
      "Nat.Function.Involutive.natCast_eq_zero_or_one_of_two_eq_zero'",
      "Nat.Function.Involutive.neg_one_pow_eq_neg_one_iff_odd",
      "Nat.Icc_factorization_eq_pow_dvd",
      "Nat.Ico_pow_dvd_eq_Ico_of_lt",
      "Nat.Ioc_filter_dvd_card_eq_div",
      "Nat.Odd.sub_even",
      "Nat.Prime.coprime_descFactorial_of_lt_of_le",
      "Nat.Prime.mod_two_eq_one_iff_ne_two",
      "Nat.Prime.not_coprime_iff_dvd",
      "Nat.Prime.pow_eq_iff",
      "Nat.card_units",
      "Nat.cast_div",
      "Nat.cast_div_charZero",
      "Nat.coprime_fintype_prod_left_iff",
      "Nat.coprime_list_prod_left_iff",
      "Nat.coprime_multiset_prod_right_iff",
      "Nat.coprime_or_dvd_of_prime",
      "Nat.dvd_ordCompl_of_dvd_not_dvd",
      "Nat.dvd_prime_pow",
      "Nat.exists_eq_pow_of_exponent_coprime_of_pow_eq_pow",
      "Nat.exists_factorization_lt_of_lt",
      "Nat.factorial_coe_dvd_prod",
      "Nat.factorization_div",
      "Nat.factorization_eq_card_pow_dvd",
      "Nat.factorization_eq_of_coprime_left",
      "Nat.factorization_le_factorization_mul_right",
      "Nat.factorization_le_of_le_pow",
      "Nat.factorization_lt",
      "Nat.factorization_pow_self",
      "Nat.ne_of_odd_add",
      "Nat.ne_one_iff_exists_prime_dvd",
      "Nat.not_even_bit1",
      "Nat.not_even_iff_odd",
      "Nat.not_odd_iff_even",
      "Nat.not_prime_iff_exists_mul_eq",
      "Nat.odd_mul",
      "Nat.odd_pow_iff",
      "Nat.ordCompl_pos",
      "Nat.ordCompl_self_pow_mul",
      "Nat.ordProj_mul",
      "Nat.ordProj_of_not_prime",
      "Nat.ordProj_pos",
      "Nat.ppred_eq_none",
      "Nat.setOf_pow_dvd_eq_Icc_factorization",
      "Nat.sub_eq_psub",
      "Nat.succ_dvd_or_succ_dvd_of_succ_sum_dvd_mul",
      "Odd.mul",
      "Odd.neg",
      "Odd.neg_pow",
      "Odd.pow",
      "Odd.sub_odd",
      "Option.elim'_none_some",
      "Rat.sqrt_eq",
      "Rat.sqrt_intCast",
      "Rat.sqrt_natCast",
      "Set.Ici_eq_singleton_iff_isTop",
      "Set.Ico_diff_Iio",
      "Set.Ico_inter_Ico",
      "Set.Ico_union_Ici",
      "Set.Ico_union_Ico'",
      "Set.Iic_diff_Iic",
      "Set.Iic_diff_Iio",
      "Set.Iic_union_Ioc'",
      "Set.Iio_diff_Iic",
      "Set.Iio_diff_Iio",
      "Set.Iio_subset_Iio_iff",
      "Set.Iio_union_Ioo",
      "Set.Ioc_union_Ioc'",
      "Set.Ioc_union_Ioc_left",
      "Set.Ioc_union_Ioc_symm",
      "Set.Ioc_union_Ioc_union_Ioc_cycle",
      "Set.Ioc_union_Ioi'",
      "Set.Ioo_inter_Ioc_of_right_lt",
      "Set.Ioo_inter_Ioo",
      "Set.Ioo_subset_Ioo_iff",
      "Set.Ioo_union_Ioi'",
      "Set.diff_singleton_eq_self",
      "Set.diff_singleton_ssubset",
      "Set.diff_singleton_subset_iff",
      "Set.diff_union_inter",
      "Set.insert_diff_of_mem",
      "Set.inter_compl_nonempty_iff",
      "Set.inter_diff_right_comm",
      "Set.ite_univ",
      "Set.ncard_Icc_nat",
      "Set.ncard_Iio_nat",
      "Set.ncard_Ioc_nat",
      "Set.ncard_Ioo_nat",
      "Set.ncard_uIcc_nat",
      "Set.pair_diff_left",
      "Set.ssubset_iff_sdiff_singleton",
      "Set.subset_inter_union_compl_right",
      "Set.union_inter_compl_right_subset",
      "SetRel.Function.Set.preimage_eq",
      "SetRel.cod_eq_empty_iff",
      "SetRel.comp_assoc",
      "SetRel.comp_empty",
      "SetRel.comp_sUnion",
      "SetRel.comp_univ",
      "SetRel.dom_empty",
      "SetRel.dom_eq_empty_iff",
      "SetRel.dom_univ",
      "SetRel.iUnion_comp",
      "SetRel.id_comp",
      "SetRel.image_comp",
      "SetRel.image_id",
      "SetRel.image_inter_dom",
      "SetRel.image_union",
      "SetRel.inter_dom_subset_preimage_image",
      "SetRel.left_subset_comp",
      "SetRel.preimage_eq_biUnion",
      "SetRel.preimage_eq_dom_of_cod_subset",
      "SetRel.preimage_sUnion",
      "SetRel.prod_comp_prod",
      "SetRel.right_subset_comp",
      "SetRel.univ_comp",
      "compl_le_compl_iff_le",
      "compl_le_of_compl_le",
      "compl_le_self",
      "eq_compl_iff_isCompl",
      "inf_sdiff",
      "inf_sdiff_left_comm",
      "isUnit_two_iff_forall_even",
      "odd_add_one",
      "range_two_mul_add_one",
      "sdiff_eq_right",
      "sdiff_eq_sdiff_iff_inf_eq_inf",
      "sdiff_inf_right_comm",
      "sdiff_inf_sdiff",
      "sdiff_le_sdiff_iff_le",
      "sdiff_lt",
      "sdiff_sdiff_eq_self",
      "sdiff_sup",
      "sup_eq_sdiff_sup_sdiff_sup_inf",
      "sup_lt_of_lt_sdiff_left"
    ]
  }
}