{
  "baselines": {
    "keyword_heuristic": {
      "accuracy": 0.215962441314554,
      "macro_f1": 0.023673919199620384,
      "top1_accuracy": 0.215962441314554,
      "top3_accuracy": 0.5164319248826291,
      "top5_accuracy": 0.6744913928012519
    },
    "majority_class": {
      "accuracy": 0.25039123630672927,
      "macro_f1": 0.008010012515644555,
      "top1_accuracy": 0.25039123630672927,
      "top3_accuracy": 0.5383411580594679,
      "top5_accuracy": 0.6682316118935837
    },
    "text_naive_bayes": {
      "accuracy": 0.405320813771518,
      "macro_f1": 0.05773078127526734,
      "top1_accuracy": 0.405320813771518,
      "top3_accuracy": 0.6416275430359938,
      "top5_accuracy": 0.7370892018779343
    },
    "tfidf_linear_svm": {
      "accuracy": 0.3646322378716745,
      "macro_f1": 0.13796760113867546,
      "top1_accuracy": 0.3646322378716745,
      "top3_accuracy": 0.6134585289514867,
      "top5_accuracy": 0.7355242566510172
    },
    "tfidf_logistic_regression": {
      "accuracy": 0.1705790297339593,
      "macro_f1": 0.07874263973418066,
      "top1_accuracy": 0.1705790297339593,
      "top3_accuracy": 0.3411580594679186,
      "top5_accuracy": 0.5101721439749609
    }
  },
  "label_distribution": {
    "ac_rfl": 19,
    "aesop": 67,
    "all_goals": 2,
    "apply": 31,
    "by_cases": 12,
    "by_cases!": 1,
    "by_contra": 5,
    "by_contra!": 2,
    "calc": 8,
    "cases": 17,
    "choose": 1,
    "classical": 5,
    "congr": 3,
    "constructor": 17,
    "contradiction": 1,
    "contrapose!": 5,
    "conv_lhs": 5,
    "conv_rhs": 4,
    "convert": 13,
    "decide": 23,
    "dsimp": 2,
    "exact": 207,
    "exacts": 2,
    "exists": 2,
    "ext": 31,
    "ext1": 1,
    "fun_prop": 1,
    "gcongr": 3,
    "grind": 182,
    "grw": 5,
    "have": 61,
    "if": 13,
    "induction": 24,
    "injection": 1,
    "intro": 31,
    "let": 10,
    "letI": 1,
    "lia": 18,
    "linarith": 1,
    "norm_cast": 2,
    "nth_rw": 3,
    "obtain": 47,
    "positivity": 3,
    "push": 1,
    "push_neg": 1,
    "rcases": 47,
    "refine": 64,
    "replace": 2,
    "revert": 1,
    "rfl": 14,
    "right": 2,
    "ring": 1,
    "rintro": 41,
    "rw": 487,
    "rw!": 2,
    "rwa": 30,
    "set": 2,
    "show": 2,
    "simp": 423,
    "simp_all": 14,
    "simp_all!": 3,
    "simp_rw": 40,
    "simpa": 84,
    "specialize": 1,
    "split_ifs": 5,
    "subst": 9,
    "suffices": 6,
    "symm": 2,
    "tauto": 2,
    "unfold": 8,
    "use": 12,
    "zify": 1
  },
  "representation": "premise",
  "split": {
    "n_rows": 2199,
    "n_test": 639,
    "n_test_theorems": 307,
    "n_train": 1560,
    "n_train_theorems": 715,
    "seed": 0,
    "strategy": "theorem-level random split",
    "test_ratio": 0.3,
    "test_theorems": [
      "AddCommGroup.Int.ModEq.ModEq.add_modEq_right_iff",
      "AddCommGroup.Int.ModEq.ModEq.add_modulus_modEq_iff",
      "AddCommGroup.Int.ModEq.ModEq.cancel_right_div_gcd",
      "AddCommGroup.Int.ModEq.ModEq.modEq_add_modulus_mul_iff",
      "AddCommGroup.Int.ModEq.ModEq.modEq_iff_eq_of_div_eq",
      "AddCommGroup.Int.ModEq.ModEq.modEq_modulus_add_iff",
      "AddCommGroup.Int.ModEq.ModEq.modEq_natAbs",
      "AddCommGroup.Int.ModEq.ModEq.mod_coprime",
      "AddCommGroup.Int.ModEq.ModEq.modulus_add_modEq_iff",
      "AddCommGroup.Int.ModEq.ModEq.of_div",
      "AddCommGroup.Int.ModEq.ModEq.of_mul_left",
      "AddCommGroup.Int.ModEq.ModEq.sub",
      "AddCommGroup.Int.ModEq.ModEq.sub_modulus_mul_modEq_iff",
      "AddCommGroup.Int.ModEq.modEq_iff_dvd",
      "AddCommGroup.Int.ModEq.modEq_zero_iff_dvd",
      "AddCommGroup.Int.ModEq.natCast_modEq_iff",
      "AddCommGroup.ModEq.natCast",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.add_div_le_add_div",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.add_div_of_dvd_left",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.cancel_left_of_coprime",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.cancel_right_div_gcd",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.le_of_lt_add",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.mod_sub_of_le",
      "AddCommGroup.Nat.ModEq.ModEq.add",
      "AddCommGroup.Nat.ModEq.ModEq.add_left_cancel",
      "AddCommGroup.Nat.ModEq.ModEq.add_modEq_left_iff",
      "AddCommGroup.Nat.ModEq.ModEq.add_modEq_right_iff",
      "AddCommGroup.Nat.ModEq.ModEq.add_modulus_mul_modEq_iff",
      "AddCommGroup.Nat.ModEq.ModEq.modEq_add_modulus_iff",
      "AddCommGroup.Nat.ModEq.ModEq.modEq_mul_modulus_add_iff",
      "AddCommGroup.Nat.ModEq.ModEq.modEq_sub_modulus_iff",
      "AddCommGroup.Nat.ModEq.ModEq.modulus_add_modEq_iff",
      "AddCommGroup.Nat.ModEq.ModEq.modulus_modEq_zero",
      "AddCommGroup.Nat.ModEq.ModEq.mul_left_cancel'",
      "AddCommGroup.Nat.ModEq.ModEq.mul_modulus_add_modEq_iff",
      "AddCommGroup.Nat.ModEq.ModEq.mul_right'",
      "AddCommGroup.Nat.ModEq.ModEq.sub_modulus_modEq_iff",
      "AddCommGroup.Nat.ModEq.modEq_iff_dvd",
      "AddCommGroup.Nat.ModEq.modEq_iff_dvd'",
      "AddCommGroup.modEq_iff_intModEq",
      "AddCommGroup.modEq_iff_natModEq",
      "Bool.and_le_left",
      "Bool.apply_apply_apply",
      "Bool.bne_eq_xor",
      "Bool.coe_sort_true",
      "Bool.decide_iff",
      "Bool.eq_or_eq_not",
      "Bool.lt_iff",
      "Bool.ofNat_le_ofNat",
      "Bool.or_eq_false_eq_eq_false_and_eq_false",
      "Bool.toNat_beq_one",
      "Bool.toNat_beq_zero",
      "Bool.toNat_bne_zero",
      "Bool.xor_iff_ne",
      "Even.mul_left",
      "Even.neg_one_pow",
      "Finset.Multiset.List.Finset.empty_toList",
      "Finset.Multiset.List.toFinset_cons",
      "Finset.Multiset.List.toFinset_filter",
      "Finset.Multiset.List.toFinset_union",
      "Finset.Multiset.toFinset_inter",
      "Finset.Multiset.toFinset_singleton",
      "Finset.Multiset.toFinset_union",
      "Finset.Nonempty.of_disjSups_left",
      "Finset.coe_insert",
      "Finset.coe_pair",
      "Finset.coe_singleton",
      "Finset.compls_infs",
      "Finset.compls_infs_eq_diffs",
      "Finset.cons_induction",
      "Finset.cons_subset_cons",
      "Finset.disjSups_comm",
      "Finset.disjSups_empty_right",
      "Finset.disjSups_inter_subset_left",
      "Finset.disjSups_union_left",
      "Finset.disjSups_union_right",
      "Finset.disjoint_disjUnion_left",
      "Finset.disjoint_insert_erase",
      "Finset.disjoint_of_erase_left",
      "Finset.disjoint_or_nonempty_inter",
      "Finset.disjoint_union_left",
      "Finset.eq_singleton_iff_nonempty_unique_mem",
      "Finset.erase_cons",
      "Finset.erase_cons_of_ne",
      "Finset.erase_eq_empty_iff",
      "Finset.erase_insert",
      "Finset.erase_insert_eq_erase",
      "Finset.erase_sdiff_distrib",
      "Finset.erase_subset_iff_of_mem",
      "Finset.exists_compls_iff",
      "Finset.filter_and",
      "Finset.filter_and_not",
      "Finset.filter_cons",
      "Finset.filter_eq",
      "Finset.filter_eq'",
      "Finset.filter_union_right",
      "Finset.forall_disjSups_iff",
      "Finset.infs_self",
      "Finset.insert_erase",
      "Finset.insert_idem",
      "Finset.insert_inter_distrib",
      "Finset.insert_subset_insert_iff",
      "Finset.inter_erase",
      "Finset.map_infs",
      "Finset.ne_insert_of_notMem",
      "Finset.nonempty_iff_eq_singleton_default",
      "Finset.not_nontrivial_empty",
      "Finset.not_nontrivial_singleton",
      "Finset.odd_sum_iff_odd_card_odd",
      "Finset.powerset_infs_powerset_self",
      "Finset.powerset_union",
      "Finset.range_inter_range",
      "Finset.range_union_range",
      "Finset.sdiff_insert",
      "Finset.sdiff_union_erase_cancel",
      "Finset.singleton_iff_unique_mem",
      "Finset.singleton_subset_set_iff",
      "Finset.ssubset_iff_exists_subset_erase",
      "Finset.subset_union_elim",
      "Fintype.card_eq_card_units_add_one",
      "Fintype.card_units",
      "HasSubset.Subset.diff_ssubset_of_nonempty",
      "Int.Prime.dvd_natAbs_of_coe_dvd_sq",
      "Int.fdiv_fdiv_eq_fdiv_mul",
      "Int.natAbs_eq_iff_mul_self_eq",
      "List.countP_lt_length_iff",
      "List.getElem_cyclicPermutations",
      "List.getElem_rotate",
      "List.get_cyclicPermutations",
      "List.get_rotate",
      "List.head?_rotate",
      "List.isRotated_iff_mod",
      "List.isRotated_nil_iff",
      "List.isRotated_nil_iff'",
      "List.isRotated_reverse_comm_iff",
      "List.mem_rotate",
      "List.rotate'_cons_succ",
      "List.rotate'_length",
      "List.rotate'_rotate'",
      "List.rotate_append_length_eq",
      "List.rotate_cons_succ",
      "List.rotate_eq_nil_iff",
      "List.rotate_perm",
      "List.rotate_replicate",
      "List.rotate_reverse",
      "List.zipWith_rotate_one",
      "Multiset.sum_map_div",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.floor_real_sqrt_eq_nat_sqrt",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.nat_floor_real_sqrt_eq_nat_sqrt",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.nat_sqrt_le_real_sqrt",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.sqrt_div'",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.sqrt_div_self",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.sqrt_inv",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.sqrt_one_add_le",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.sqrt_two_lt_three_halves",
      "NNReal.Real.abs_le_sqrt",
      "NNReal.Real.coe_sqrt",
      "NNReal.Real.continuous_sqrt",
      "NNReal.Real.mul_self_sqrt",
      "NNReal.Real.sqrt_eq_zero'",
      "NNReal.Real.sqrt_le_iff",
      "NNReal.Real.sqrt_le_one",
      "NNReal.Real.sqrt_le_sqrt",
      "NNReal.Real.sqrt_le_sqrt_iff'",
      "NNReal.Real.sqrt_lt",
      "NNReal.Real.sqrt_mul_self_eq_abs",
      "NNReal.Real.sqrt_one",
      "NNReal.Real.sqrt_sq_eq_abs",
      "NNReal.sqrt_le_one",
      "NNReal.sqrt_mul",
      "NNReal.sqrt_mul_self",
      "NNReal.sqrt_pos",
      "Nat.Function.Involutive.Even.neg_zpow",
      "Nat.Function.Involutive.iterate_eq_id",
      "Nat.Function.Involutive.iterate_eq_self",
      "Nat.Function.Involutive.neg_one_pow_congr",
      "Nat.Function.Involutive.neg_one_pow_eq_ite",
      "Nat.Function.Involutive.neg_one_pow_eq_one_iff_even",
      "Nat.Ico_pow_dvd_eq_Ico_of_lt",
      "Nat.Odd.sub_even",
      "Nat.Odd.sub_odd",
      "Nat.Prime.dvd_choose_add",
      "Nat.Prime.dvd_factorial",
      "Nat.Prime.dvd_iff_one_le_factorization",
      "Nat.Prime.even_iff",
      "Nat.Prime.factorization_self",
      "Nat.Prime.pow_dvd_iff_dvd_ordProj",
      "Nat.card_eq_card_units_add_one",
      "Nat.coprime_or_dvd_of_prime",
      "Nat.coprime_prod_right_iff",
      "Nat.descFactorial_eq_prod_range",
      "Nat.dvd_iff_prime_pow_dvd_dvd",
      "Nat.eq_one_iff_not_exists_prime_dvd",
      "Nat.exists_factorization_lt_of_lt",
      "Nat.factorial_coe_dvd_prod",
      "Nat.factorial_eq_prod_range_add_one",
      "Nat.factorization_eq_of_coprime_right",
      "Nat.factorization_eq_zero_iff_remainder",
      "Nat.factorization_lcm",
      "Nat.factorization_le_factorization_mul_right",
      "Nat.factorization_pow_self",
      "Nat.ne_of_odd_add",
      "Nat.not_even_bit1",
      "Nat.not_even_two_mul_add_one",
      "Nat.ordCompl_dvd_ordCompl_of_dvd",
      "Nat.ordCompl_eq_self_iff_zero_or_not_dvd",
      "Nat.ordCompl_of_not_prime",
      "Nat.ordCompl_pos",
      "Nat.ordProj_dvd_ordProj_of_dvd",
      "Nat.ordProj_of_not_prime",
      "Nat.ordProj_self_pow",
      "Nat.pairwise_coprime_pow_primeFactors_factorization",
      "Nat.psub_add",
      "Nat.psub_eq_none",
      "Nat.succ_dvd_or_succ_dvd_of_succ_sum_dvd_mul",
      "Nat.succ_mod_two_add_mod_two",
      "Nat.two_dvd_mul_sub_one",
      "Odd.neg_pow",
      "Odd.not_two_dvd_nat",
      "Option.elim'_eq_elim",
      "Rat.exists_mul_self",
      "Rat.sqrt_natCast",
      "Set.Icc_union_Icc",
      "Set.Icc_union_Ici",
      "Set.Icc_union_Ici'",
      "Set.Ici_eq_singleton_iff_isTop",
      "Set.Ico_diff_Iio",
      "Set.Ico_inter_Ico",
      "Set.Ico_inter_Iio",
      "Set.Ico_union_Ici",
      "Set.Iic_diff_Ioc",
      "Set.Iic_union_Ioc'",
      "Set.Iio_ssubset_Iio_iff",
      "Set.Iio_subset_Iic_iff",
      "Set.Iio_union_Ico'",
      "Set.Iio_union_Ioo",
      "Set.Ioc_diff_Iic",
      "Set.Ioc_inter_Ioi",
      "Set.Ioc_inter_Ioo_of_right_le",
      "Set.Ioc_subset_Ioc_iff",
      "Set.Ioc_union_Ioc'",
      "Set.Ioc_union_Ioc_symm",
      "Set.Ioc_union_Ioc_union_Ioc_cycle",
      "Set.Ioc_union_Ioi",
      "Set.Ioc_union_Ioi'",
      "Set.Ioo_inter_Ioc_of_right_lt",
      "Set.Ioo_inter_Ioo",
      "Set.Ioo_union_Ioi'",
      "Set.compl_union_self",
      "Set.diff_eq_compl_inter",
      "Set.insert_diff_self_of_mem",
      "Set.ite_inter_compl_self",
      "Set.ite_inter_of_inter_eq",
      "Set.ite_left",
      "Set.ite_right",
      "Set.ncard_Ico_nat",
      "Set.ncard_Ioo_nat",
      "Set.subset_inter_union_compl_right",
      "Set.union_symmDiff_union_subset",
      "SetRel.Function.Set.preimage_eq_core",
      "SetRel.cod_eq_empty_iff",
      "SetRel.cod_univ",
      "SetRel.comp_univ",
      "SetRel.core_inter",
      "SetRel.core_univ",
      "SetRel.dom_empty",
      "SetRel.id_subset",
      "SetRel.image_empty_right",
      "SetRel.image_eq_biUnion",
      "SetRel.image_eq_cod_of_dom_subset",
      "SetRel.image_inter_dom",
      "SetRel.inter_cod_subset_image_preimage",
      "SetRel.left_subset_comp",
      "SetRel.preimage_eq_dom_of_cod_subset",
      "SetRel.preimage_eq_image",
      "SetRel.preimage_univ_left",
      "SetRel.prod_comp_prod",
      "SetRel.right_subset_comp",
      "compl_lt_self",
      "compl_sdiff",
      "compl_sup_eq_top",
      "disjoint_compl_right_iff",
      "disjoint_sdiff_comm",
      "even_sub_two",
      "even_two",
      "himp_eq_left",
      "inf_sdiff_distrib_left",
      "inf_sdiff_inf",
      "isGLB_iUnion_iff_of_isLUB",
      "isUnit_two_iff_forall_even",
      "odd_iff_exists_bit1",
      "odd_sub_one",
      "sdiff_compl",
      "sdiff_eq_sdiff_iff_inf_eq_inf",
      "sdiff_eq_symm",
      "sdiff_inf_right_comm",
      "sdiff_inf_sdiff",
      "sdiff_le_sdiff_iff_le",
      "sdiff_lt",
      "sdiff_lt_left",
      "sdiff_sdiff_left'",
      "sdiff_sdiff_right_self",
      "sdiff_sup",
      "sdiff_sup_self'",
      "sdiff_unique",
      "sup_inf_inf_compl",
      "sup_lt_of_lt_sdiff_left"
    ]
  }
}