{
  "baselines": {
    "keyword_heuristic": {
      "accuracy": 0.17543859649122806,
      "macro_f1": 0.02089252423860095,
      "top1_accuracy": 0.17543859649122806,
      "top3_accuracy": 0.49415204678362573,
      "top5_accuracy": 0.6418128654970761
    },
    "majority_class": {
      "accuracy": 0.22953216374269006,
      "macro_f1": 0.007619694726880051,
      "top1_accuracy": 0.22953216374269006,
      "top3_accuracy": 0.5307017543859649,
      "top5_accuracy": 0.631578947368421
    },
    "text_naive_bayes": {
      "accuracy": 0.40058479532163743,
      "macro_f1": 0.06483420584838161,
      "top1_accuracy": 0.40058479532163743,
      "top3_accuracy": 0.6330409356725146,
      "top5_accuracy": 0.7046783625730995
    },
    "tfidf_linear_svm": {
      "accuracy": 0.30994152046783624,
      "macro_f1": 0.12748625446848946,
      "top1_accuracy": 0.30994152046783624,
      "top3_accuracy": 0.5292397660818714,
      "top5_accuracy": 0.6432748538011696
    },
    "tfidf_logistic_regression": {
      "accuracy": 0.1608187134502924,
      "macro_f1": 0.08617500783787886,
      "top1_accuracy": 0.1608187134502924,
      "top3_accuracy": 0.2807017543859649,
      "top5_accuracy": 0.41812865497076024
    }
  },
  "label_distribution": {
    "ac_rfl": 19,
    "aesop": 67,
    "all_goals": 2,
    "apply": 31,
    "by_cases": 12,
    "by_cases!": 1,
    "by_contra": 5,
    "by_contra!": 2,
    "calc": 8,
    "cases": 17,
    "choose": 1,
    "classical": 5,
    "congr": 3,
    "constructor": 17,
    "contradiction": 1,
    "contrapose!": 5,
    "conv_lhs": 5,
    "conv_rhs": 4,
    "convert": 13,
    "decide": 23,
    "dsimp": 2,
    "exact": 207,
    "exacts": 2,
    "exists": 2,
    "ext": 31,
    "ext1": 1,
    "fun_prop": 1,
    "gcongr": 3,
    "grind": 182,
    "grw": 5,
    "have": 61,
    "if": 13,
    "induction": 24,
    "injection": 1,
    "intro": 31,
    "let": 10,
    "letI": 1,
    "lia": 18,
    "linarith": 1,
    "norm_cast": 2,
    "nth_rw": 3,
    "obtain": 47,
    "positivity": 3,
    "push": 1,
    "push_neg": 1,
    "rcases": 47,
    "refine": 64,
    "replace": 2,
    "revert": 1,
    "rfl": 14,
    "right": 2,
    "ring": 1,
    "rintro": 41,
    "rw": 487,
    "rw!": 2,
    "rwa": 30,
    "set": 2,
    "show": 2,
    "simp": 423,
    "simp_all": 14,
    "simp_all!": 3,
    "simp_rw": 40,
    "simpa": 84,
    "specialize": 1,
    "split_ifs": 5,
    "subst": 9,
    "suffices": 6,
    "symm": 2,
    "tauto": 2,
    "unfold": 8,
    "use": 12,
    "zify": 1
  },
  "representation": "premise",
  "split": {
    "n_rows": 2199,
    "n_test": 684,
    "n_test_theorems": 307,
    "n_train": 1515,
    "n_train_theorems": 715,
    "seed": 4,
    "strategy": "theorem-level random split",
    "test_ratio": 0.3,
    "test_theorems": [
      "AddCommGroup.Int.ModEq.ModEq.add_modulus_modEq_iff",
      "AddCommGroup.Int.ModEq.ModEq.add_mul_modulus_modEq_iff",
      "AddCommGroup.Int.ModEq.ModEq.cancel_right_div_gcd",
      "AddCommGroup.Int.ModEq.ModEq.dvd_iff",
      "AddCommGroup.Int.ModEq.ModEq.left_modEq_add_iff",
      "AddCommGroup.Int.ModEq.ModEq.modEq_add_modulus_mul_iff",
      "AddCommGroup.Int.ModEq.ModEq.modEq_and_modEq_iff_modEq_mul",
      "AddCommGroup.Int.ModEq.ModEq.modEq_iff_eq_of_div_eq",
      "AddCommGroup.Int.ModEq.ModEq.modEq_natAbs",
      "AddCommGroup.Int.ModEq.ModEq.modEq_sub_fac",
      "AddCommGroup.Int.ModEq.ModEq.modEq_zero_iff",
      "AddCommGroup.Int.ModEq.ModEq.mul_left'",
      "AddCommGroup.Int.ModEq.ModEq.mul_left_cancel'",
      "AddCommGroup.Int.ModEq.ModEq.mul_modulus_add_modEq_iff",
      "AddCommGroup.Int.ModEq.ModEq.pow",
      "AddCommGroup.Int.ModEq.ModEq.sub_modulus_modEq_iff",
      "AddCommGroup.Int.ModEq.ModEq.sub_modulus_mul_modEq_iff",
      "AddCommGroup.Int.ModEq.modEq_iff_add_fac",
      "AddCommGroup.Int.ModEq.natCast_modEq_iff",
      "AddCommGroup.ModEq.natCast",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.add_mod_add_ite",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.add_mod_add_of_le_add_mod",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.add_mod_of_add_mod_lt",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.chineseRemainder'_lt_lcm",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.chineseRemainder_modEq_unique",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.coprime_of_mul_modEq_one",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.eq_of_abs_lt",
      "AddCommGroup.Nat.ModEq.ModEq.ModEq.odd_mod_four_iff",
      "AddCommGroup.Nat.ModEq.ModEq.modEq_add_modulus_iff",
      "AddCommGroup.Nat.ModEq.ModEq.modEq_iff_exists_eq_add",
      "AddCommGroup.Nat.ModEq.ModEq.modulus_mul_add_modEq_iff",
      "AddCommGroup.Nat.ModEq.ModEq.mul_left'",
      "AddCommGroup.Nat.ModEq.ModEq.mul_modulus_add_modEq_iff",
      "AddCommGroup.Nat.ModEq.ModEq.sub'",
      "AddCommGroup.Nat.ModEq.modEq_zero_iff_dvd",
      "AddCommGroup.modEq_iff_intModEq",
      "Bool.and_elim_left",
      "Bool.and_le_left",
      "Bool.and_le_right",
      "Bool.coe_xor_iff",
      "Bool.eq_false_eq_not_eq_true",
      "Bool.eq_false_of_not_eq_true'",
      "Bool.eq_not_iff",
      "Bool.eq_true_of_not_eq_false'",
      "Bool.not_eq_true_eq_eq_false",
      "Bool.or_inl",
      "Bool.toNat_beq_one",
      "Bool.toNat_bne_one",
      "Bool.toNat_le_toNat",
      "Even.mul_left",
      "Even.neg_one_pow",
      "Even.of_isUnit_two",
      "Even.pow_of_ne_zero",
      "Even.sub_odd",
      "Finset.Multiset.List.Finset.Equiv.Finset.union_symm_right",
      "Finset.Multiset.List.Finset.Equiv.Multiset.Finset.univ_finset_of_isEmpty",
      "Finset.Multiset.List.Finset.empty_toList",
      "Finset.Multiset.List.Finset.toList_eq_singleton_iff",
      "Finset.Multiset.toFinset_inter",
      "Finset.Multiset.toFinset_union",
      "Finset.Nonempty.cons_induction",
      "Finset.Nontrivial.erase_nonempty",
      "Finset.Nontrivial.exists_cons_eq",
      "Finset.attach_nonempty_iff",
      "Finset.coe_eq_pair",
      "Finset.coe_eq_singleton",
      "Finset.coe_insert",
      "Finset.coe_singleton",
      "Finset.compls_infs",
      "Finset.compls_univ",
      "Finset.cons_induction",
      "Finset.dens_disjiUnion",
      "Finset.disjSups_assoc",
      "Finset.disjSups_comm",
      "Finset.disjSups_singleton",
      "Finset.disjUnion_eq_union",
      "Finset.disjoint_of_erase_left",
      "Finset.disjoint_union_left",
      "Finset.eq_singleton_iff_unique_mem",
      "Finset.erase_eq_empty_iff",
      "Finset.erase_eq_iff_eq_insert",
      "Finset.erase_insert_of_ne",
      "Finset.erase_nonempty",
      "Finset.erase_sdiff_comm",
      "Finset.erase_ssubset",
      "Finset.erase_ssubset_insert",
      "Finset.filter_and",
      "Finset.filter_eq'",
      "Finset.filter_not",
      "Finset.filter_notMem_eq_sdiff",
      "Finset.filter_or",
      "Finset.infs_compls_eq_diffs",
      "Finset.infs_self",
      "Finset.insert_comm",
      "Finset.insert_subset_insert",
      "Finset.insert_val_of_notMem",
      "Finset.mem_compls",
      "Finset.mem_diffs",
      "Finset.mem_disjSups",
      "Finset.mem_symmDiff",
      "Finset.nonempty_mk",
      "Finset.odd_sum_iff_odd_card_odd",
      "Finset.powerset_union",
      "Finset.range_filter_eq",
      "Finset.range_inter_range",
      "Finset.sdiff_insert_insert_of_mem_of_notMem",
      "Finset.ssubset_iff_exists_subset_erase",
      "Finset.subset_singleton_iff",
      "Finset.subset_union_elim",
      "Finset.sum_div",
      "Finset.sups_eq_self",
      "Finset.union_erase_of_mem",
      "Finset.univ_infs_univ",
      "Finset.val_eq_singleton_iff",
      "Fintype.card_units",
      "Int.Prime.dvd_natAbs_of_coe_dvd_sq",
      "Int.abs_le_sqrt",
      "Int.exists_mul_self",
      "Int.natAbs_eq_iff_mul_self_eq",
      "Int.sqrt_eq",
      "Int.sqrt_natCast",
      "List.IsRotated.cons_getLast_dropLast",
      "List.IsRotated.dropLast_tail",
      "List.Nodup.rotate_eq_self_iff",
      "List.countP_diff",
      "List.exists_mem_zipIdx",
      "List.exists_mem_zipIdx'",
      "List.getElem_eq_getElem_rotate",
      "List.getElem_rotate",
      "List.head?_rotate",
      "List.iterate_eq_nil",
      "List.length_cyclicPermutations_of_ne_nil",
      "List.length_mem_cyclicPermutations",
      "List.length_rotate",
      "List.map_rotate",
      "List.rotate'_eq_drop_append_take",
      "List.rotate'_rotate'",
      "List.rotate_append_length_eq",
      "List.rotate_eq_drop_append_take",
      "List.rotate_eq_rotate'",
      "List.rotate_eq_self_iff_eq_replicate",
      "List.rotate_eq_singleton_iff",
      "List.rotate_mod",
      "List.rotate_nil",
      "List.rotate_one_eq_self_iff_eq_replicate",
      "List.rotate_reverse",
      "List.rotate_rotate",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.NNReal.Real.sum_mul_le_sqrt_mul_sqrt",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.NNReal.Real.sum_sqrt_mul_sqrt_le",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.inv_sqrt_two_sub_one",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.nat_sqrt_le_real_sqrt",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.one_lt_sqrt_two",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.real_sqrt_lt_nat_sqrt_succ",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.sqrt_div",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.sqrt_inv",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.sqrt_mul",
      "NNReal.Real.Mathlib.Meta.Positivity.Real.sqrt_two_lt_three_halves",
      "NNReal.Real.coe_sqrt",
      "NNReal.Real.comap_sqrt_atTop",
      "NNReal.Real.sq_le",
      "NNReal.Real.sqrt_eq_cases",
      "NNReal.Real.sqrt_eq_zero'",
      "NNReal.Real.sqrt_eq_zero_of_nonpos",
      "NNReal.Real.sqrt_le_iff",
      "NNReal.Real.sqrt_le_sqrt_iff'",
      "NNReal.Real.sqrt_lt",
      "NNReal.Real.sqrt_mul_self_eq_abs",
      "NNReal.Real.sqrt_sq",
      "NNReal.one_le_sqrt",
      "NNReal.sqrt_le_one",
      "NNReal.sqrt_mul",
      "NNReal.sqrt_pos",
      "NNReal.sqrt_zero",
      "Nat.Function.Involutive.iterate_eq_id",
      "Nat.Function.Involutive.neg_one_pow_eq_one_iff_even",
      "Nat.Icc_factorization_eq_pow_dvd",
      "Nat.Ico_filter_pow_dvd_eq",
      "Nat.Odd.sub_odd",
      "Nat.Prime.coprime_factorial_of_lt",
      "Nat.Prime.dvd_factorial",
      "Nat.Prime.eq_of_factorization_pos",
      "Nat.Prime.even_iff",
      "Nat.Prime.even_sub_one",
      "Nat.Prime.factorization_self",
      "Nat.Prime.mul_eq_prime_sq_iff",
      "Nat.Prime.pow_dvd_iff_le_factorization",
      "Nat.Prime.pow_inj",
      "Nat.ascFactorial_eq_prod_range",
      "Nat.cast_div_div_div_cancel_right",
      "Nat.coprime_factorial_iff",
      "Nat.coprime_fintype_prod_left_iff",
      "Nat.div_two_mul_two_add_one_of_odd",
      "Nat.dvd_iff_div_factorization_eq_tsub",
      "Nat.dvd_prime_pow",
      "Nat.eq_factorization_iff",
      "Nat.factorial_coe_dvd_prod",
      "Nat.factorization_div",
      "Nat.factorization_le_factorization_mul_right",
      "Nat.factorization_ordCompl",
      "Nat.factorization_prod_apply",
      "Nat.mod_two_add_add_odd_mod_two",
      "Nat.mod_two_add_succ_mod_two",
      "Nat.not_dvd_ordCompl",
      "Nat.not_odd_iff",
      "Nat.not_prime_mul",
      "Nat.odd_add'",
      "Nat.odd_iff",
      "Nat.odd_mul",
      "Nat.ordCompl_dvd_ordCompl_of_dvd",
      "Nat.ordCompl_pos",
      "Nat.ordCompl_self_pow_mul",
      "Nat.ordProj_dvd_ordProj_of_dvd",
      "Nat.ordProj_pos",
      "Nat.setOf_pow_dvd_eq_Icc_factorization",
      "Nat.succ_dvd_or_succ_dvd_of_succ_sum_dvd_mul",
      "Odd.mul",
      "Odd.pow",
      "Odd.sub_even",
      "Odd.sub_odd",
      "Set.Icc_union_Icc'",
      "Set.Icc_union_Ici'",
      "Set.Ici_diff_Ici",
      "Set.Ici_eq_singleton_iff_isTop",
      "Set.Ico_union_Ici",
      "Set.Iic_diff_Iic",
      "Set.Iio_diff_Iic",
      "Set.Iio_ssubset_Iio_iff",
      "Set.Iio_subset_Iio_iff",
      "Set.Iio_union_Ico'",
      "Set.Iio_union_Ioo'",
      "Set.Ioc_diff_Iic",
      "Set.Ioc_eq_Ioc_iff",
      "Set.Ioc_inter_Ioc",
      "Set.Ioc_inter_Ioo_of_left_lt",
      "Set.Ioc_union_Ioi'",
      "Set.Ioi_inter_Ioo",
      "Set.Ioi_subset_Ici_iff",
      "Set.Ioo_inter_Iio",
      "Set.Ioo_subset_Ioo_iff",
      "Set.Ioo_union_Ioi",
      "Set.Ioo_union_Ioo",
      "Set.diff_insert_of_notMem",
      "Set.diff_inter_right_comm",
      "Set.diff_union_inter",
      "Set.insert_diff_of_notMem",
      "Set.insert_diff_self_of_notMem",
      "Set.insert_diff_singleton",
      "Set.insert_diff_singleton_comm",
      "Set.ite_empty",
      "Set.ite_empty_left",
      "Set.ite_eq_of_subset_right",
      "Set.ite_inter_inter",
      "Set.ite_inter_self",
      "Set.ite_univ",
      "Set.ncard_Iio_nat",
      "Set.ncard_Ioc_nat",
      "Set.pair_diff_right",
      "Set.union_inter_compl_left_subset",
      "SetRel.Function.Equiv.graph_inv",
      "SetRel.Function.graph_injective",
      "SetRel.cod_univ",
      "SetRel.comp_assoc",
      "SetRel.core_univ",
      "SetRel.dom_empty",
      "SetRel.iUnion_comp",
      "SetRel.image_eq_biUnion",
      "SetRel.image_eq_cod_of_dom_subset",
      "SetRel.image_iUnion",
      "SetRel.image_sUnion",
      "SetRel.image_union",
      "SetRel.image_univ_right",
      "SetRel.inv_eq_self_iff",
      "SetRel.inv_id",
      "SetRel.preimage_empty_left",
      "SetRel.preimage_empty_right",
      "SetRel.preimage_eq_biUnion",
      "SetRel.preimage_eq_dom_of_cod_subset",
      "SetRel.preimage_iUnion",
      "SetRel.preimage_univ_left",
      "SetRel.prod_comp_prod_of_inter_nonempty",
      "compl_le_compl_iff_le",
      "compl_le_of_compl_le",
      "disjoint_sdiff_comm",
      "eq_of_sdiff_eq_sdiff",
      "even_iff_two_dvd",
      "even_neg_two",
      "even_sub_two",
      "even_two",
      "inf_sdiff_distrib_right",
      "inf_sdiff_inf",
      "inf_sdiff_self_right",
      "odd_add_self_one'",
      "odd_add_two",
      "odd_iff_exists_bit1",
      "odd_neg_one",
      "sdiff_eq_right",
      "sdiff_le_sdiff_iff_le",
      "sdiff_lt_left",
      "sdiff_sdiff_eq_sdiff_sup",
      "sdiff_sdiff_eq_self",
      "sdiff_sdiff_sup_sdiff'",
      "sdiff_sup",
      "star_finsuppProd",
      "star_finsuppSum",
      "sup_inf_inf_sdiff",
      "sup_lt_of_lt_sdiff_left",
      "sup_sdiff_inf"
    ]
  }
}