{
  "baselines": {
    "keyword_heuristic": {
      "accuracy": 0.18867924528301888,
      "macro_f1": 0.10342555994729909,
      "top1_accuracy": 0.18867924528301888,
      "top3_accuracy": 0.2830188679245283,
      "top5_accuracy": 0.2830188679245283
    },
    "majority_class": {
      "accuracy": 0.1320754716981132,
      "macro_f1": 0.012280701754385965,
      "top1_accuracy": 0.1320754716981132,
      "top3_accuracy": 0.24528301886792453,
      "top5_accuracy": 0.2641509433962264
    },
    "text_naive_bayes": {
      "accuracy": 0.24528301886792453,
      "macro_f1": 0.07096153846153846,
      "top1_accuracy": 0.24528301886792453,
      "top3_accuracy": 0.3018867924528302,
      "top5_accuracy": 0.3018867924528302
    },
    "tfidf_linear_svm": {
      "accuracy": 0.22641509433962265,
      "macro_f1": 0.06397243107769424,
      "top1_accuracy": 0.22641509433962265,
      "top3_accuracy": 0.37735849056603776,
      "top5_accuracy": 0.4716981132075472
    },
    "tfidf_logistic_regression": {
      "accuracy": 0.20754716981132076,
      "macro_f1": 0.06397243107769424,
      "top1_accuracy": 0.20754716981132076,
      "top3_accuracy": 0.3584905660377358,
      "top5_accuracy": 0.39622641509433965
    }
  },
  "label_distribution": {
    "all_goals": 1,
    "apply": 6,
    "assumption": 1,
    "by_contra": 1,
    "cases": 2,
    "constructor": 5,
    "contradiction": 1,
    "decide": 3,
    "exact": 23,
    "grind": 1,
    "have": 7,
    "intro": 12,
    "left": 1,
    "linarith": 1,
    "obtain": 1,
    "refine": 2,
    "rfl": 2,
    "right": 1,
    "ring": 3,
    "rintro": 6,
    "rw": 12,
    "simp": 9,
    "simp_all": 3,
    "simp_rw": 3,
    "simpa": 2
  },
  "representation": "structured",
  "split": {
    "n_rows": 109,
    "n_test": 53,
    "n_test_theorems": 10,
    "n_train": 56,
    "n_train_theorems": 25,
    "seed": 4,
    "strategy": "theorem-level random split",
    "test_ratio": 0.3,
    "test_theorems": [
      "LeanResearch.imp_trans",
      "LeanResearch.not_not",
      "LeanResearch.or_comm",
      "LeanResearch.or_intro_left",
      "LeanResearch.or_intro_right",
      "LeanResearch.polynomial_factorization_30",
      "exists_rat_of_not_irrational",
      "irrational_sqrt_natCast_iff",
      "irrational_sqrt_ratCast_iff",
      "irrational_sqrt_ratCast_iff_of_nonneg"
    ]
  }
}