{
  "split": {
    "strategy": "theorem-level random split",
    "seed": 42,
    "test_ratio": 0.3,
    "n_rows": 92,
    "n_train": 55,
    "n_test": 37,
    "n_train_theorems": 27,
    "n_test_theorems": 11
  },
  "label_distribution": {
    "simp": 5,
    "rintro": 3,
    "exact": 17,
    "grind": 1,
    "term": 4,
    "refine": 2,
    "constructor": 4,
    "obtain": 1,
    "simp_rw": 1,
    "rw": 9,
    "rfl": 2,
    "intro": 16,
    "apply": 6,
    "cases": 4,
    "left": 1,
    "right": 1,
    "by_contra": 1,
    "contradiction": 1,
    "linarith": 1,
    "ring": 1,
    "have": 7,
    "exact_mod_cast": 1,
    "assumption": 2,
    "simp_all": 1
  },
  "baselines": {
    "majority_class": {
      "accuracy": 0.16216216216216217,
      "macro_f1": 0.016415868673050615
    },
    "keyword_heuristic": {
      "accuracy": 0.2702702702702703,
      "macro_f1": 0.10316985645933015
    },
    "text_naive_bayes": {
      "accuracy": 0.21621621621621623,
      "macro_f1": 0.04611528822055138
    }
  }
}