{
  "baselines": {
    "keyword_heuristic": {
      "accuracy": 0.13043478260869565,
      "macro_f1": 0.04,
      "top1_accuracy": 0.13043478260869565,
      "top3_accuracy": 0.5652173913043478,
      "top5_accuracy": 0.9130434782608695
    },
    "majority_class": {
      "accuracy": 0.17391304347826086,
      "macro_f1": 0.04938271604938272,
      "top1_accuracy": 0.17391304347826086,
      "top3_accuracy": 0.8695652173913043,
      "top5_accuracy": 0.9130434782608695
    },
    "text_naive_bayes": {
      "accuracy": 0.7391304347826086,
      "macro_f1": 0.4050925925925926,
      "top1_accuracy": 0.7391304347826086,
      "top3_accuracy": 0.9565217391304348,
      "top5_accuracy": 0.9565217391304348
    },
    "tfidf_linear_svm": {
      "accuracy": 0.5652173913043478,
      "macro_f1": 0.4138257575757575,
      "top1_accuracy": 0.5652173913043478,
      "top3_accuracy": 0.8260869565217391,
      "top5_accuracy": 0.8260869565217391
    },
    "tfidf_logistic_regression": {
      "accuracy": 0.6086956521739131,
      "macro_f1": 0.45047905525846704,
      "top1_accuracy": 0.6086956521739131,
      "top3_accuracy": 0.782608695652174,
      "top5_accuracy": 0.9130434782608695
    }
  },
  "label_distribution": {
    "apply": 1,
    "cases": 7,
    "constructor": 4,
    "decide": 19,
    "exact": 4,
    "grind": 16,
    "induction": 1,
    "injection": 1,
    "obtain": 1,
    "rcases": 1,
    "refine": 1,
    "rw": 5,
    "simp": 23,
    "split_ifs": 1
  },
  "representation": "raw",
  "split": {
    "n_rows": 85,
    "n_test": 23,
    "n_test_theorems": 19,
    "n_train": 62,
    "n_train_theorems": 43,
    "seed": 42,
    "strategy": "theorem-level random split",
    "test_ratio": 0.3,
    "test_theorems": [
      "Bool.and_eq_true_eq_eq_true_and_eq_true",
      "Bool.bool_iff_false",
      "Bool.coe_sort_false",
      "Bool.dichotomy",
      "Bool.eq_false_of_not_eq_true'",
      "Bool.eq_not_iff",
      "Bool.eq_or_eq_not",
      "Bool.eq_true_eq_not_eq_false",
      "Bool.false_eq_true_eq_False",
      "Bool.not_eq_false_eq_eq_true",
      "Bool.not_eq_true_eq_eq_false",
      "Bool.not_ne_self",
      "Bool.or_eq_false_eq_eq_false_and_eq_false",
      "Bool.or_inr",
      "Bool.toNat_bne_one",
      "Nat.ppred_eq_none",
      "Nat.psub_eq_some",
      "Rat.sqrt_intCast",
      "Rat.sqrt_natCast"
    ]
  }
}