{
  "armor_rm_score": {
    "accuracy": 0.4528233657858136,
    "precision": 0.6914683100582348,
    "recall": 0.2652065488452781,
    "f1": 0.3833735619573054,
    "true_positives": 12230,
    "true_negatives": 20328,
    "false_positives": 5457,
    "false_negatives": 33885,
    "total": 71900,
    "normalized_precision": 0.6823408560838098,
    "normalized_recall": 0.2577739585507254,
    "selection_accuracy": 0.6995827538247567,
    "solvable_selection_accuracy": 0.71045197740113
  },
  "gpm_scores": {
    "accuracy": 0.4547287899860918,
    "precision": 0.5771825574122063,
    "recall": 0.5602732299685569,
    "f1": 0.5686022073306265,
    "true_positives": 25837,
    "true_negatives": 6858,
    "false_positives": 18927,
    "false_negatives": 20278,
    "total": 71900,
    "normalized_precision": 0.6339222623724408,
    "normalized_recall": 0.6120104752017441,
    "selection_accuracy": 0.5563282336578581,
    "solvable_selection_accuracy": 0.5649717514124294
  },
  "grm_gemma_scores": {
    "accuracy": 0.4451877607788595,
    "precision": 0.7521471398476746,
    "recall": 0.20130109508836605,
    "f1": 0.31760097165437845,
    "true_positives": 9283,
    "true_negatives": 22726,
    "false_positives": 3059,
    "false_negatives": 36832,
    "total": 71900,
    "normalized_precision": 0.6859634700056684,
    "normalized_recall": 0.1802497418481706,
    "selection_accuracy": 0.7051460361613352,
    "solvable_selection_accuracy": 0.7161016949152542
  },
  "grm_llama32_scores": {
    "accuracy": 0.43022253129346316,
    "precision": 0.7498543972044264,
    "recall": 0.16751599262712782,
    "f1": 0.2738536256802028,
    "true_positives": 7725,
    "true_negatives": 23208,
    "false_positives": 2577,
    "false_negatives": 38390,
    "total": 71900,
    "normalized_precision": 0.6736446545018289,
    "normalized_recall": 0.14880504375263676,
    "selection_accuracy": 0.7121001390820584,
    "solvable_selection_accuracy": 0.7231638418079096
  },
  "grm_scores": {
    "accuracy": 0.4039777468706537,
    "precision": 0.8201452974671117,
    "recall": 0.09057790306841591,
    "f1": 0.16313857209810967,
    "true_positives": 4177,
    "true_negatives": 24869,
    "false_positives": 916,
    "false_negatives": 41938,
    "total": 71900,
    "normalized_precision": 0.6095884501883405,
    "normalized_recall": 0.07521662529299908,
    "selection_accuracy": 0.6981919332406119,
    "solvable_selection_accuracy": 0.7090395480225988
  },
  "internlm_scores": {
    "accuracy": 0.44358057831124215,
    "precision": 0.8199245757385293,
    "recall": 0.1697315348917899,
    "f1": 0.2812432626661876,
    "true_positives": 7827,
    "true_negatives": 24066,
    "false_positives": 1719,
    "false_negatives": 38287,
    "total": 71899,
    "normalized_precision": 0.7064994485962137,
    "normalized_recall": 0.14099704734847987,
    "selection_accuracy": 0.717663421418637,
    "solvable_selection_accuracy": 0.7288135593220338
  },
  "offset_bias_scores": {
    "accuracy": 0.45061196105702367,
    "precision": 0.6721499219156689,
    "recall": 0.27999566301637213,
    "f1": 0.39531572904707235,
    "true_positives": 12912,
    "true_negatives": 19487,
    "false_positives": 6298,
    "false_negatives": 33203,
    "total": 71900,
    "normalized_precision": 0.677346339394245,
    "normalized_recall": 0.2802944320318698,
    "selection_accuracy": 0.7093184979137691,
    "solvable_selection_accuracy": 0.7203389830508474
  },
  "qrm_scores": {
    "accuracy": 0.47870653685674547,
    "precision": 0.7464041095890411,
    "recall": 0.2835736745093787,
    "f1": 0.4110002357193368,
    "true_positives": 13077,
    "true_negatives": 21342,
    "false_positives": 4443,
    "false_negatives": 33038,
    "total": 71900,
    "normalized_precision": 0.6949828784880694,
    "normalized_recall": 0.25481141092947984,
    "selection_accuracy": 0.717663421418637,
    "solvable_selection_accuracy": 0.7288135593220338
  },
  "skyworks_scores": {
    "accuracy": 0.4471905424200278,
    "precision": 0.7809246514910888,
    "recall": 0.19193321045213055,
    "f1": 0.3081341711779143,
    "true_positives": 8851,
    "true_negatives": 23302,
    "false_positives": 2483,
    "false_negatives": 37264,
    "total": 71900,
    "normalized_precision": 0.6982056051189748,
    "normalized_recall": 0.16433149123457474,
    "selection_accuracy": 0.7190542420027817,
    "solvable_selection_accuracy": 0.730225988700565
  },
  "urm_scores": {
    "accuracy": 0.6412378303198887,
    "precision": 0.6418320909065528,
    "recall": 0.9970074812967581,
    "f1": 0.7809323221428631,
    "true_positives": 45977,
    "true_negatives": 128,
    "false_positives": 25657,
    "false_negatives": 138,
    "total": 71900,
    "normalized_precision": 0.6516628802322076,
    "normalized_recall": 0.9970704313069563,
    "selection_accuracy": 0.6995827538247567,
    "solvable_selection_accuracy": 0.71045197740113
  }
}