{
  "ArmorRM_scores": {
    "accuracy": 0.18634782608695652,
    "precision": 0.06583365760156802,
    "recall": 0.8704268292682927,
    "f1": 0.12240905741274201,
    "true_positives": 4568,
    "true_negatives": 10433,
    "false_positives": 64819,
    "false_negatives": 680,
    "total": 80500,
    "normalized_precision": 0.09142697538147596,
    "normalized_recall": 0.864680777457463,
    "selection_accuracy": 0.0670807453416149,
    "solvable_selection_accuracy": 0.09391304347826086
  },
  "GPM_scores": {
    "accuracy": 0.916024844720497,
    "precision": 0.07384441939120631,
    "recall": 0.02496189024390244,
    "f1": 0.0373113073198519,
    "true_positives": 131,
    "true_negatives": 73609,
    "false_positives": 1643,
    "false_negatives": 5117,
    "total": 80500,
    "normalized_precision": 0.08446238785369221,
    "normalized_recall": 0.021235276896363228,
    "selection_accuracy": 0.06832298136645963,
    "solvable_selection_accuracy": 0.09565217391304348
  },
  "GRMGemma_scores": {
    "accuracy": 0.9075403726708074,
    "precision": 0.013735046521931768,
    "recall": 0.005907012195121951,
    "f1": 0.00826115922718188,
    "true_positives": 31,
    "true_negatives": 73026,
    "false_positives": 2226,
    "false_negatives": 5217,
    "total": 80500,
    "normalized_precision": 0.01995130232086754,
    "normalized_recall": 0.010628821965750353,
    "selection_accuracy": 0.058385093167701865,
    "solvable_selection_accuracy": 0.0817391304347826
  },
  "GRMLlama32_scores": {
    "accuracy": 0.9202857142857143,
    "precision": 0.012510425354462052,
    "recall": 0.002858231707317073,
    "f1": 0.004653327128897162,
    "true_positives": 15,
    "true_negatives": 74068,
    "false_positives": 1184,
    "false_negatives": 5233,
    "total": 80500,
    "normalized_precision": 0.01258550724637681,
    "normalized_recall": 0.006158121261283848,
    "selection_accuracy": 0.08571428571428572,
    "solvable_selection_accuracy": 0.12
  },
  "GRM_scores": {
    "accuracy": 0.9197515527950311,
    "precision": 0.005709624796084829,
    "recall": 0.0013338414634146342,
    "f1": 0.002162496138399753,
    "true_positives": 7,
    "true_negatives": 74033,
    "false_positives": 1219,
    "false_negatives": 5241,
    "total": 80500,
    "normalized_precision": 0.00484472049689441,
    "normalized_recall": 0.0012882145968389732,
    "selection_accuracy": 0.06832298136645963,
    "solvable_selection_accuracy": 0.09565217391304348
  },
  "OffsetBias_scores": {
    "accuracy": 0.7557391304347826,
    "precision": 0.05174451147459419,
    "recall": 0.15853658536585366,
    "f1": 0.0780231631265532,
    "true_positives": 832,
    "true_negatives": 60005,
    "false_positives": 15247,
    "false_negatives": 4416,
    "total": 80500,
    "normalized_precision": 0.0995903756975953,
    "normalized_recall": 0.18128918955432863,
    "selection_accuracy": 0.07453416149068323,
    "solvable_selection_accuracy": 0.10434782608695652
  },
  "QRM_scores": {
    "accuracy": 0.8112546583850931,
    "precision": 0.0596777049760935,
    "recall": 0.12842987804878048,
    "f1": 0.08148954177245799,
    "true_positives": 674,
    "true_negatives": 64632,
    "false_positives": 10620,
    "false_negatives": 4574,
    "total": 80500,
    "normalized_precision": 0.09674135263136807,
    "normalized_recall": 0.11688305422443007,
    "selection_accuracy": 0.06956521739130435,
    "solvable_selection_accuracy": 0.09739130434782609
  },
  "Skyworks_scores": {
    "accuracy": 0.9154782608695652,
    "precision": 0.046091015169194866,
    "recall": 0.015053353658536585,
    "f1": 0.022694627980465384,
    "true_positives": 79,
    "true_negatives": 73617,
    "false_positives": 1635,
    "false_negatives": 5169,
    "total": 80500,
    "normalized_precision": 0.044205654249132496,
    "normalized_recall": 0.012853776527017025,
    "selection_accuracy": 0.09440993788819876,
    "solvable_selection_accuracy": 0.13217391304347825
  },
  "URM_scores": {
    "accuracy": 0.2120248447204969,
    "precision": 0.06547974668419165,
    "recall": 0.8353658536585366,
    "f1": 0.12144044321329639,
    "true_positives": 4384,
    "true_negatives": 12684,
    "false_positives": 62568,
    "false_negatives": 864,
    "total": 80500,
    "normalized_precision": 0.09166307170060574,
    "normalized_recall": 0.8252425632403755,
    "selection_accuracy": 0.10186335403726708,
    "solvable_selection_accuracy": 0.1426086956521739
  }
}