{
  "ArmorRM_scores": {
    "accuracy": 0.5420288115246098,
    "precision": 0.5753373190891568,
    "recall": 0.7434825744622464,
    "f1": 0.6486909596559568,
    "true_positives": 35221,
    "true_negatives": 9930,
    "false_positives": 25997,
    "false_negatives": 12152,
    "total": 83300,
    "normalized_precision": 0.575060212552224,
    "normalized_recall": 0.7426538940486773,
    "selection_accuracy": 0.5894357743097239,
    "solvable_selection_accuracy": 0.5922798552472859
  },
  "EurusPRMStage1_avg_scores": {
    "accuracy": 0.5685234093637455,
    "precision": 0.5688904959922859,
    "recall": 0.996305912650666,
    "f1": 0.7242400527858338,
    "true_positives": 47198,
    "true_negatives": 160,
    "false_positives": 35767,
    "false_negatives": 175,
    "total": 83300,
    "normalized_precision": 0.5716685139315947,
    "normalized_recall": 0.9967049017659821,
    "selection_accuracy": 0.595438175270108,
    "solvable_selection_accuracy": 0.5983112183353438
  },
  "EurusPRMStage1_max_scores": {
    "accuracy": 0.43202881152460987,
    "precision": 0.6265560165975104,
    "recall": 0.003187469655711059,
    "f1": 0.006342672323266266,
    "true_positives": 151,
    "true_negatives": 35837,
    "false_positives": 90,
    "false_negatives": 47222,
    "total": 83300,
    "normalized_precision": 0.1124045034177724,
    "normalized_recall": 0.002898425208595753,
    "selection_accuracy": 0.5798319327731093,
    "solvable_selection_accuracy": 0.5826296743063932
  },
  "EurusPRMStage1_min_scores": {
    "accuracy": 0.5684753901560624,
    "precision": 0.5687073848262925,
    "recall": 0.9982901652840226,
    "f1": 0.7246150310273501,
    "true_positives": 47292,
    "true_negatives": 62,
    "false_positives": 35865,
    "false_negatives": 81,
    "total": 83300,
    "normalized_precision": 0.571456963890828,
    "normalized_recall": 0.9982773066098004,
    "selection_accuracy": 0.6110444177671068,
    "solvable_selection_accuracy": 0.6139927623642943
  },
  "EurusPRMStage2_avg_scores": {
    "accuracy": 0.5685114045618247,
    "precision": 0.568693206404154,
    "recall": 0.9987334557659426,
    "f1": 0.7247202628495278,
    "true_positives": 47313,
    "true_negatives": 44,
    "false_positives": 35883,
    "false_negatives": 60,
    "total": 83300,
    "normalized_precision": 0.5714977418050662,
    "normalized_recall": 0.9988938727704997,
    "selection_accuracy": 0.6650660264105642,
    "solvable_selection_accuracy": 0.6682750301568154
  },
  "EurusPRMStage2_max_scores": {
    "accuracy": 0.4313565426170468,
    "precision": 0.7777777777777778,
    "recall": 0.00014776349397336035,
    "f1": 0.00029547085391076777,
    "true_positives": 7,
    "true_negatives": 35925,
    "false_positives": 2,
    "false_negatives": 47366,
    "total": 83300,
    "normalized_precision": 0.008443908323281062,
    "normalized_recall": 0.0001452166910078262,
    "selection_accuracy": 0.6350540216086434,
    "solvable_selection_accuracy": 0.638118214716526
  },
  "EurusPRMStage2_min_scores": {
    "accuracy": 0.5684633853541416,
    "precision": 0.5687617351114534,
    "recall": 0.9975091296730205,
    "f1": 0.7244532681266623,
    "true_positives": 47255,
    "true_negatives": 98,
    "false_positives": 35829,
    "false_negatives": 118,
    "total": 83300,
    "normalized_precision": 0.5715260010137885,
    "normalized_recall": 0.9975081720638826,
    "selection_accuracy": 0.6554621848739496,
    "solvable_selection_accuracy": 0.6586248492159228
  },
  "GPM_scores": {
    "accuracy": 0.4341296518607443,
    "precision": 0.5618448637316562,
    "recall": 0.022628923648491756,
    "f1": 0.04350561068160143,
    "true_positives": 1072,
    "true_negatives": 35091,
    "false_positives": 836,
    "false_negatives": 46301,
    "total": 83300,
    "normalized_precision": 0.49917140559480727,
    "normalized_recall": 0.023041634400537157,
    "selection_accuracy": 0.5738295318127251,
    "solvable_selection_accuracy": 0.5765983112183354
  },
  "GRMGemma_scores": {
    "accuracy": 0.4694357743097239,
    "precision": 0.5658172778123057,
    "recall": 0.28826546767145844,
    "f1": 0.3819432790736701,
    "true_positives": 13656,
    "true_negatives": 25448,
    "false_positives": 10479,
    "false_negatives": 33717,
    "total": 83300,
    "normalized_precision": 0.5875719975809135,
    "normalized_recall": 0.3030022392851423,
    "selection_accuracy": 0.5870348139255702,
    "solvable_selection_accuracy": 0.5898673100120627
  },
  "GRMLlama32_scores": {
    "accuracy": 0.4702280912364946,
    "precision": 0.5631105748647491,
    "recall": 0.30540603297236824,
    "f1": 0.3960255111816714,
    "true_positives": 14468,
    "true_negatives": 24702,
    "false_positives": 11225,
    "false_negatives": 32905,
    "total": 83300,
    "normalized_precision": 0.5866836693384434,
    "normalized_recall": 0.32014980548537403,
    "selection_accuracy": 0.6386554621848739,
    "solvable_selection_accuracy": 0.6417370325693607
  },
  "GRM_scores": {
    "accuracy": 0.46122448979591835,
    "precision": 0.6129382984506659,
    "recall": 0.14280286238996898,
    "f1": 0.23163841807909605,
    "true_positives": 6765,
    "true_negatives": 31655,
    "false_positives": 4272,
    "false_negatives": 40608,
    "total": 83300,
    "normalized_precision": 0.6132240753705116,
    "normalized_recall": 0.14001569430517835,
    "selection_accuracy": 0.6326530612244898,
    "solvable_selection_accuracy": 0.6357056694813028
  },
  "OffsetBias_scores": {
    "accuracy": 0.469327731092437,
    "precision": 0.5616006844520495,
    "recall": 0.30483608806704243,
    "f1": 0.39517287616128727,
    "true_positives": 14441,
    "true_negatives": 24654,
    "false_positives": 11273,
    "false_negatives": 32932,
    "total": 83300,
    "normalized_precision": 0.5867499448844451,
    "normalized_recall": 0.3214071842999711,
    "selection_accuracy": 0.6110444177671068,
    "solvable_selection_accuracy": 0.6139927623642943
  },
  "QRM_scores": {
    "accuracy": 0.475906362545018,
    "precision": 0.5786754742547425,
    "recall": 0.28847655837713465,
    "f1": 0.3850173970615166,
    "true_positives": 13666,
    "true_negatives": 25977,
    "false_positives": 9950,
    "false_negatives": 33707,
    "total": 83300,
    "normalized_precision": 0.5991638731313531,
    "normalized_recall": 0.2996790623765848,
    "selection_accuracy": 0.6410564225690276,
    "solvable_selection_accuracy": 0.6441495778045838
  },
  "Skyworks_scores": {
    "accuracy": 0.4748739495798319,
    "precision": 0.5933161953727506,
    "recall": 0.24359867435036836,
    "f1": 0.34539006030857633,
    "true_positives": 11540,
    "true_negatives": 28017,
    "false_positives": 7910,
    "false_negatives": 35833,
    "total": 83300,
    "normalized_precision": 0.6096564648092688,
    "normalized_recall": 0.25158137267558617,
    "selection_accuracy": 0.6374549819927972,
    "solvable_selection_accuracy": 0.6405307599517491
  },
  "URM_scores": {
    "accuracy": 0.5669027611044418,
    "precision": 0.5694335169158143,
    "recall": 0.9777721486922931,
    "f1": 0.7197184521081132,
    "true_positives": 46320,
    "true_negatives": 903,
    "false_positives": 35024,
    "false_negatives": 1053,
    "total": 83300,
    "normalized_precision": 0.5717661633103892,
    "normalized_recall": 0.9770248675449388,
    "selection_accuracy": 0.5678271308523409,
    "solvable_selection_accuracy": 0.5705669481302774
  }
}