{
  "gemini-2.5-flash-lite": {
    "ar-2": {
      "total": 8053,
      "true_positives": 2772,
      "false_positives": 1431,
      "true_negatives": 2160,
      "false_negatives": 1690,
      "security": 0.6015037593984962,
      "utility": 0.6212460779919319
    },
    "masking": {
      "total": 8053,
      "true_positives": 3796,
      "false_positives": 2301,
      "true_negatives": 1290,
      "false_negatives": 666,
      "security": 0.3592314118629908,
      "utility": 0.8507395786642761
    },
    "ar-1": {
      "total": 8053,
      "true_positives": 3149,
      "false_positives": 1715,
      "true_negatives": 1876,
      "false_negatives": 1313,
      "security": 0.5224171539961013,
      "utility": 0.7057373375168086
    }
  },
  "gpt-5": {
    "ar-1": {
      "total": 8053,
      "true_positives": 2174,
      "false_positives": 994,
      "true_negatives": 2597,
      "false_negatives": 2288,
      "security": 0.723196881091618,
      "utility": 0.4872254594352308
    },
    "ar-2": {
      "total": 8053,
      "true_positives": 2035,
      "false_positives": 824,
      "true_negatives": 2767,
      "false_negatives": 2427,
      "security": 0.7705374547479811,
      "utility": 0.4560735096369341
    },
    "masking": {
      "total": 8053,
      "true_positives": 3580,
      "false_positives": 2193,
      "true_negatives": 1398,
      "false_negatives": 882,
      "security": 0.3893065998329156,
      "utility": 0.8023307933662035
    }
  },
  "gpt-4.1-mini": {
    "ar-1": {
      "total": 8053,
      "true_positives": 3046,
      "false_positives": 1661,
      "true_negatives": 1930,
      "false_negatives": 1416,
      "security": 0.5374547479810637,
      "utility": 0.682653518601524
    },
    "ar-2": {
      "total": 8053,
      "true_positives": 2807,
      "false_positives": 1428,
      "true_negatives": 2163,
      "false_negatives": 1655,
      "security": 0.6023391812865497,
      "utility": 0.6290900941281936
    },
    "ar-4": {
      "total": 8053,
      "true_positives": 1941,
      "false_positives": 833,
      "true_negatives": 2758,
      "false_negatives": 2521,
      "security": 0.7680311890838206,
      "utility": 0.4350067234424025
    },
    "ar-7": {
      "total": 8053,
      "true_positives": 1806,
      "false_positives": 775,
      "true_negatives": 2816,
      "false_negatives": 2656,
      "security": 0.784182678919521,
      "utility": 0.4047512326311071
    },
    "ar-6": {
      "total": 8053,
      "true_positives": 1858,
      "false_positives": 776,
      "true_negatives": 2815,
      "false_negatives": 2604,
      "security": 0.7839042049568365,
      "utility": 0.4164051994621246
    },
    "masking": {
      "total": 8053,
      "true_positives": 3607,
      "false_positives": 2255,
      "true_negatives": 1336,
      "false_negatives": 855,
      "security": 0.3720412141464773,
      "utility": 0.8083818915284626
    },
    "ar-5": {
      "total": 8053,
      "true_positives": 1969,
      "false_positives": 813,
      "true_negatives": 2778,
      "false_negatives": 2493,
      "security": 0.7736006683375104,
      "utility": 0.44128193635141194
    },
    "ar-3": {
      "total": 8053,
      "true_positives": 2097,
      "false_positives": 892,
      "true_negatives": 2699,
      "false_negatives": 2365,
      "security": 0.7516012252854358,
      "utility": 0.46996862393545497
    }
  },
  "gpt-4.1-nano": {
    "masking": {
      "total": 8053,
      "true_positives": 3426,
      "false_positives": 2131,
      "true_negatives": 1460,
      "false_negatives": 1036,
      "security": 0.4065719855193539,
      "utility": 0.7678171223666517
    },
    "ar-2": {
      "total": 8053,
      "true_positives": 2438,
      "false_positives": 1377,
      "true_negatives": 2214,
      "false_negatives": 2024,
      "security": 0.6165413533834586,
      "utility": 0.5463917525773195
    },
    "ar-1": {
      "total": 8053,
      "true_positives": 2348,
      "false_positives": 1288,
      "true_negatives": 2303,
      "false_negatives": 2114,
      "security": 0.6413255360623782,
      "utility": 0.5262214253697893
    }
  },
  "claude-sonnet-4": {
    "ar-1": {
      "total": 8053,
      "true_positives": 3062,
      "false_positives": 1455,
      "true_negatives": 2136,
      "false_negatives": 1400,
      "security": 0.5948203842940685,
      "utility": 0.6862393545495293
    },
    "masking": {
      "total": 8053,
      "true_positives": 3492,
      "false_positives": 1989,
      "true_negatives": 1602,
      "false_negatives": 970,
      "security": 0.44611528822055135,
      "utility": 0.782608695652174
    },
    "ar-2": {
      "total": 8053,
      "true_positives": 2492,
      "false_positives": 1130,
      "true_negatives": 2461,
      "false_negatives": 1970,
      "security": 0.6853244221665274,
      "utility": 0.5584939489018378
    }
  },
  "gpt-5-mini": {
    "ar-2": {
      "total": 8053,
      "true_positives": 1678,
      "false_positives": 687,
      "true_negatives": 2904,
      "false_negatives": 2784,
      "security": 0.808688387635756,
      "utility": 0.3760645450470641
    },
    "masking": {
      "total": 8053,
      "true_positives": 3380,
      "false_positives": 2090,
      "true_negatives": 1501,
      "false_negatives": 1082,
      "security": 0.41798941798941797,
      "utility": 0.7575078440161362
    },
    "ar-1": {
      "total": 8053,
      "true_positives": 2552,
      "false_positives": 1315,
      "true_negatives": 2276,
      "false_negatives": 1910,
      "security": 0.6338067390698969,
      "utility": 0.5719408337068579
    }
  },
  "gemini-2.5-flash": {
    "ar-2": {
      "total": 8053,
      "true_positives": 2680,
      "false_positives": 1375,
      "true_negatives": 2216,
      "false_negatives": 1782,
      "security": 0.6170983013088276,
      "utility": 0.6006275212909009
    },
    "ar-1": {
      "total": 8053,
      "true_positives": 3095,
      "false_positives": 1573,
      "true_negatives": 2018,
      "false_negatives": 1367,
      "security": 0.5619604566972988,
      "utility": 0.6936351411922904
    },
    "masking": {
      "total": 8053,
      "true_positives": 3408,
      "false_positives": 2014,
      "true_negatives": 1577,
      "false_negatives": 1054,
      "security": 0.43915343915343913,
      "utility": 0.7637830569251457
    }
  },
  "gpt-5-nano": {
    "ar-1": {
      "total": 8053,
      "true_positives": 3190,
      "false_positives": 1728,
      "true_negatives": 1863,
      "false_negatives": 1272,
      "security": 0.518796992481203,
      "utility": 0.7149260421335724
    },
    "masking": {
      "total": 8053,
      "true_positives": 3663,
      "false_positives": 2210,
      "true_negatives": 1381,
      "false_negatives": 799,
      "security": 0.3845725424672793,
      "utility": 0.8209323173464814
    },
    "ar-2": {
      "total": 8053,
      "true_positives": 2892,
      "false_positives": 1501,
      "true_negatives": 2090,
      "false_negatives": 1570,
      "security": 0.582010582010582,
      "utility": 0.6481398476019722
    }
  },
  "gpt-4.1": {
    "masking": {
      "total": 8053,
      "true_positives": 3661,
      "false_positives": 2285,
      "true_negatives": 1306,
      "false_negatives": 801,
      "security": 0.3636869952659426,
      "utility": 0.8204840878529808
    },
    "ar-1": {
      "total": 8053,
      "true_positives": 2457,
      "false_positives": 1141,
      "true_negatives": 2450,
      "false_negatives": 2005,
      "security": 0.682261208576998,
      "utility": 0.550649932765576
    },
    "ar-2": {
      "total": 8053,
      "true_positives": 1983,
      "false_positives": 825,
      "true_negatives": 2766,
      "false_negatives": 2479,
      "security": 0.7702589807852965,
      "utility": 0.4444195428059166
    }
  }
}