{
  "config": {
    "name": "top_k",
    "description": "",
    "parameters": {
      "detection_pipeline.top_k_semantic_search": {
        "min": 1.0,
        "max": 10.0,
        "increment": 1.0,
        "type": "range"
      }
    },
    "created": "2025-06-07T12:20:31.435134",
    "filename": "top_k.json"
  },
  "results": {
    "aegis_v2_english": {
      "top__100": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 1.0
        },
        "metrics": {
          "num_samples": 1964,
          "accuracy": 0.5417515274949084,
          "precision_unsafe": 0.5406649616368286,
          "recall_unsafe": 0.9981114258734656,
          "f1_unsafe": 0.7013934970139349,
          "fpr_unsafe": 0.9922651933701657,
          "fnr_unsafe": 0.0018885741265344666,
          "confusion_matrix_values": {
            "TN": 7,
            "FP": 898,
            "FN": 2,
            "TP": 1057
          },
          "num_true_safe": 905,
          "num_true_unsafe": 1059,
          "num_pred_safe": 9,
          "num_pred_unsafe": 1955,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T10:38:21.788677"
      },
      "top__200": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 2.0
        },
        "metrics": {
          "num_samples": 1964,
          "accuracy": 0.5453156822810591,
          "precision_unsafe": 0.5426515930113053,
          "recall_unsafe": 0.9971671388101983,
          "f1_unsafe": 0.702828618968386,
          "fpr_unsafe": 0.9834254143646409,
          "fnr_unsafe": 0.0028328611898017,
          "confusion_matrix_values": {
            "TN": 15,
            "FP": 890,
            "FN": 3,
            "TP": 1056
          },
          "num_true_safe": 905,
          "num_true_unsafe": 1059,
          "num_pred_safe": 18,
          "num_pred_unsafe": 1946,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T10:40:49.326453"
      },
      "top__300": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 3.0
        },
        "metrics": {
          "num_samples": 1964,
          "accuracy": 0.5458248472505092,
          "precision_unsafe": 0.5430190623390005,
          "recall_unsafe": 0.9952785646836638,
          "f1_unsafe": 0.7026666666666667,
          "fpr_unsafe": 0.980110497237569,
          "fnr_unsafe": 0.004721435316336166,
          "confusion_matrix_values": {
            "TN": 18,
            "FP": 887,
            "FN": 5,
            "TP": 1054
          },
          "num_true_safe": 905,
          "num_true_unsafe": 1059,
          "num_pred_safe": 23,
          "num_pred_unsafe": 1941,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T10:43:16.247097"
      },
      "top__400": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 4.0
        },
        "metrics": {
          "num_samples": 1964,
          "accuracy": 0.5488798370672098,
          "precision_unsafe": 0.5447490946714951,
          "recall_unsafe": 0.9943342776203966,
          "f1_unsafe": 0.7038770053475936,
          "fpr_unsafe": 0.9723756906077348,
          "fnr_unsafe": 0.0056657223796034,
          "confusion_matrix_values": {
            "TN": 25,
            "FP": 880,
            "FN": 6,
            "TP": 1053
          },
          "num_true_safe": 905,
          "num_true_unsafe": 1059,
          "num_pred_safe": 31,
          "num_pred_unsafe": 1933,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T10:45:44.191667"
      },
      "top__500": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 5.0
        },
        "metrics": {
          "num_samples": 1964,
          "accuracy": 0.5519348268839104,
          "precision_unsafe": 0.5464452516865594,
          "recall_unsafe": 0.9943342776203966,
          "f1_unsafe": 0.7052913596784997,
          "fpr_unsafe": 0.9657458563535911,
          "fnr_unsafe": 0.0056657223796034,
          "confusion_matrix_values": {
            "TN": 31,
            "FP": 874,
            "FN": 6,
            "TP": 1053
          },
          "num_true_safe": 905,
          "num_true_unsafe": 1059,
          "num_pred_safe": 37,
          "num_pred_unsafe": 1927,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T10:48:12.074493"
      },
      "top__600": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 6.0
        },
        "metrics": {
          "num_samples": 1964,
          "accuracy": 0.5519348268839104,
          "precision_unsafe": 0.5465418616744669,
          "recall_unsafe": 0.9924457034938622,
          "f1_unsafe": 0.7048960429242119,
          "fpr_unsafe": 0.96353591160221,
          "fnr_unsafe": 0.007554296506137866,
          "confusion_matrix_values": {
            "TN": 33,
            "FP": 872,
            "FN": 8,
            "TP": 1051
          },
          "num_true_safe": 905,
          "num_true_unsafe": 1059,
          "num_pred_safe": 41,
          "num_pred_unsafe": 1923,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T10:50:40.234512"
      },
      "top__700": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 7.0
        },
        "metrics": {
          "num_samples": 1964,
          "accuracy": 0.5539714867617108,
          "precision_unsafe": 0.547780678851175,
          "recall_unsafe": 0.9905571293673276,
          "f1_unsafe": 0.7054472091459314,
          "fpr_unsafe": 0.9569060773480663,
          "fnr_unsafe": 0.009442870632672332,
          "confusion_matrix_values": {
            "TN": 39,
            "FP": 866,
            "FN": 10,
            "TP": 1049
          },
          "num_true_safe": 905,
          "num_true_unsafe": 1059,
          "num_pred_safe": 49,
          "num_pred_unsafe": 1915,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T10:53:07.256721"
      },
      "top__800": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 8.0
        },
        "metrics": {
          "num_samples": 1964,
          "accuracy": 0.5560081466395111,
          "precision_unsafe": 0.5489272632129775,
          "recall_unsafe": 0.9905571293673276,
          "f1_unsafe": 0.7063973063973064,
          "fpr_unsafe": 0.9524861878453039,
          "fnr_unsafe": 0.009442870632672332,
          "confusion_matrix_values": {
            "TN": 43,
            "FP": 862,
            "FN": 10,
            "TP": 1049
          },
          "num_true_safe": 905,
          "num_true_unsafe": 1059,
          "num_pred_safe": 53,
          "num_pred_unsafe": 1911,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T10:55:34.854371"
      },
      "top__900": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 9.0
        },
        "metrics": {
          "num_samples": 1964,
          "accuracy": 0.5570264765784114,
          "precision_unsafe": 0.5495542737283692,
          "recall_unsafe": 0.9896128423040604,
          "f1_unsafe": 0.7066756574511126,
          "fpr_unsafe": 0.949171270718232,
          "fnr_unsafe": 0.010387157695939566,
          "confusion_matrix_values": {
            "TN": 46,
            "FP": 859,
            "FN": 11,
            "TP": 1048
          },
          "num_true_safe": 905,
          "num_true_unsafe": 1059,
          "num_pred_safe": 57,
          "num_pred_unsafe": 1907,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T10:58:02.715902"
      },
      "top__1000": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 10.0
        },
        "metrics": {
          "num_samples": 1964,
          "accuracy": 0.5575356415478615,
          "precision_unsafe": 0.5499474237644585,
          "recall_unsafe": 0.987724268177526,
          "f1_unsafe": 0.7065180682201959,
          "fpr_unsafe": 0.9458563535911603,
          "fnr_unsafe": 0.012275731822474031,
          "confusion_matrix_values": {
            "TN": 49,
            "FP": 856,
            "FN": 13,
            "TP": 1046
          },
          "num_true_safe": 905,
          "num_true_unsafe": 1059,
          "num_pred_safe": 62,
          "num_pred_unsafe": 1902,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:00:30.707456"
      }
    },
    "fortress_dataset_english": {
      "top__100": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 1.0
        },
        "metrics": {
          "num_samples": 2354,
          "accuracy": 0.6614273576890399,
          "precision_unsafe": 0.6283018867924528,
          "recall_unsafe": 0.9932885906040269,
          "f1_unsafe": 0.7697197341808726,
          "fpr_unsafe": 0.7778874629812438,
          "fnr_unsafe": 0.006711409395973154,
          "confusion_matrix_values": {
            "TN": 225,
            "FP": 788,
            "FN": 9,
            "TP": 1332
          },
          "num_true_safe": 1013,
          "num_true_unsafe": 1341,
          "num_pred_safe": 234,
          "num_pred_unsafe": 2120,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:02:28.948066"
      },
      "top__200": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 2.0
        },
        "metrics": {
          "num_samples": 2354,
          "accuracy": 0.6699235344095157,
          "precision_unsafe": 0.6342857142857142,
          "recall_unsafe": 0.9932885906040269,
          "f1_unsafe": 0.7741935483870968,
          "fpr_unsafe": 0.7581441263573544,
          "fnr_unsafe": 0.006711409395973154,
          "confusion_matrix_values": {
            "TN": 245,
            "FP": 768,
            "FN": 9,
            "TP": 1332
          },
          "num_true_safe": 1013,
          "num_true_unsafe": 1341,
          "num_pred_safe": 254,
          "num_pred_unsafe": 2100,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:04:27.127382"
      },
      "top__300": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 3.0
        },
        "metrics": {
          "num_samples": 2354,
          "accuracy": 0.6728971962616822,
          "precision_unsafe": 0.636668262326472,
          "recall_unsafe": 0.9917971662938105,
          "f1_unsafe": 0.7755102040816326,
          "fpr_unsafe": 0.7492596248766041,
          "fnr_unsafe": 0.00820283370618941,
          "confusion_matrix_values": {
            "TN": 254,
            "FP": 759,
            "FN": 11,
            "TP": 1330
          },
          "num_true_safe": 1013,
          "num_true_unsafe": 1341,
          "num_pred_safe": 265,
          "num_pred_unsafe": 2089,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:06:26.110275"
      },
      "top__400": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 4.0
        },
        "metrics": {
          "num_samples": 2354,
          "accuracy": 0.6784197111299916,
          "precision_unsafe": 0.640926640926641,
          "recall_unsafe": 0.9903057419835943,
          "f1_unsafe": 0.7782009961910343,
          "fpr_unsafe": 0.7344521224086871,
          "fnr_unsafe": 0.009694258016405667,
          "confusion_matrix_values": {
            "TN": 269,
            "FP": 744,
            "FN": 13,
            "TP": 1328
          },
          "num_true_safe": 1013,
          "num_true_unsafe": 1341,
          "num_pred_safe": 282,
          "num_pred_unsafe": 2072,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:08:23.758385"
      },
      "top__500": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 5.0
        },
        "metrics": {
          "num_samples": 2354,
          "accuracy": 0.6813933729821581,
          "precision_unsafe": 0.6435162700339971,
          "recall_unsafe": 0.9880686055182699,
          "f1_unsafe": 0.7794117647058824,
          "fpr_unsafe": 0.7245804540967423,
          "fnr_unsafe": 0.011931394481730051,
          "confusion_matrix_values": {
            "TN": 279,
            "FP": 734,
            "FN": 16,
            "TP": 1325
          },
          "num_true_safe": 1013,
          "num_true_unsafe": 1341,
          "num_pred_safe": 295,
          "num_pred_unsafe": 2059,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:10:21.963078"
      },
      "top__600": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 6.0
        },
        "metrics": {
          "num_samples": 2354,
          "accuracy": 0.6826677994902294,
          "precision_unsafe": 0.6448780487804878,
          "recall_unsafe": 0.9858314690529456,
          "f1_unsafe": 0.7797109997051017,
          "fpr_unsafe": 0.7186574531095755,
          "fnr_unsafe": 0.014168530947054437,
          "confusion_matrix_values": {
            "TN": 285,
            "FP": 728,
            "FN": 19,
            "TP": 1322
          },
          "num_true_safe": 1013,
          "num_true_unsafe": 1341,
          "num_pred_safe": 304,
          "num_pred_unsafe": 2050,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:12:19.781686"
      },
      "top__700": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 7.0
        },
        "metrics": {
          "num_samples": 2354,
          "accuracy": 0.6873406966864911,
          "precision_unsafe": 0.6485027000490918,
          "recall_unsafe": 0.9850857568978374,
          "f1_unsafe": 0.7821195973949082,
          "fpr_unsafe": 0.7068114511352419,
          "fnr_unsafe": 0.014914243102162566,
          "confusion_matrix_values": {
            "TN": 297,
            "FP": 716,
            "FN": 20,
            "TP": 1321
          },
          "num_true_safe": 1013,
          "num_true_unsafe": 1341,
          "num_pred_safe": 317,
          "num_pred_unsafe": 2037,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:14:18.046327"
      },
      "top__800": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 8.0
        },
        "metrics": {
          "num_samples": 2354,
          "accuracy": 0.6907391673746814,
          "precision_unsafe": 0.6510596352883193,
          "recall_unsafe": 0.9850857568978374,
          "f1_unsafe": 0.7839762611275964,
          "fpr_unsafe": 0.6989141164856861,
          "fnr_unsafe": 0.014914243102162566,
          "confusion_matrix_values": {
            "TN": 305,
            "FP": 708,
            "FN": 20,
            "TP": 1321
          },
          "num_true_safe": 1013,
          "num_true_unsafe": 1341,
          "num_pred_safe": 325,
          "num_pred_unsafe": 2029,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:16:15.577687"
      },
      "top__900": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 9.0
        },
        "metrics": {
          "num_samples": 2354,
          "accuracy": 0.6924384027187765,
          "precision_unsafe": 0.652496292634701,
          "recall_unsafe": 0.9843400447427293,
          "f1_unsafe": 0.7847800237812128,
          "fpr_unsafe": 0.6939782823297137,
          "fnr_unsafe": 0.015659955257270694,
          "confusion_matrix_values": {
            "TN": 310,
            "FP": 703,
            "FN": 21,
            "TP": 1320
          },
          "num_true_safe": 1013,
          "num_true_unsafe": 1341,
          "num_pred_safe": 331,
          "num_pred_unsafe": 2023,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:18:13.895745"
      },
      "top__1000": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 10.0
        },
        "metrics": {
          "num_samples": 2354,
          "accuracy": 0.6949872557349193,
          "precision_unsafe": 0.6552067762830095,
          "recall_unsafe": 0.9806114839671887,
          "f1_unsafe": 0.7855436081242533,
          "fpr_unsafe": 0.6831194471865746,
          "fnr_unsafe": 0.019388516032811335,
          "confusion_matrix_values": {
            "TN": 321,
            "FP": 692,
            "FN": 26,
            "TP": 1315
          },
          "num_true_safe": 1013,
          "num_true_unsafe": 1341,
          "num_pred_safe": 347,
          "num_pred_unsafe": 2007,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:20:13.122771"
      }
    },
    "jailbreakbench_english": {
      "top__100": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 1.0
        },
        "metrics": {
          "num_samples": 300,
          "accuracy": 0.6966666666666667,
          "precision_unsafe": 0.7026022304832714,
          "recall_unsafe": 0.945,
          "f1_unsafe": 0.8059701492537313,
          "fpr_unsafe": 0.8,
          "fnr_unsafe": 0.055,
          "confusion_matrix_values": {
            "TN": 20,
            "FP": 80,
            "FN": 11,
            "TP": 189
          },
          "num_true_safe": 100,
          "num_true_unsafe": 200,
          "num_pred_safe": 31,
          "num_pred_unsafe": 269,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:20:38.840348"
      },
      "top__200": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 2.0
        },
        "metrics": {
          "num_samples": 300,
          "accuracy": 0.7433333333333333,
          "precision_unsafe": 0.7489878542510121,
          "recall_unsafe": 0.925,
          "f1_unsafe": 0.8277404921700223,
          "fpr_unsafe": 0.62,
          "fnr_unsafe": 0.075,
          "confusion_matrix_values": {
            "TN": 38,
            "FP": 62,
            "FN": 15,
            "TP": 185
          },
          "num_true_safe": 100,
          "num_true_unsafe": 200,
          "num_pred_safe": 53,
          "num_pred_unsafe": 247,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:21:05.719101"
      },
      "top__300": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 3.0
        },
        "metrics": {
          "num_samples": 300,
          "accuracy": 0.7433333333333333,
          "precision_unsafe": 0.7510204081632653,
          "recall_unsafe": 0.92,
          "f1_unsafe": 0.8269662921348314,
          "fpr_unsafe": 0.61,
          "fnr_unsafe": 0.08,
          "confusion_matrix_values": {
            "TN": 39,
            "FP": 61,
            "FN": 16,
            "TP": 184
          },
          "num_true_safe": 100,
          "num_true_unsafe": 200,
          "num_pred_safe": 55,
          "num_pred_unsafe": 245,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:21:31.578502"
      },
      "top__400": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 4.0
        },
        "metrics": {
          "num_samples": 300,
          "accuracy": 0.7433333333333333,
          "precision_unsafe": 0.7510204081632653,
          "recall_unsafe": 0.92,
          "f1_unsafe": 0.8269662921348314,
          "fpr_unsafe": 0.61,
          "fnr_unsafe": 0.08,
          "confusion_matrix_values": {
            "TN": 39,
            "FP": 61,
            "FN": 16,
            "TP": 184
          },
          "num_true_safe": 100,
          "num_true_unsafe": 200,
          "num_pred_safe": 55,
          "num_pred_unsafe": 245,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:21:57.316476"
      },
      "top__500": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 5.0
        },
        "metrics": {
          "num_samples": 300,
          "accuracy": 0.74,
          "precision_unsafe": 0.7520661157024794,
          "recall_unsafe": 0.91,
          "f1_unsafe": 0.8235294117647058,
          "fpr_unsafe": 0.6,
          "fnr_unsafe": 0.09,
          "confusion_matrix_values": {
            "TN": 40,
            "FP": 60,
            "FN": 18,
            "TP": 182
          },
          "num_true_safe": 100,
          "num_true_unsafe": 200,
          "num_pred_safe": 58,
          "num_pred_unsafe": 242,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:22:23.378554"
      },
      "top__600": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 6.0
        },
        "metrics": {
          "num_samples": 300,
          "accuracy": 0.7333333333333333,
          "precision_unsafe": 0.7521008403361344,
          "recall_unsafe": 0.895,
          "f1_unsafe": 0.817351598173516,
          "fpr_unsafe": 0.59,
          "fnr_unsafe": 0.105,
          "confusion_matrix_values": {
            "TN": 41,
            "FP": 59,
            "FN": 21,
            "TP": 179
          },
          "num_true_safe": 100,
          "num_true_unsafe": 200,
          "num_pred_safe": 62,
          "num_pred_unsafe": 238,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:22:49.758415"
      },
      "top__700": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 7.0
        },
        "metrics": {
          "num_samples": 300,
          "accuracy": 0.73,
          "precision_unsafe": 0.7510548523206751,
          "recall_unsafe": 0.89,
          "f1_unsafe": 0.8146453089244852,
          "fpr_unsafe": 0.59,
          "fnr_unsafe": 0.11,
          "confusion_matrix_values": {
            "TN": 41,
            "FP": 59,
            "FN": 22,
            "TP": 178
          },
          "num_true_safe": 100,
          "num_true_unsafe": 200,
          "num_pred_safe": 63,
          "num_pred_unsafe": 237,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:23:16.004241"
      },
      "top__800": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 8.0
        },
        "metrics": {
          "num_samples": 300,
          "accuracy": 0.7233333333333334,
          "precision_unsafe": 0.7489361702127659,
          "recall_unsafe": 0.88,
          "f1_unsafe": 0.8091954022988506,
          "fpr_unsafe": 0.59,
          "fnr_unsafe": 0.12,
          "confusion_matrix_values": {
            "TN": 41,
            "FP": 59,
            "FN": 24,
            "TP": 176
          },
          "num_true_safe": 100,
          "num_true_unsafe": 200,
          "num_pred_safe": 65,
          "num_pred_unsafe": 235,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:23:42.877508"
      },
      "top__900": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 9.0
        },
        "metrics": {
          "num_samples": 300,
          "accuracy": 0.7166666666666667,
          "precision_unsafe": 0.7467811158798283,
          "recall_unsafe": 0.87,
          "f1_unsafe": 0.8036951501154734,
          "fpr_unsafe": 0.59,
          "fnr_unsafe": 0.13,
          "confusion_matrix_values": {
            "TN": 41,
            "FP": 59,
            "FN": 26,
            "TP": 174
          },
          "num_true_safe": 100,
          "num_true_unsafe": 200,
          "num_pred_safe": 67,
          "num_pred_unsafe": 233,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:24:09.063071"
      },
      "top__1000": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 10.0
        },
        "metrics": {
          "num_samples": 300,
          "accuracy": 0.7166666666666667,
          "precision_unsafe": 0.7467811158798283,
          "recall_unsafe": 0.87,
          "f1_unsafe": 0.8036951501154734,
          "fpr_unsafe": 0.59,
          "fnr_unsafe": 0.13,
          "confusion_matrix_values": {
            "TN": 41,
            "FP": 59,
            "FN": 26,
            "TP": 174
          },
          "num_true_safe": 100,
          "num_true_unsafe": 200,
          "num_pred_safe": 67,
          "num_pred_unsafe": 233,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:24:36.065642"
      }
    },
    "xstest_english": {
      "top__100": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 1.0
        },
        "metrics": {
          "num_samples": 450,
          "accuracy": 0.5177777777777778,
          "precision_unsafe": 0.47901234567901235,
          "recall_unsafe": 0.97,
          "f1_unsafe": 0.6413223140495867,
          "fpr_unsafe": 0.844,
          "fnr_unsafe": 0.03,
          "confusion_matrix_values": {
            "TN": 39,
            "FP": 211,
            "FN": 6,
            "TP": 194
          },
          "num_true_safe": 250,
          "num_true_unsafe": 200,
          "num_pred_safe": 45,
          "num_pred_unsafe": 405,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:24:56.453169"
      },
      "top__200": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 2.0
        },
        "metrics": {
          "num_samples": 450,
          "accuracy": 0.6288888888888889,
          "precision_unsafe": 0.546742209631728,
          "recall_unsafe": 0.965,
          "f1_unsafe": 0.6980108499095841,
          "fpr_unsafe": 0.64,
          "fnr_unsafe": 0.035,
          "confusion_matrix_values": {
            "TN": 90,
            "FP": 160,
            "FN": 7,
            "TP": 193
          },
          "num_true_safe": 250,
          "num_true_unsafe": 200,
          "num_pred_safe": 97,
          "num_pred_unsafe": 353,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:25:17.624395"
      },
      "top__300": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 3.0
        },
        "metrics": {
          "num_samples": 450,
          "accuracy": 0.6311111111111111,
          "precision_unsafe": 0.5485714285714286,
          "recall_unsafe": 0.96,
          "f1_unsafe": 0.6981818181818182,
          "fpr_unsafe": 0.632,
          "fnr_unsafe": 0.04,
          "confusion_matrix_values": {
            "TN": 92,
            "FP": 158,
            "FN": 8,
            "TP": 192
          },
          "num_true_safe": 250,
          "num_true_unsafe": 200,
          "num_pred_safe": 100,
          "num_pred_unsafe": 350,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:25:37.622910"
      },
      "top__400": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 4.0
        },
        "metrics": {
          "num_samples": 450,
          "accuracy": 0.6311111111111111,
          "precision_unsafe": 0.5488505747126436,
          "recall_unsafe": 0.955,
          "f1_unsafe": 0.6970802919708029,
          "fpr_unsafe": 0.628,
          "fnr_unsafe": 0.045,
          "confusion_matrix_values": {
            "TN": 93,
            "FP": 157,
            "FN": 9,
            "TP": 191
          },
          "num_true_safe": 250,
          "num_true_unsafe": 200,
          "num_pred_safe": 102,
          "num_pred_unsafe": 348,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:25:58.375500"
      },
      "top__500": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 5.0
        },
        "metrics": {
          "num_samples": 450,
          "accuracy": 0.6422222222222222,
          "precision_unsafe": 0.5565217391304348,
          "recall_unsafe": 0.96,
          "f1_unsafe": 0.7045871559633028,
          "fpr_unsafe": 0.612,
          "fnr_unsafe": 0.04,
          "confusion_matrix_values": {
            "TN": 97,
            "FP": 153,
            "FN": 8,
            "TP": 192
          },
          "num_true_safe": 250,
          "num_true_unsafe": 200,
          "num_pred_safe": 105,
          "num_pred_unsafe": 345,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:26:19.401601"
      },
      "top__600": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 6.0
        },
        "metrics": {
          "num_samples": 450,
          "accuracy": 0.6422222222222222,
          "precision_unsafe": 0.5568513119533528,
          "recall_unsafe": 0.955,
          "f1_unsafe": 0.7034990791896869,
          "fpr_unsafe": 0.608,
          "fnr_unsafe": 0.045,
          "confusion_matrix_values": {
            "TN": 98,
            "FP": 152,
            "FN": 9,
            "TP": 191
          },
          "num_true_safe": 250,
          "num_true_unsafe": 200,
          "num_pred_safe": 107,
          "num_pred_unsafe": 343,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:26:39.831574"
      },
      "top__700": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 7.0
        },
        "metrics": {
          "num_samples": 450,
          "accuracy": 0.6488888888888888,
          "precision_unsafe": 0.5606936416184971,
          "recall_unsafe": 0.97,
          "f1_unsafe": 0.7106227106227107,
          "fpr_unsafe": 0.608,
          "fnr_unsafe": 0.03,
          "confusion_matrix_values": {
            "TN": 98,
            "FP": 152,
            "FN": 6,
            "TP": 194
          },
          "num_true_safe": 250,
          "num_true_unsafe": 200,
          "num_pred_safe": 104,
          "num_pred_unsafe": 346,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:27:00.236973"
      },
      "top__800": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 8.0
        },
        "metrics": {
          "num_samples": 450,
          "accuracy": 0.6488888888888888,
          "precision_unsafe": 0.5606936416184971,
          "recall_unsafe": 0.97,
          "f1_unsafe": 0.7106227106227107,
          "fpr_unsafe": 0.608,
          "fnr_unsafe": 0.03,
          "confusion_matrix_values": {
            "TN": 98,
            "FP": 152,
            "FN": 6,
            "TP": 194
          },
          "num_true_safe": 250,
          "num_true_unsafe": 200,
          "num_pred_safe": 104,
          "num_pred_unsafe": 346,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:27:20.508056"
      },
      "top__900": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 9.0
        },
        "metrics": {
          "num_samples": 450,
          "accuracy": 0.6511111111111111,
          "precision_unsafe": 0.5623188405797102,
          "recall_unsafe": 0.97,
          "f1_unsafe": 0.7119266055045872,
          "fpr_unsafe": 0.604,
          "fnr_unsafe": 0.03,
          "confusion_matrix_values": {
            "TN": 99,
            "FP": 151,
            "FN": 6,
            "TP": 194
          },
          "num_true_safe": 250,
          "num_true_unsafe": 200,
          "num_pred_safe": 105,
          "num_pred_unsafe": 345,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:27:40.502199"
      },
      "top__1000": {
        "parameters": {
          "detection_pipeline.top_k_semantic_search": 10.0
        },
        "metrics": {
          "num_samples": 450,
          "accuracy": 0.6511111111111111,
          "precision_unsafe": 0.5626822157434402,
          "recall_unsafe": 0.965,
          "f1_unsafe": 0.7108655616942909,
          "fpr_unsafe": 0.6,
          "fnr_unsafe": 0.035,
          "confusion_matrix_values": {
            "TN": 100,
            "FP": 150,
            "FN": 7,
            "TP": 193
          },
          "num_true_safe": 250,
          "num_true_unsafe": 200,
          "num_pred_safe": 107,
          "num_pred_unsafe": 343,
          "num_pred_error": 0,
          "num_pred_ambiguous": 0
        },
        "timestamp": "2025-06-24T11:28:01.024388"
      }
    }
  },
  "completed": "2025-06-24T11:28:01.032103"
}