dataset_name,noise_level,run_number,f1_unsafe,accuracy,fpr_unsafe,fnr_unsafe
fortress_dataset,0.05,1,0.9151785714285714,0.903143585386576,0.11549851924975321,0.08277404921700224
xstest,0.05,1,0.8324324324324325,0.8622222222222222,0.064,0.23
jailbreakbench,0.05,1,0.8994708994708994,0.8733333333333333,0.08,0.15
aegis_v2,0.05,1,0.7797447509263071,0.7275967413441955,0.46740331491712706,0.10576015108593012
fortress_dataset,0.05,2,0.9128816083395384,0.9005947323704333,0.11747285291214216,0.08575689783743475
xstest,0.05,2,0.8310991957104558,0.86,0.072,0.225
jailbreakbench,0.05,2,0.900523560209424,0.8733333333333333,0.1,0.14
aegis_v2,0.05,2,0.7788778877887789,0.7270875763747454,0.46519337016574586,0.10859301227573183
fortress_dataset,0.05,3,0.9129464285714286,0.9005947323704333,0.11846001974333663,0.08501118568232663
xstest,0.05,3,0.8292682926829268,0.86,0.064,0.235
jailbreakbench,0.05,3,0.8847184986595175,0.8566666666666667,0.08,0.175
aegis_v2,0.05,3,0.7778237484484899,0.7265784114052953,0.46187845303867403,0.11237016052880075
fortress_dataset,0.05,4,0.9136448598130841,0.9018691588785047,0.11056268509378085,0.08873974645786727
xstest,0.05,4,0.8342245989304813,0.8622222222222222,0.072,0.22
jailbreakbench,0.05,4,0.8918205804749341,0.8633333333333333,0.1,0.155
aegis_v2,0.05,4,0.7824285122254455,0.7326883910386965,0.4530386740331492,0.10859301227573183
fortress_dataset,0.05,5,0.9128816083395384,0.9005947323704333,0.11747285291214216,0.08575689783743475
xstest,0.05,5,0.8421052631578947,0.8666666666666667,0.08,0.2
jailbreakbench,0.05,5,0.900523560209424,0.8733333333333333,0.1,0.14
aegis_v2,0.05,5,0.7818181818181819,0.7311608961303462,0.4585635359116022,0.10670443814919736
fortress_dataset,0.10,1,0.9112426035502958,0.8980458793542906,0.12931885488647582,0.08128262490678598
xstest,0.10,1,0.7862796833773087,0.82,0.12,0.255
jailbreakbench,0.10,1,0.9025641025641026,0.8733333333333333,0.14,0.12
aegis_v2,0.10,1,0.766721044045677,0.7087576374745418,0.5005524861878453,0.11237016052880075
fortress_dataset,0.10,2,0.9137994820569737,0.9010195412064571,0.12537018756169793,0.0790454884414616
xstest,0.10,2,0.8241469816272966,0.8511111111111112,0.096,0.215
jailbreakbench,0.10,2,0.890625,0.86,0.13,0.145
aegis_v2,0.10,2,0.76904075751338,0.7143584521384929,0.481767955801105,0.11803588290840415
fortress_dataset,0.10,3,0.9051310446659284,0.8908241291418861,0.140177690029615,0.08575689783743475
xstest,0.10,3,0.8222811671087533,0.8511111111111112,0.088,0.225
jailbreakbench,0.10,3,0.8746666666666667,0.8433333333333334,0.11,0.18
aegis_v2,0.10,3,0.7747230201066886,0.7204684317718941,0.47955801104972373,0.10859301227573183
fortress_dataset,0.10,4,0.9119286510590858,0.8993203058623619,0.12142152023692004,0.08501118568232663
xstest,0.10,4,0.8324607329842932,0.8577777777777778,0.092,0.205
jailbreakbench,0.10,4,0.8871391076115486,0.8566666666666667,0.12,0.155
aegis_v2,0.10,4,0.7797029702970297,0.7281059063136456,0.46408839779005523,0.10764872521246459
fortress_dataset,0.10,5,0.9086859688195991,0.8954970263381479,0.12734452122408688,0.087248322147651
xstest,0.10,5,0.8290155440414507,0.8533333333333334,0.104,0.2
jailbreakbench,0.10,5,0.9028871391076115,0.8766666666666667,0.09,0.14
aegis_v2,0.10,5,0.7724477244772447,0.7174134419551935,0.4839779005524862,0.11048158640226628
fortress_dataset,0.15,1,0.9043097151205259,0.8887000849617672,0.15695952615992104,0.07680835197613721
xstest,0.15,1,0.746031746031746,0.7866666666666666,0.148,0.295
jailbreakbench,0.15,1,0.9063291139240506,0.8766666666666667,0.16,0.105
aegis_v2,0.15,1,0.7577235772357723,0.6965376782077393,0.518232044198895,0.11992445703493862
fortress_dataset,0.15,2,0.907957462412908,0.8933729821580288,0.14610069101678183,0.07680835197613721
xstest,0.15,2,0.7837150127226463,0.8111111111111111,0.156,0.23
jailbreakbench,0.15,2,0.8711340206185567,0.8333333333333334,0.19,0.155
aegis_v2,0.15,2,0.7619047619047619,0.6995926680244399,0.5248618784530387,0.10859301227573183
fortress_dataset,0.15,3,0.8931047063115651,0.8755310110450297,0.17374136229022705,0.087248322147651
xstest,0.15,3,0.7946666666666666,0.8288888888888889,0.104,0.255
jailbreakbench,0.15,3,0.8123249299719888,0.7766666666666666,0.12,0.275
aegis_v2,0.15,3,0.766302146618064,0.7062118126272913,0.512707182320442,0.10670443814919736
fortress_dataset,0.15,4,0.8977065890061886,0.8806287170773152,0.17077986179664364,0.08053691275167785
xstest,0.15,4,0.8041237113402062,0.8311111111111111,0.128,0.22
jailbreakbench,0.15,4,0.8772845953002611,0.8433333333333334,0.15,0.16
aegis_v2,0.15,4,0.7640081799591002,0.7062118126272913,0.4994475138121547,0.11803588290840415
fortress_dataset,0.15,5,0.9005847953216374,0.8844519966015293,0.16090819348469892,0.08128262490678598
xstest,0.15,5,0.8132992327365729,0.8377777777777777,0.128,0.205
jailbreakbench,0.15,5,0.8509485094850948,0.8166666666666667,0.12,0.215
aegis_v2,0.15,5,0.7657188626351622,0.7021384928716904,0.532596685082873,0.09726156751652502
fortress_dataset,0.20,1,0.8921639108554996,0.8725573491928632,0.19743336623889438,0.07457121551081283
xstest,0.20,1,0.745,0.7733333333333333,0.204,0.255
jailbreakbench,0.20,1,0.8737373737373737,0.8333333333333334,0.23,0.135
aegis_v2,0.20,1,0.7495987158908507,0.6822810590631364,0.5513812154696133,0.11803588290840415
fortress_dataset,0.20,2,0.8927161822748475,0.872982158028887,0.19940769990128332,0.07233407904548844
xstest,0.20,2,0.7741935483870968,0.7977777777777778,0.188,0.22
jailbreakbench,0.20,2,0.8787878787878788,0.84,0.22,0.13
aegis_v2,0.20,2,0.7538767395626242,0.6848268839103869,0.5613259668508287,0.1048158640226629
fortress_dataset,0.20,3,0.8836874324810947,0.862786745964316,0.2063178677196446,0.08501118568232663
xstest,0.20,3,0.7810026385224275,0.8155555555555556,0.124,0.26
jailbreakbench,0.20,3,0.7863247863247863,0.75,0.13,0.31
aegis_v2,0.20,3,0.7554304102976669,0.6904276985743381,0.5392265193370166,0.11331444759206799
fortress_dataset,0.20,4,0.8805755395683453,0.8589634664401019,0.21224086870681144,0.087248322147651
xstest,0.20,4,0.7777777777777778,0.8044444444444444,0.168,0.23
jailbreakbench,0.20,4,0.8630490956072352,0.8233333333333334,0.2,0.165
aegis_v2,0.20,4,0.7575880210441117,0.695010183299389,0.5259668508287293,0.11614730878186968
fortress_dataset,0.20,5,0.8887277999275099,0.8695836873406967,0.1895360315893386,0.08575689783743475
xstest,0.20,5,0.7761194029850746,0.8,0.184,0.22
jailbreakbench,0.20,5,0.8525469168900804,0.8166666666666667,0.14,0.205
aegis_v2,0.20,5,0.7540594059405941,0.6838085539714868,0.5679558011049723,0.10103871576959396
fortress_dataset,0.25,1,0.8736692689850958,0.848768054375531,0.2428430404738401,0.08202833706189411
xstest,0.25,1,0.7330097087378641,0.7555555555555555,0.244,0.245
jailbreakbench,0.25,1,0.8542713567839196,0.8066666666666666,0.28,0.15
aegis_v2,0.25,1,0.7382178217821782,0.6634419551934827,0.5900552486187846,0.11992445703493862
fortress_dataset,0.25,2,0.8746478873239436,0.848768054375531,0.25370187561697927,0.0738255033557047
xstest,0.25,2,0.7445255474452555,0.7666666666666667,0.232,0.235
jailbreakbench,0.25,2,0.8585858585858586,0.8133333333333334,0.26,0.15
aegis_v2,0.25,2,0.7408572552103815,0.6644602851323829,0.5988950276243094,0.11048158640226628
fortress_dataset,0.25,3,0.8657243816254417,0.8385726423109601,0.26061204343534056,0.08650260999254288
xstest,0.25,3,0.7568922305764411,0.7844444444444445,0.192,0.245
jailbreakbench,0.25,3,0.768361581920904,0.7266666666666667,0.18,0.32
aegis_v2,0.25,3,0.7426736250501806,0.6736252545824847,0.5602209944751381,0.12653446647780925
fortress_dataset,0.25,4,0.8647308781869688,0.8377230246389125,0.25863770977295164,0.0894854586129754
xstest,0.25,4,0.7487437185929648,0.7777777777777778,0.196,0.255
jailbreakbench,0.25,4,0.8564102564102564,0.8133333333333334,0.23,0.165
aegis_v2,0.25,4,0.7366336633663366,0.6614052953156823,0.5922651933701657,0.12181303116147309
fortress_dataset,0.25,5,0.8673323823109843,0.8419711129991504,0.24383020730503455,0.09321401938851603
xstest,0.25,5,0.7432762836185819,0.7666666666666667,0.228,0.24
jailbreakbench,0.25,5,0.8222811671087533,0.7766666666666666,0.22,0.225
aegis_v2,0.25,5,0.7433768287860815,0.6695519348268839,0.585635359116022,0.11237016052880075
fortress_dataset,0.30,1,0.8510786360473208,0.8181818181818182,0.3060217176702863,0.08799403430275914
xstest,0.30,1,0.7067307692307693,0.7288888888888889,0.276,0.265
jailbreakbench,0.30,1,0.8478802992518704,0.7966666666666666,0.31,0.15
aegis_v2,0.30,1,0.7227022780832679,0.6405295315682281,0.6265193370165746,0.13125590179414542
fortress_dataset,0.30,2,0.8503448275862069,0.8156329651656754,0.32181638696939785,0.08053691275167785
xstest,0.30,2,0.7276995305164319,0.7422222222222222,0.284,0.225
jailbreakbench,0.30,2,0.8613861386138614,0.8133333333333334,0.3,0.13
aegis_v2,0.30,2,0.7222222222222222,0.6384928716904277,0.6342541436464089,0.12842304060434373
fortress_dataset,0.30,3,0.8416666666666667,0.806287170773152,0.3228035538005923,0.09619686800894854
xstest,0.30,3,0.7378640776699029,0.76,0.24,0.24
jailbreakbench,0.30,3,0.8043478260869565,0.76,0.2,0.26
aegis_v2,0.30,3,0.723302897975387,0.645112016293279,0.6066298342541436,0.1397544853635505
fortress_dataset,0.30,4,0.8450606585788561,0.8101104502973662,0.32082922013820336,0.09097688292319164
xstest,0.30,4,0.7347931873479319,0.7577777777777778,0.24,0.245
jailbreakbench,0.30,4,0.8607594936708861,0.8166666666666667,0.25,0.15
aegis_v2,0.30,4,0.7219819111285882,0.640020366598778,0.625414364640884,0.13314447592067988
fortress_dataset,0.30,5,0.8401408450704225,0.8071367884451996,0.3020730503455084,0.11036539895600299
xstest,0.30,5,0.7255813953488373,0.7377777777777778,0.296,0.22
jailbreakbench,0.30,5,0.8167539267015707,0.7666666666666667,0.26,0.22
aegis_v2,0.30,5,0.7261345852895149,0.6435845213849287,0.6287292817679558,0.12370160528800755
fortress_dataset,0.35,1,0.8295841854124063,0.7875955819881053,0.3711747285291214,0.0924683072334079
xstest,0.35,1,0.6886792452830188,0.7066666666666667,0.312,0.27
jailbreakbench,0.35,1,0.8668280871670703,0.8166666666666667,0.34,0.105
aegis_v2,0.35,1,0.7066614725360343,0.6165987780040734,0.6640883977900552,0.14353163361661944
fortress_dataset,0.35,2,0.8202670318384115,0.7769753610875106,0.3770977295162882,0.10663683818046234
xstest,0.35,2,0.6915887850467289,0.7066666666666667,0.32,0.26
jailbreakbench,0.35,2,0.7938144329896907,0.7333333333333333,0.34,0.23
aegis_v2,0.35,2,0.7103393843725335,0.6262729124236253,0.6353591160220995,0.1501416430594901
fortress_dataset,0.35,3,0.8120300751879699,0.7663551401869159,0.39190523198420535,0.11409395973154363
xstest,0.35,3,0.7082405345211581,0.7088888888888889,0.36,0.205
jailbreakbench,0.35,3,0.7958115183246073,0.74,0.3,0.24
aegis_v2,0.35,3,0.6932395466979289,0.6003054989816701,0.6773480662983425,0.16241737488196412
fortress_dataset,0.35,4,0.8028263795423957,0.7510620220900595,0.43237907206317866,0.11036539895600299
xstest,0.35,4,0.7194570135746606,0.7244444444444444,0.332,0.205
jailbreakbench,0.35,4,0.8391959798994975,0.7866666666666666,0.31,0.165
aegis_v2,0.35,4,0.6986518636003172,0.6130346232179226,0.6430939226519337,0.1680830972615675
fortress_dataset,0.35,5,0.8084526244035446,0.7612574341546304,0.40177690029615004,0.11558538404175989
xstest,0.35,5,0.683371298405467,0.6911111111111111,0.356,0.25
jailbreakbench,0.35,5,0.8220551378446115,0.7633333333333333,0.35,0.18
aegis_v2,0.35,5,0.6976744186046512,0.6094704684317719,0.6552486187845303,0.1643059490084986
fortress_dataset,0.40,1,0.7924400944988188,0.7387425658453696,0.4422507403751234,0.12453392990305742
xstest,0.40,1,0.639080459770115,0.6511111111111111,0.384,0.305
jailbreakbench,0.40,1,0.8398058252427184,0.78,0.39,0.135
aegis_v2,0.40,1,0.6869395711500975,0.5911405295315683,0.6906077348066298,0.1680830972615675
fortress_dataset,0.40,2,0.7797979797979798,0.7221750212404418,0.46495557749259625,0.13646532438478748
xstest,0.40,2,0.6284403669724771,0.64,0.396,0.315
jailbreakbench,0.40,2,0.7751937984496124,0.71,0.37,0.25
aegis_v2,0.40,2,0.6918238993710691,0.6008146639511202,0.6685082872928176,0.16902738432483475
fortress_dataset,0.40,3,0.7784109956419711,0.7192013593882752,0.47482724580454094,0.1342281879194631
xstest,0.40,3,0.6622807017543859,0.6577777777777778,0.42,0.245
jailbreakbench,0.40,3,0.7700258397932817,0.7033333333333334,0.38,0.255
aegis_v2,0.40,3,0.6700507614213198,0.5697556008146639,0.7116022099447514,0.18980169971671387
fortress_dataset,0.40,4,0.7688710754843019,0.7060322854715378,0.49555774925962487,0.14168530947054436
xstest,0.40,4,0.6817155756207675,0.6866666666666666,0.368,0.245
jailbreakbench,0.40,4,0.8241206030150754,0.7666666666666667,0.34,0.18
aegis_v2,0.40,4,0.6737756714060031,0.5794297352342159,0.6850828729281768,0.19452313503305005
fortress_dataset,0.40,5,0.7726507241495453,0.7132540356839422,0.47482724580454094,0.14466815809097688
xstest,0.40,5,0.6279569892473118,0.6155555555555555,0.476,0.27
jailbreakbench,0.40,5,0.7821782178217822,0.7066666666666667,0.46,0.21
aegis_v2,0.40,5,0.6722222222222223,0.5794297352342159,0.6784530386740332,0.20018885741265344
fortress_dataset,0.45,1,0.7554658594012782,0.6911639762107051,0.5024679170779862,0.16256524981357195
xstest,0.45,1,0.5954545454545455,0.6044444444444445,0.436,0.345
jailbreakbench,0.45,1,0.8184019370460048,0.75,0.44,0.155
aegis_v2,0.45,1,0.6611764705882353,0.560081466395112,0.7160220994475138,0.20396600566572237
fortress_dataset,0.45,2,0.7414829659318637,0.6711979609175871,0.5360315893385982,0.17225950782997762
xstest,0.45,2,0.6075388026607539,0.6066666666666667,0.456,0.315
jailbreakbench,0.45,2,0.6330532212885154,0.5633333333333334,0.44,0.435
aegis_v2,0.45,2,0.6634844868735084,0.5692464358452138,0.6861878453038674,0.21246458923512748
fortress_dataset,0.45,3,0.7368770764119601,0.6635514018691588,0.5528134254689042,0.17300521998508575
xstest,0.45,3,0.6209850107066381,0.6066666666666667,0.488,0.275
jailbreakbench,0.45,3,0.7146529562982005,0.63,0.5,0.305
aegis_v2,0.45,3,0.65078125,0.544806517311609,0.7381215469613259,0.21340887629839472
fortress_dataset,0.45,4,0.7354795884500498,0.6614273576890399,0.5567620927936822,0.17375093214019388
xstest,0.45,4,0.6311111111111111,0.6311111111111111,0.432,0.29
jailbreakbench,0.45,4,0.7919799498746867,0.7233333333333334,0.41,0.21
aegis_v2,0.45,4,0.647876141325923,0.5483706720977597,0.7116022099447514,0.22946175637393768
fortress_dataset,0.45,5,0.7321965897693079,0.6597281223449448,0.5478775913129319,0.18344519015659955
xstest,0.45,5,0.5840336134453782,0.56,0.548,0.305
jailbreakbench,0.45,5,0.699228791773779,0.61,0.53,0.32
aegis_v2,0.45,5,0.6500198176773682,0.5504073319755601,0.7116022099447514,0.22568460812086874
fortress_dataset,0.50,1,0.701766304347826,0.627017841971113,0.562685093780849,0.2296793437733035
xstest,0.50,1,0.5506607929515418,0.5466666666666666,0.516,0.375
jailbreakbench,0.50,1,0.7942583732057417,0.7133333333333334,0.52,0.17
aegis_v2,0.50,1,0.6228209191759112,0.515274949083503,0.7502762430939226,0.2577903682719547
fortress_dataset,0.50,2,0.6964643095396932,0.6134239592183517,0.6051332675222113,0.2214765100671141
xstest,0.50,2,0.540084388185654,0.5155555555555555,0.584,0.36
jailbreakbench,0.50,2,0.574585635359116,0.4866666666666667,0.58,0.48
aegis_v2,0.50,2,0.6253476360746921,0.519857433808554,0.7414364640883978,0.25684608120868746
fortress_dataset,0.50,3,0.68335001668335,0.596856414613424,0.6238894373149062,0.23639075316927666
xstest,0.50,3,0.5658747300215983,0.5533333333333333,0.528,0.345
jailbreakbench,0.50,3,0.7175572519083969,0.63,0.52,0.295
aegis_v2,0.50,3,0.6076649545634136,0.4943991853360489,0.7767955801104972,0.2738432483474976
fortress_dataset,0.50,4,0.6813040585495675,0.5930331350892099,0.6327739387956565,0.23639075316927666
xstest,0.50,4,0.592274678111588,0.5777777777777777,0.512,0.31
jailbreakbench,0.50,4,0.7647058823529411,0.68,0.52,0.22
aegis_v2,0.50,4,0.6313694267515924,0.5285132382892057,0.7292817679558011,0.251180358829084
fortress_dataset,0.50,5,0.6795856999665887,0.592608326253186,0.6268509378084897,0.24161073825503357
xstest,0.50,5,0.5428571428571428,0.5022222222222222,0.628,0.335
jailbreakbench,0.50,5,0.6597402597402597,0.5633333333333334,0.58,0.365
aegis_v2,0.50,5,0.6290003951007507,0.5218940936863544,0.7469613259668508,0.24834749763928235
