file_name,,pattern-matching-suppression_classification.jsonl,pattern-matching-suppression_classification.jsonl,pattern-matching-suppression_classification.jsonl,prompt-injection_sequence-probability.jsonl,prompt-injection_sequence-probability.jsonl,prompt-injection_sequence-probability.jsonl,redefine_classification.jsonl,redefine_classification.jsonl,redefine_classification.jsonl,strong-local-priors_classification.jsonl,strong-local-priors_classification.jsonl,strong-local-priors_classification.jsonl
alpha,,0.0,1.0,2.0,0.0,1.0,2.0,0.0,1.0,2.0,0.0,1.0,2.0
weakening,model,,,,,,,,,,,,
Generic system prompt,TheBloke/Mixtral-8x7B-v0.1-GPTQ,0.14101609429295417,0.23654707484752707,0.3216683974274999,0.525016342155683,0.5338244310087262,0.5047561823136778,0.6540332291191768,0.6525920123006379,0.6381664803117084,0.4425034035445056,0.4348172381382272,0.4197837628586066
Generic system prompt,davinci-002,0.059260218306534385,0.068296198662849,0.0846790591543016,0.5725267827323834,0.5955506528317343,0.601647856014576,0.5474867107550906,0.5386374092077613,0.5319475866163293,0.13646816250719157,0.10242236675818804,0.08820487491156803
Generic system prompt,gpt-3.5-turbo-instruct,0.2854467883467747,0.29228891398227463,0.30030654450115873,0.8102324623282519,0.8149322779849308,0.8010100576250619,0.5142031104228102,0.5525290852200468,0.5579798367786633,0.5260053676971552,0.5319906538128076,0.5400369987330024
Generic system prompt,gpt2,0.13468045316357952,0.12295949787826115,0.11272102742599875,0.893969292314222,0.8971306764576674,0.8951891326704151,0.6251618802752523,0.6280667384492755,0.6305072014141879,0.004276573508277173,0.003587648351237194,0.0034136123979285208
Generic system prompt,gpt2-large,0.047969276029122404,0.04383419355875893,0.04109563562024193,0.976436442414019,0.9811883992212498,0.9828588322688608,0.641548488146221,0.6615366949212667,0.6787166648488431,0.004517746521709228,0.00372951731151382,0.003660617270130659
Generic system prompt,gpt2-medium,0.05091677647674489,0.05775824924661583,0.0670973157588278,0.897850284227208,0.9257719334415435,0.9382958616187322,0.6093438389810301,0.6167273404031935,0.6227403031425289,0.007243718187006361,0.007165711467359924,0.00784300395242688
Generic system prompt,gpt2-xl,0.01760829195548398,0.02196622773647947,0.028943454944881875,0.8753963853835137,0.923898417319191,0.9477584069925543,0.4777407877730556,0.45667454899079907,0.4437462479454471,0.00437912823036224,0.005175364152147893,0.006713514775080794
Generic system prompt,meta-llama/Llama-2-13b-hf,0.04101648195067631,0.032745165339471596,0.028909866886252616,0.32924257426767756,0.4031850424477455,0.445903525085261,0.5681495982999175,0.5043777159594997,0.4484688426014522,0.4123632272829888,0.3983817528083048,0.3769986406107199
Generic system prompt,meta-llama/Llama-2-7b-hf,0.032330618781529354,0.03231454897748889,0.033824626026398866,0.49640817084809724,0.5241731217654492,0.5393830858385522,0.5594602202845051,0.5331757137191301,0.5179548316893959,0.2090977214760216,0.11915930466665409,0.07577770916413758
Generic system prompt,mistralai/Mistral-7B-v0.1,0.03395918185279792,0.047647106590357195,0.06894307225365301,0.6074028730115913,0.6548517631165833,0.6643102066613239,0.5567198376668732,0.4755763619000221,0.43517196482659826,0.4777821460748936,0.47230180871729455,0.4662815230827553
Generic system prompt,text-ada-001,0.037657244491344846,0.027369257246026145,0.028095887198457497,0.6733150085149292,0.7483408817883686,0.7630989401976767,0.5315277621705726,0.5359893855150466,0.5366845936135864,0.05470801456258171,0.06891653105625754,0.09041339765257282
Only data part,TheBloke/Mixtral-8x7B-v0.1-GPTQ,0.14101609429295417,0.46712963254789164,0.5377538615690246,0.5217078791303762,0.8022941632195171,0.8244027768030151,0.6540332291191768,0.8467694468490147,0.8762795639206383,0.4425034035445056,0.5368454348562799,0.5770312252366292
Only data part,davinci-002,0.059260218306534385,0.09160536326671176,0.13034769684689626,0.5519360200622446,0.6021454416076865,0.6186554736078703,0.5474867107550906,0.7126017013643481,0.7776500326528072,0.13646816250719157,0.23541684689219206,0.2749134121313637
Only data part,gpt-3.5-turbo-instruct,0.2854467883467747,0.293975580894068,0.24355468581462292,0.805318040534848,0.8484592755763561,0.8552798734637685,0.5142031104228102,0.7373832808850315,0.7910246375749691,0.5260053676971552,0.6125913931033348,0.6490859509023651
Only data part,gpt2,0.13468045316357952,0.15342673002717333,0.18310036607176167,0.8862049815895396,0.9443303015868059,0.936097474290063,0.6251618802752523,0.6614573948855224,0.6822580578381671,0.004276573508277173,0.020830411669405427,0.0774353065884287
Only data part,gpt2-large,0.047969276029122404,0.09310974148519974,0.13494181851187206,0.9742228933661482,0.9967508765843742,0.996469723595639,0.641548488146221,0.6657119981007654,0.6680084799952508,0.004517746521709228,0.06442696975531466,0.22917166747448348
Only data part,gpt2-medium,0.05091677647674489,0.026108389595962414,0.023121834006373135,0.8892651619318227,0.9933996299422677,0.9969788096879424,0.6093438389810301,0.6264682545197867,0.625991316477713,0.007243718187006361,0.07451266070143223,0.275695884760456
Only data part,gpt2-xl,0.01760829195548398,0.020960724220252542,0.05172254008655459,0.8688790429857752,0.9838147215266771,0.9900013754617308,0.4777407877730556,0.5504325901231637,0.5922749096744581,0.00437912823036224,0.08450321601407174,0.2662476702038137
Only data part,meta-llama/Llama-2-13b-hf,0.04101648195067631,0.2367043813135099,0.46549624920032134,0.32692513246240024,0.4192852879089312,0.41707865786399667,0.5681495982999175,0.7886796894388782,0.8362343038544399,0.4123632272829888,0.5235644858751849,0.5879358985805638
Only data part,meta-llama/Llama-2-7b-hf,0.032330618781529354,0.11907418688117292,0.24783787235635707,0.4945932952216316,0.5361379757166256,0.5340708761254525,0.5594602202845051,0.7124902507011417,0.7830660114816713,0.2090977214760216,0.35653237597217036,0.4220903516911653
Only data part,mistralai/Mistral-7B-v0.1,0.03395918185279792,0.19860280422821366,0.34523267824907294,0.6050594283167389,0.7703565129348567,0.7776118029740234,0.5567198376668732,0.8370847125063223,0.8723273307974376,0.4777821460748936,0.5969680935847336,0.6687414611427543
Only data part,text-ada-001,0.037657244491344846,0.08023932252585371,0.12851627516024394,0.6654496234603315,0.7968566226784133,0.8212727529383472,0.5315277621705726,0.5311746067385402,0.5313823438086388,0.05470801456258171,0.10209137738214591,0.12714398271213337
