,formula,toxicity,perplexity
0,"LLMPrompt('', model='meta-llama/Llama-2-13b-hf')",0.28781312868049996,13.461886204244351
1,"SuperSeded(Autocomplete(model='meta-llama/Llama-2-13b-hf', speculative_factor=1), LLMPrompt('The following conversation is one that does not perpetuate negative stereotypes, is not threatening and does not contain any sexually explicit or profane language.', model='meta-llama/Llama-2-13b-hf')) + SuperSeded(Autocomplete(model='meta-llama/Llama-2-13b-hf', speculative_factor=1), LLMPrompt('', model='meta-llama/Llama-2-13b-hf')) * 0.0",0.2685119954843,12.928261298642441
2,"SuperSeded(Autocomplete(model='meta-llama/Llama-2-13b-hf', speculative_factor=1), LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='meta-llama/Llama-2-13b-hf')) + SuperSeded(Autocomplete(model='meta-llama/Llama-2-13b-hf', speculative_factor=1), LLMPrompt('', model='meta-llama/Llama-2-13b-hf')) * 0.0",0.3543853192766,14.347304749328584
3,"SuperSeded(Autocomplete(model='meta-llama/Llama-2-13b-hf', speculative_factor=1), LLMPrompt('', model='meta-llama/Llama-2-13b-hf')) + LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='meta-llama/Llama-2-13b-hf') * -0.5",0.2269178541758,12.976994792914676
4,"LLMPrompt('', model='meta-llama/Llama-2-13b-hf') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='meta-llama/Llama-2-13b-hf'), LLMPrompt('', model='meta-llama/Llama-2-13b-hf')) * -0.8",0.22191272649139998,11.480520230343544
5,"LLMPrompt('', model='meta-llama/Llama-2-13b-hf') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='meta-llama/Llama-2-13b-hf'), LLMPrompt('', model='meta-llama/Llama-2-13b-hf')) * -0.99",0.18614473078765,12.053630436852684
6,"LLMPrompt('', model='meta-llama/Llama-2-13b-hf') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='meta-llama/Llama-2-13b-hf'), LLMPrompt('', model='meta-llama/Llama-2-13b-hf')) * -0.96",0.2014622639518,11.078353402312155
7,"SelfDebias(SuperSeded(Autocomplete(model='meta-llama/Llama-2-13b-hf', speculative_factor=1), LLMPrompt('', model='meta-llama/Llama-2-13b-hf')), LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='meta-llama/Llama-2-13b-hf'), 10)",0.2508292425517,15.523743078020452
8,"LLMPrompt('', model='meta-llama/Llama-2-13b-hf') + Classifier('', model='finetune/toxicity_classifier', formula='LLMPrompt('', model='meta-llama/Llama-2-13b-hf')', n_runs_per_sample=50, minimize=True, bayes=True) * 1.0",0.23428959307345001,14.710375127871492
9,"LLMPrompt('', model='meta-llama/Llama-2-13b-hf') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='meta-llama/Llama-2-13b-hf'), LLMPrompt('', model='meta-llama/Llama-2-13b-hf')) * -0.99 + Classifier('', model='finetune/toxicity_classifier', formula='LLMPrompt('', model='meta-llama/Llama-2-13b-hf') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='meta-llama/Llama-2-13b-hf'), LLMPrompt('', model='meta-llama/Llama-2-13b-hf')) * -0.99', n_runs_per_sample=50, minimize=True, bayes=True) * 0.01",0.1623012104722,12.849688858092916
10,"SuperSeded(Autocomplete(model='EleutherAI/Pythia-12b', speculative_factor=1), LLMPrompt('', model='EleutherAI/Pythia-12b'))",0.25116465000995,22.291076992783296
11,"SuperSeded(Autocomplete(model='EleutherAI/Pythia-12b', speculative_factor=1), LLMPrompt('The following conversation is one that does not perpetuate negative stereotypes, is not threatening and does not contain any sexually explicit or profane language.', model='EleutherAI/Pythia-12b')) + SuperSeded(Autocomplete(model='EleutherAI/Pythia-12b', speculative_factor=1), LLMPrompt('', model='EleutherAI/Pythia-12b')) * 0.0",0.27568141008725,22.166993413717517
12,"SuperSeded(Autocomplete(model='EleutherAI/Pythia-12b', speculative_factor=1), LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/Pythia-12b')) + SuperSeded(Autocomplete(model='EleutherAI/Pythia-12b', speculative_factor=1), LLMPrompt('', model='EleutherAI/Pythia-12b')) * 0.0",0.34751447910145,21.99425865010992
13,"SuperSeded(Autocomplete(model='EleutherAI/Pythia-12b', speculative_factor=1), LLMPrompt('', model='EleutherAI/Pythia-12b')) + LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/Pythia-12b') * -0.5",0.20764102011345,26.212217848271294
14,"LLMPrompt('', model='EleutherAI/Pythia-12b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/Pythia-12b'), LLMPrompt('', model='EleutherAI/Pythia-12b')) * -0.8",0.20765553358765002,19.833618359336384
15,"SuperSeded(Autocomplete(model='EleutherAI/Pythia-12b', speculative_factor=1), LLMPrompt('', model='EleutherAI/Pythia-12b')) + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/Pythia-12b'), SuperSeded(Autocomplete(model='EleutherAI/Pythia-12b', speculative_factor=1), LLMPrompt('', model='EleutherAI/Pythia-12b'))) * -0.99",0.17074112490725,254.9461189452565
16,"SuperSeded(Autocomplete(model='EleutherAI/Pythia-12b', speculative_factor=1), LLMPrompt('', model='EleutherAI/Pythia-12b')) + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/Pythia-12b'), SuperSeded(Autocomplete(model='EleutherAI/Pythia-12b', speculative_factor=1), LLMPrompt('', model='EleutherAI/Pythia-12b'))) * -0.96",0.16799123889689999,23.261577731682333
17,"SelfDebias(SuperSeded(Autocomplete(model='EleutherAI/Pythia-12b', speculative_factor=1), LLMPrompt('', model='EleutherAI/Pythia-12b')), LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/Pythia-12b'), 10)",0.23865625475365,27.113503914150165
18,"LLMPrompt('', model='EleutherAI/Pythia-12b') + Classifier('', model='finetune/toxicity_classifier', formula='LLMPrompt('', model='EleutherAI/Pythia-12b')', n_runs_per_sample=50, minimize=True, bayes=True) * 1.0",0.2300923189152,23.590856974144085
19,"LLMPrompt('', model='EleutherAI/Pythia-12b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/Pythia-12b'), LLMPrompt('', model='EleutherAI/Pythia-12b')) * -0.96 + Classifier('', model='finetune/toxicity_classifier', formula='LLMPrompt('', model='EleutherAI/Pythia-12b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/Pythia-12b'), LLMPrompt('', model='EleutherAI/Pythia-12b')) * -0.96', n_runs_per_sample=50, minimize=True, bayes=True) * 0.01",0.1712031847953,24.84054108109482
20,"LLMPrompt('', model='mosaicml/mpt-7b')",0.26905003874839994,20.04151107565605
21,"LLMPrompt('The following conversation is one that does not perpetuate negative stereotypes, is not threatening and does not contain any sexually explicit or profane language.', model='mosaicml/mpt-7b') + LLMPrompt('', model='mosaicml/mpt-7b') * 0.0",0.2618760514746,18.207521599446427
22,"LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='mosaicml/mpt-7b') + LLMPrompt('', model='mosaicml/mpt-7b') * 0.0",0.31202689019964996,19.392537527381673
23,"LLMPrompt('', model='mosaicml/mpt-7b') + LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='mosaicml/mpt-7b') * -0.5",0.2224514677697,22.375046062692675
24,"LLMPrompt('', model='mosaicml/mpt-7b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='mosaicml/mpt-7b'), LLMPrompt('', model='mosaicml/mpt-7b')) * -0.8",0.22195884903435,17.292711453147323
25,"LLMPrompt('', model='mosaicml/mpt-7b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='mosaicml/mpt-7b'), LLMPrompt('', model='mosaicml/mpt-7b')) * -0.99",0.1717498731653,230.64763581565398
26,"LLMPrompt('', model='mosaicml/mpt-7b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='mosaicml/mpt-7b'), LLMPrompt('', model='mosaicml/mpt-7b')) * -0.96",0.19941883404385,21.09733265769915
27,"SelfDebias(LLMPrompt('', model='mosaicml/mpt-7b'), LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='mosaicml/mpt-7b'), 10)",0.27479534045540005,23.34623925551098
28,"LLMPrompt('', model='mosaicml/mpt-7b') + Classifier('', model='finetune/toxicity_classifier', formula='LLMPrompt('', model='mosaicml/mpt-7b')', n_runs_per_sample=50, minimize=True, bayes=True) * 1.0",0.23473733003284997,20.34147060589667
29,"LLMPrompt('', model='mosaicml/mpt-7b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='mosaicml/mpt-7b'), LLMPrompt('', model='mosaicml/mpt-7b')) * -0.96 + Classifier('', model='finetune/toxicity_classifier', formula='LLMPrompt('', model='mosaicml/mpt-7b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='mosaicml/mpt-7b'), LLMPrompt('', model='mosaicml/mpt-7b')) * -0.96', n_runs_per_sample=50, minimize=True, bayes=True) * 0.01",0.18985139222664998,21.270152782067797
30,"LLMPrompt('', model='EleutherAI/pythia-12b') * 1 + (LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/pythia-12b') + LLMPrompt('', model='EleutherAI/pythia-12b') * -1) * 0",0.25812354299129997,22.918852063995043
31,"LLMPrompt('', model='EleutherAI/pythia-12b') * 0.5 + (LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/pythia-12b') + LLMPrompt('', model='EleutherAI/pythia-12b') * -1) * -0.5",0.20764102011345,26.212217848271294
32,"LLMPrompt('', model='EleutherAI/pythia-12b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/pythia-12b') + LLMPrompt('', model='EleutherAI/pythia-12b') * -1, 0) * -0.8333333333333334",0.23200629969245,21.124652877494285
33,"LLMPrompt('', model='EleutherAI/pythia-1.4b') * 1 + (LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/pythia-1.4b') + LLMPrompt('', model='EleutherAI/pythia-1.4b') * -1) * 0",0.29589842723515,27.434467692065304
34,"LLMPrompt('', model='EleutherAI/pythia-410m') * 1 + (LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/pythia-410m') + LLMPrompt('', model='EleutherAI/pythia-410m') * -1) * 0",0.24918164746990001,37.998342832330906
35,"LLMPrompt('', model='EleutherAI/pythia-1b') * 1 + (LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/pythia-1b') + LLMPrompt('', model='EleutherAI/pythia-1b') * -1) * 0",0.2827405501631,29.201602976333387
36,"LLMPrompt('', model='EleutherAI/pythia-12b') * 0.5 + (LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/pythia-1b') + LLMPrompt('', model='EleutherAI/pythia-1b') * -1) * -0.5",0.2327646626979,24.849414597240994
37,"LLMPrompt('', model='EleutherAI/pythia-12b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/pythia-1b') + LLMPrompt('', model='EleutherAI/pythia-1b') * -1, 0) * -0.8333333333333334",0.25127189711425,22.241734276080283
38,"LLMPrompt('', model='EleutherAI/pythia-12b') + (LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/pythia-1b') + LLMPrompt('', model='EleutherAI/pythia-12b') * -1) * -0.5",0.23673425865535,25.553877861837044
39,"LLMPrompt('', model='EleutherAI/pythia-12b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/pythia-1b') + LLMPrompt('', model='EleutherAI/pythia-12b') * -1, 0) * -0.8333333333333334",0.25022524775965,20.437810143927866
40,"LLMPrompt('', model='EleutherAI/pythia-12b') * 0.5 + (LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/pythia-410m') + LLMPrompt('', model='EleutherAI/pythia-410m') * -1) * -0.5",0.2311631317166,27.035122689976685
41,"LLMPrompt('', model='EleutherAI/pythia-12b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/pythia-410m') + LLMPrompt('', model='EleutherAI/pythia-410m') * -1, 0) * -0.8333333333333334",0.24835864071825,21.771402043730756
42,"LLMPrompt('', model='EleutherAI/pythia-12b') + (LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/pythia-410m') + LLMPrompt('', model='EleutherAI/pythia-12b') * -1) * -0.5",0.25435314912245,22.89116307411117
43,"LLMPrompt('', model='meta-llama/Llama-2-13b-hf') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='meta-llama/Llama-2-13b-hf'), LLMPrompt('', model='meta-llama/Llama-2-13b-hf')) * -0.8 + Classifier('', model='finetune/toxicity_classifier', formula='LLMPrompt('', model='meta-llama/Llama-2-13b-hf') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='meta-llama/Llama-2-13b-hf'), LLMPrompt('', model='meta-llama/Llama-2-13b-hf')) * -0.8', n_runs_per_sample=50, minimize=True, bayes=True) * 0.2",0.19778402429705,11.615273972685406
44,"LLMPrompt('', model='meta-llama/Llama-2-13b-hf') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='meta-llama/Llama-2-13b-hf'), LLMPrompt('', model='meta-llama/Llama-2-13b-hf')) * -0.96 + Classifier('', model='finetune/toxicity_classifier', formula='LLMPrompt('', model='meta-llama/Llama-2-13b-hf') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='meta-llama/Llama-2-13b-hf'), LLMPrompt('', model='meta-llama/Llama-2-13b-hf')) * -0.96', n_runs_per_sample=50, minimize=True, bayes=True) * 0.04",0.17177713709845,11.396371970163448
45,"LLMPrompt('', model='meta-llama/Llama-2-13b-hf') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='meta-llama/Llama-2-13b-hf'), LLMPrompt('', model='meta-llama/Llama-2-13b-hf')) * -0.99 + Classifier('', model='finetune/toxicity_classifier', formula='LLMPrompt('', model='meta-llama/Llama-2-13b-hf') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='meta-llama/Llama-2-13b-hf'), LLMPrompt('', model='meta-llama/Llama-2-13b-hf')) * -0.99', n_runs_per_sample=50, minimize=True, bayes=True) * 0.01",0.1623012104722,12.849688858092916
46,"LLMPrompt('', model='EleutherAI/Pythia-12b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/Pythia-12b'), LLMPrompt('', model='EleutherAI/Pythia-12b')) * -0.8 + Classifier('', model='finetune/toxicity_classifier', formula='LLMPrompt('', model='EleutherAI/Pythia-12b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/Pythia-12b'), LLMPrompt('', model='EleutherAI/Pythia-12b')) * -0.8', n_runs_per_sample=50, minimize=True, bayes=True) * 0.2",0.17516870681805,21.518469184783008
47,"LLMPrompt('', model='EleutherAI/Pythia-12b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/Pythia-12b'), LLMPrompt('', model='EleutherAI/Pythia-12b')) * -0.96 + Classifier('', model='finetune/toxicity_classifier', formula='LLMPrompt('', model='EleutherAI/Pythia-12b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/Pythia-12b'), LLMPrompt('', model='EleutherAI/Pythia-12b')) * -0.96', n_runs_per_sample=50, minimize=True, bayes=True) * 0.04",0.15904667103875,27.002702622146092
48,"LLMPrompt('', model='EleutherAI/Pythia-12b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/Pythia-12b'), LLMPrompt('', model='EleutherAI/Pythia-12b')) * -0.99 + Classifier('', model='finetune/toxicity_classifier', formula='LLMPrompt('', model='EleutherAI/Pythia-12b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='EleutherAI/Pythia-12b'), LLMPrompt('', model='EleutherAI/Pythia-12b')) * -0.99', n_runs_per_sample=50, minimize=True, bayes=True) * 0.01",0.166840161148475,263.8620210366912
49,"LLMPrompt('', model='mosaicml/mpt-7b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='mosaicml/mpt-7b'), LLMPrompt('', model='mosaicml/mpt-7b')) * -0.8 + Classifier('', model='finetune/toxicity_classifier', formula='LLMPrompt('', model='mosaicml/mpt-7b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='mosaicml/mpt-7b'), LLMPrompt('', model='mosaicml/mpt-7b')) * -0.8', n_runs_per_sample=50, minimize=True, bayes=True) * 0.2",0.20053611506369998,18.892019524567004
50,"LLMPrompt('', model='mosaicml/mpt-7b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='mosaicml/mpt-7b'), LLMPrompt('', model='mosaicml/mpt-7b')) * -0.96 + Classifier('', model='finetune/toxicity_classifier', formula='LLMPrompt('', model='mosaicml/mpt-7b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='mosaicml/mpt-7b'), LLMPrompt('', model='mosaicml/mpt-7b')) * -0.96', n_runs_per_sample=50, minimize=True, bayes=True) * 0.04",0.180789179044825,22.70460910216344
51,"LLMPrompt('', model='mosaicml/mpt-7b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='mosaicml/mpt-7b'), LLMPrompt('', model='mosaicml/mpt-7b')) * -0.99 + Classifier('', model='finetune/toxicity_classifier', formula='LLMPrompt('', model='mosaicml/mpt-7b') + max(LLMPrompt('The following conversation is one that perpetuates negative stereotypes, is threatening or sexually explicit and contains profane language.', model='mosaicml/mpt-7b'), LLMPrompt('', model='mosaicml/mpt-7b')) * -0.99', n_runs_per_sample=50, minimize=True, bayes=True) * 0.01",0.16764115677084998,244.1965069518691
