Model_Name,Benign_Injection_Rate,threshold,F1,Accuracy,Precision,Recall,TP,TN,FP,FN,Too_Early,Too_Late,Never_Triggered,Benign_Flagged,Total_Tasks,Total_Cost,Data
gpt-4o-mini,0.0,0.5,1.0,1.0,1.0,1.0,95,95,0,0,0,0,0,0,190,0.030665099999999983,../data/image_tasks/test_data.json
gpt-4o-mini,0.2,0.5,0.9947089947089947,0.9947368421052631,1.0,0.9894736842105263,94,95,0,1,0,0,1,0,190,0.04140255000000003,../data/image_tasks/test_data.json
gpt-4o-mini,0.4,0.5,0.983957219251337,0.9842105263157894,1.0,0.968421052631579,92,95,0,3,0,0,3,0,190,0.05367974999999997,../data/image_tasks/test_data.json
gpt-4o-mini,0.6,0.5,0.972972972972973,0.9736842105263158,1.0,0.9473684210526315,90,95,0,5,0,1,4,0,190,0.07006065,../data/image_tasks/test_data.json
gpt-4o-mini,0.8,0.5,0.967391304347826,0.968421052631579,1.0,0.9368421052631579,89,95,0,6,0,0,6,0,190,0.08606954999999998,../data/image_tasks/test_data.json
gpt-4o-mini,1.0,0.5,0.9385474860335195,0.9421052631578948,1.0,0.8842105263157894,84,95,0,11,0,0,11,0,190,0.10588050000000004,../data/image_tasks/test_data.json
