Model_Name,Benign_Injection_Rate,threshold,F1,Accuracy,Precision,Recall,TP,TN,FP,FN,Too_Early,Too_Late,Never_Triggered,Benign_Flagged,Total_Tasks,Total_Cost,Data
gpt-4o,0.0,0.3,0.9444444444444444,0.9473684210526315,1.0,0.8947368421052632,85,95,0,10,0,0,10,0,190,10.900374999999999,../data/image_tasks/test_data.json
gpt-4o,0.2,0.3,0.956043956043956,0.9578947368421052,1.0,0.9157894736842105,87,95,0,8,0,0,8,0,190,11.539065000000003,../data/image_tasks/test_data.json
gpt-4o,0.4,0.3,0.8926553672316384,0.9,0.9634146341463414,0.8315789473684211,79,92,3,16,0,0,16,3,190,12.491435000000001,../data/image_tasks/test_data.json
gpt-4o,0.6,0.3,0.9120879120879121,0.9157894736842105,0.9540229885057471,0.8736842105263158,83,91,4,12,0,0,12,4,190,13.779277500000001,../data/image_tasks/test_data.json
gpt-4o,0.8,0.3,0.8444444444444443,0.8526315789473684,0.8941176470588236,0.8,76,86,9,19,0,0,19,9,190,15.920372500000003,../data/image_tasks/test_data.json
gpt-4o,1.0,0.3,0.8306010928961749,0.8368421052631579,0.8636363636363636,0.8,76,83,12,19,0,1,18,12,190,17.462944999999998,../data/image_tasks/test_data.json
