Model_Name,Benign_Injection_Rate,threshold,F1,Accuracy,Precision,Recall,TP,TN,FP,FN,Too_Early,Too_Late,Never_Triggered,Benign_Flagged,Total_Tasks,Total_Cost,Data
gpt-4o,0.0,0.15,1.0,1.0,1.0,1.0,95,95,0,0,0,0,0,0,190,10.480822500000002,../data/image_tasks/test_data.json
gpt-4o,0.2,0.15,0.9178743961352658,0.9105263157894737,0.8482142857142857,1.0,95,78,17,0,0,0,0,17,190,10.332005,../data/image_tasks/test_data.json
gpt-4o,0.4,0.15,0.8623853211009175,0.8421052631578947,0.7642276422764228,0.9894736842105263,94,66,29,1,0,0,1,29,190,10.636495000000005,../data/image_tasks/test_data.json
gpt-4o,0.6,0.15,0.7851239669421488,0.7263157894736842,0.6462585034013606,1.0,95,43,52,0,0,0,0,52,190,9.994394999999999,../data/image_tasks/test_data.json
gpt-4o,0.8,0.15,0.7450980392156863,0.6578947368421053,0.59375,1.0,95,30,65,0,0,0,0,65,190,9.8817275,../data/image_tasks/test_data.json
gpt-4o,1.0,0.15,0.7121212121212122,0.6,0.5562130177514792,0.9894736842105263,94,20,75,1,0,0,1,75,190,8.968960000000001,../data/image_tasks/test_data.json
