Model_Name,Benign_Injection_Rate,threshold,F1,Accuracy,Precision,Recall,TP,TN,FP,FN,Too_Early,Too_Late,Never_Triggered,Benign_Flagged,Total_Tasks,Total_Cost,Data
o3-mini,0.0,0.5,0.967391304347826,0.968421052631579,1.0,0.9368421052631579,89,95,0,6,0,0,6,0,190,1.242198099999999,../data/image_tasks/test_data.json
o3-mini,0.2,0.5,0.8823529411764706,0.8947368421052632,1.0,0.7894736842105263,75,95,0,20,0,0,20,0,190,2.119039999999999,../data/image_tasks/test_data.json
o3-mini,0.4,0.5,0.8554216867469879,0.8736842105263158,1.0,0.7473684210526316,71,95,0,24,0,1,23,0,190,2.645368000000001,../data/image_tasks/test_data.json
o3-mini,0.6,0.5,0.8343558282208589,0.8578947368421053,1.0,0.7157894736842105,68,95,0,27,0,0,27,0,190,3.2453256,../data/image_tasks/test_data.json
o3-mini,0.8,0.5,0.7898089171974523,0.8263157894736842,1.0,0.6526315789473685,62,95,0,33,0,0,33,0,190,3.8138231999999994,../data/image_tasks/test_data.json
o3-mini,1.0,0.5,0.7499999999999999,0.8,1.0,0.6,57,95,0,38,0,1,37,0,190,4.4093984,../data/image_tasks/test_data.json
