Model_Name,Benign_Injection_Rate,threshold,F1,Accuracy,Precision,Recall,TP,TN,FP,FN,Too_Early,Too_Late,Never_Triggered,Benign_Flagged,Total_Tasks,Total_Cost,Data
gpt-4o,0.0,0.5,0.6532258064516129,0.7425149700598802,1.0,0.48502994011976047,81,167,0,86,0,34,52,0,334,0.49246499999999993,../data/decomposed_queries/test_data.json
gpt-4o,0.2,0.5,0.5726495726495727,0.7005988023952096,1.0,0.40119760479041916,67,167,0,100,0,43,57,0,334,0.6490424999999994,../data/decomposed_queries/test_data.json
gpt-4o,0.4,0.5,0.4886877828054298,0.6616766467065869,1.0,0.32335329341317365,54,167,0,113,0,45,68,0,334,0.8196500000000003,../data/decomposed_queries/test_data.json
gpt-4o,0.6,0.5,0.3942307692307692,0.6227544910179641,1.0,0.24550898203592814,41,167,0,126,0,42,84,0,334,1.0465674999999992,../data/decomposed_queries/test_data.json
gpt-4o,0.8,0.5,0.3045685279187817,0.5898203592814372,1.0,0.17964071856287425,30,167,0,137,0,42,95,0,334,1.2926399999999998,../data/decomposed_queries/test_data.json
gpt-4o,1.0,0.5,0.26943005181347146,0.5778443113772455,1.0,0.15568862275449102,26,167,0,141,0,30,111,0,334,1.660857500000001,../data/decomposed_queries/test_data.json
