run_id,tests,patch,model,submitted,completed,resolved,unresolved,errors,empty_patches,completion_rate,resolve_rate
mybatch.dataset.baseline.20241103_OpenHands-CodeAct-2.1-sonnet-20241022.filtered,dataset,baseline,20241103_OpenHands-CodeAct-2.1-sonnet-20241022.filtered,217,215,62,153,2,0,0.9907834101382489,0.2857142857142857
mybatch.dataset.gold.20241103_OpenHands-CodeAct-2.1-sonnet-20241022.filtered,dataset,gold,20241103_OpenHands-CodeAct-2.1-sonnet-20241022.filtered,2294,214,212,2,3,0,0.09328683522231909,0.09241499564080209
mybatch.dataset.model.20241103_OpenHands-CodeAct-2.1-sonnet-20241022.filtered,dataset,model,20241103_OpenHands-CodeAct-2.1-sonnet-20241022.filtered,217,206,204,2,11,0,0.9493087557603687,0.9400921658986175
mybatch.te.baseline.20241103_OpenHands-CodeAct-2.1-sonnet-20241022.filtered,te,baseline,20241103_OpenHands-CodeAct-2.1-sonnet-20241022.filtered,217,217,1,216,0,0,1.0,0.004608294930875576
mybatch.te.gold.20241103_OpenHands-CodeAct-2.1-sonnet-20241022.filtered,te,gold,20241103_OpenHands-CodeAct-2.1-sonnet-20241022.filtered,2294,216,199,17,1,0,0.09415867480383609,0.08674803836094158
mybatch.te.model.20241103_OpenHands-CodeAct-2.1-sonnet-20241022.filtered,te,model,20241103_OpenHands-CodeAct-2.1-sonnet-20241022.filtered,217,208,191,17,9,0,0.9585253456221198,0.880184331797235
mybatch.dataset.baseline.20241121_autocoderover-v2.0-claude-3-5-sonnet-20241022.filtered,dataset,baseline,20241121_autocoderover-v2.0-claude-3-5-sonnet-20241022.filtered,217,215,62,153,2,0,0.9907834101382489,0.2857142857142857
mybatch.dataset.gold.20241121_autocoderover-v2.0-claude-3-5-sonnet-20241022.filtered,dataset,gold,20241121_autocoderover-v2.0-claude-3-5-sonnet-20241022.filtered,2294,214,211,3,3,0,0.09328683522231909,0.0919790758500436
mybatch.dataset.model.20241121_autocoderover-v2.0-claude-3-5-sonnet-20241022.filtered,dataset,model,20241121_autocoderover-v2.0-claude-3-5-sonnet-20241022.filtered,217,214,212,2,3,0,0.9861751152073732,0.9769585253456221
mybatch.te.baseline.20241121_autocoderover-v2.0-claude-3-5-sonnet-20241022.filtered,te,baseline,20241121_autocoderover-v2.0-claude-3-5-sonnet-20241022.filtered,217,217,1,216,0,0,1.0,0.004608294930875576
mybatch.te.gold.20241121_autocoderover-v2.0-claude-3-5-sonnet-20241022.filtered,te,gold,20241121_autocoderover-v2.0-claude-3-5-sonnet-20241022.filtered,2294,216,200,16,1,0,0.09415867480383609,0.08718395815170009
mybatch.te.model.20241121_autocoderover-v2.0-claude-3-5-sonnet-20241022.filtered,te,model,20241121_autocoderover-v2.0-claude-3-5-sonnet-20241022.filtered,217,217,200,17,0,0,1.0,0.9216589861751152
mybatch.dataset.baseline.20250227_sweagent-claude-3-7-20250219.filtered,dataset,baseline,20250227_sweagent-claude-3-7-20250219.filtered,217,215,62,153,2,0,0.9907834101382489,0.2857142857142857
mybatch.dataset.gold.20250227_sweagent-claude-3-7-20250219.filtered,dataset,gold,20250227_sweagent-claude-3-7-20250219.filtered,2294,214,214,0,3,0,0.09328683522231909,0.09328683522231909
mybatch.dataset.model.20250227_sweagent-claude-3-7-20250219.filtered,dataset,model,20250227_sweagent-claude-3-7-20250219.filtered,217,215,215,0,2,0,0.9907834101382489,0.9907834101382489
mybatch.te.baseline.20250227_sweagent-claude-3-7-20250219.filtered,te,baseline,20250227_sweagent-claude-3-7-20250219.filtered,217,217,2,215,0,0,1.0,0.009216589861751152
mybatch.te.gold.20250227_sweagent-claude-3-7-20250219.filtered,te,gold,20250227_sweagent-claude-3-7-20250219.filtered,2294,216,198,18,1,0,0.09415867480383609,0.08631211857018309
mybatch.te.model.20250227_sweagent-claude-3-7-20250219.filtered,te,model,20250227_sweagent-claude-3-7-20250219.filtered,217,217,201,16,0,0,1.0,0.9262672811059908
