model,right_rate,right,wrong,bad_domain,all
textgrad_nl_Qwen2.5-0.5B-Instruct,0.000,0,0,283,283
textgrad_nl_Qwen2.5-1.5B-Instruct,0.007,2,0,275,277
textgrad_nl_Qwen2.5-14B-Instruct,0.526,72,19,46,137
textgrad_nl_Qwen2.5-32B-Instruct,0.585,55,8,31,94
textgrad_nl_Qwen2.5-3B-Instruct,0.080,20,1,229,250
textgrad_nl_Qwen2.5-72B-Instruct,0.508,63,19,42,124
textgrad_nl_Qwen2.5-7B-Instruct,0.140,36,20,201,257
textgrad_prob_Qwen2.5-0.5B-Instruct,0.000,0,0,324,324
textgrad_prob_Qwen2.5-1.5B-Instruct,0.000,0,1,322,323
textgrad_prob_Qwen2.5-14B-Instruct,0.517,61,23,34,118
textgrad_prob_Qwen2.5-32B-Instruct,0.711,54,8,14,76
textgrad_prob_Qwen2.5-3B-Instruct,0.006,2,1,317,320
textgrad_prob_Qwen2.5-72B-Instruct,0.580,51,18,19,88
textgrad_prob_Qwen2.5-7B-Instruct,0.230,48,36,125,209
