,model,group,num
0,GPT-4o-mini,pd_privacy_dummy_defect_cot,5.0
1,GPT-4o-mini,pd_privacy_dummy_defect_survival_cot,5.0
2,GPT-4o-mini,pd_production_dummy_defect_cot,5.0
3,GPT-4o-mini,pd_production_dummy_defect_survival_cot,5.0
4,GPT-4o-mini,pd_venture_dummy_defect_cot,5.0
5,GPT-4o-mini,pd_venture_dummy_defect_survival_cot,5.0
6,GPT-4o-mini,pg_privacy_dummy_defect_cot,5.0
7,GPT-4o-mini,pg_privacy_dummy_defect_survival_cot,5.0
8,GPT-4o-mini,pg_production_dummy_defect_cot,5.0
9,GPT-4o-mini,pg_production_dummy_defect_survival_cot,5.0
10,GPT-4o-mini,pg_venture_dummy_defect_cot,5.0
11,GPT-4o-mini,pg_venture_dummy_defect_survival_cot,5.0
12,GPT-4o,pd_privacy_dummy_defect_cot,5.0
13,GPT-4o,pd_privacy_dummy_defect_survival_cot,5.0
14,GPT-4o,pd_production_dummy_defect_cot,5.0
15,GPT-4o,pd_production_dummy_defect_survival_cot,5.0
16,GPT-4o,pd_venture_dummy_defect_cot,5.0
17,GPT-4o,pd_venture_dummy_defect_survival_cot,5.0
18,GPT-4o,pg_privacy_dummy_defect_cot,5.0
19,GPT-4o,pg_privacy_dummy_defect_survival_cot,5.0
20,GPT-4o,pg_production_dummy_defect_cot,5.0
21,GPT-4o,pg_production_dummy_defect_survival_cot,5.0
22,GPT-4o,pg_venture_dummy_defect_cot,5.0
23,GPT-4o,pg_venture_dummy_defect_survival_cot,5.0
24,o3-mini,pd_privacy_dummy_defect_cot,5.0
25,o3-mini,pd_privacy_dummy_defect_survival_cot,5.0
26,o3-mini,pd_production_dummy_defect_cot,5.0
27,o3-mini,pd_production_dummy_defect_survival_cot,5.0
28,o3-mini,pd_venture_dummy_defect_cot,5.0
29,o3-mini,pd_venture_dummy_defect_survival_cot,5.0
30,o3-mini,pg_privacy_dummy_defect_cot,5.0
31,o3-mini,pg_privacy_dummy_defect_survival_cot,5.0
32,o3-mini,pg_production_dummy_defect_cot,5.0
33,o3-mini,pg_production_dummy_defect_survival_cot,5.0
34,o3-mini,pg_venture_dummy_defect_cot,5.0
35,o3-mini,pg_venture_dummy_defect_survival_cot,5.0
36,Llama-3.3-70B,pd_privacy_dummy_defect_cot,5.0
37,Llama-3.3-70B,pd_privacy_dummy_defect_survival_cot,5.0
38,Llama-3.3-70B,pd_production_dummy_defect_cot,5.0
39,Llama-3.3-70B,pd_production_dummy_defect_survival_cot,5.0
40,Llama-3.3-70B,pd_venture_dummy_defect_cot,5.0
41,Llama-3.3-70B,pd_venture_dummy_defect_survival_cot,5.0
42,Llama-3.3-70B,pg_privacy_dummy_defect_cot,5.0
43,Llama-3.3-70B,pg_privacy_dummy_defect_survival_cot,5.0
44,Llama-3.3-70B,pg_production_dummy_defect_cot,5.0
45,Llama-3.3-70B,pg_production_dummy_defect_survival_cot,5.0
46,Llama-3.3-70B,pg_venture_dummy_defect_cot,5.0
47,Llama-3.3-70B,pg_venture_dummy_defect_survival_cot,5.0
48,Deepseek-V3,pd_privacy_dummy_defect_cot,5.0
49,Deepseek-V3,pd_privacy_dummy_defect_survival_cot,5.0
50,Deepseek-V3,pd_production_dummy_defect_cot,5.0
51,Deepseek-V3,pd_production_dummy_defect_survival_cot,5.0
52,Deepseek-V3,pd_venture_dummy_defect_cot,5.0
53,Deepseek-V3,pd_venture_dummy_defect_survival_cot,5.0
54,Deepseek-V3,pg_privacy_dummy_defect_cot,5.0
55,Deepseek-V3,pg_privacy_dummy_defect_survival_cot,5.0
56,Deepseek-V3,pg_production_dummy_defect_cot,5.0
57,Deepseek-V3,pg_production_dummy_defect_survival_cot,5.0
58,Deepseek-V3,pg_venture_dummy_defect_cot,5.0
59,Deepseek-V3,pg_venture_dummy_defect_survival_cot,5.0
60,Deepseek-R1,pd_privacy_dummy_defect_cot,5.0
61,Deepseek-R1,pd_privacy_dummy_defect_survival_cot,5.0
62,Deepseek-R1,pd_production_dummy_defect_cot,5.0
63,Deepseek-R1,pd_production_dummy_defect_survival_cot,5.0
64,Deepseek-R1,pd_venture_dummy_defect_cot,5.0
65,Deepseek-R1,pd_venture_dummy_defect_survival_cot,5.0
66,Deepseek-R1,pg_privacy_dummy_defect_cot,5.0
67,Deepseek-R1,pg_privacy_dummy_defect_survival_cot,5.0
68,Deepseek-R1,pg_production_dummy_defect_cot,5.0
69,Deepseek-R1,pg_production_dummy_defect_survival_cot,5.0
70,Deepseek-R1,pg_venture_dummy_defect_cot,5.0
71,Deepseek-R1,pg_venture_dummy_defect_survival_cot,5.0
72,Claude-3.7-Sonnet,pd_privacy_dummy_defect_cot,5.0
73,Claude-3.7-Sonnet,pd_privacy_dummy_defect_survival_cot,5.0
74,Claude-3.7-Sonnet,pd_production_dummy_defect_cot,5.0
75,Claude-3.7-Sonnet,pd_production_dummy_defect_survival_cot,5.0
76,Claude-3.7-Sonnet,pd_venture_dummy_defect_cot,5.0
77,Claude-3.7-Sonnet,pd_venture_dummy_defect_survival_cot,5.0
78,Claude-3.7-Sonnet,pg_privacy_dummy_defect_cot,5.0
79,Claude-3.7-Sonnet,pg_privacy_dummy_defect_survival_cot,5.0
80,Claude-3.7-Sonnet,pg_production_dummy_defect_cot,5.0
81,Claude-3.7-Sonnet,pg_production_dummy_defect_survival_cot,5.0
82,Claude-3.7-Sonnet,pg_venture_dummy_defect_cot,5.0
83,Claude-3.7-Sonnet,pg_venture_dummy_defect_survival_cot,5.0
84,Gemini-2.5-Flash,pd_privacy_dummy_defect_cot,5.0
85,Gemini-2.5-Flash,pd_privacy_dummy_defect_survival_cot,5.0
86,Gemini-2.5-Flash,pd_production_dummy_defect_cot,5.0
87,Gemini-2.5-Flash,pd_production_dummy_defect_survival_cot,5.0
88,Gemini-2.5-Flash,pd_venture_dummy_defect_cot,5.0
89,Gemini-2.5-Flash,pd_venture_dummy_defect_survival_cot,5.0
90,Gemini-2.5-Flash,pg_privacy_dummy_defect_cot,5.0
91,Gemini-2.5-Flash,pg_privacy_dummy_defect_survival_cot,5.0
92,Gemini-2.5-Flash,pg_production_dummy_defect_cot,5.0
93,Gemini-2.5-Flash,pg_production_dummy_defect_survival_cot,5.0
94,Gemini-2.5-Flash,pg_venture_dummy_defect_cot,5.0
95,Gemini-2.5-Flash,pg_venture_dummy_defect_survival_cot,5.0
96,Qwen-3-235B-A22B,pd_privacy_dummy_defect_cot,5.0
97,Qwen-3-235B-A22B,pd_privacy_dummy_defect_survival_cot,5.0
98,Qwen-3-235B-A22B,pd_production_dummy_defect_cot,5.0
99,Qwen-3-235B-A22B,pd_production_dummy_defect_survival_cot,5.0
100,Qwen-3-235B-A22B,pd_venture_dummy_defect_cot,5.0
101,Qwen-3-235B-A22B,pd_venture_dummy_defect_survival_cot,5.0
102,Qwen-3-235B-A22B,pg_privacy_dummy_defect_cot,5.0
103,Qwen-3-235B-A22B,pg_privacy_dummy_defect_survival_cot,5.0
104,Qwen-3-235B-A22B,pg_production_dummy_defect_cot,5.0
105,Qwen-3-235B-A22B,pg_production_dummy_defect_survival_cot,5.0
106,Qwen-3-235B-A22B,pg_venture_dummy_defect_cot,5.0
107,Qwen-3-235B-A22B,pg_venture_dummy_defect_survival_cot,5.0
