experiment run details:
  dataset: hoi
  path: /gpfs/mariana/home/envomp/bongard/big_hake/
  prompt method: direct
  prompt structure: interleaved_test_first

---------------------------------------
  test split name: test_seen_obj_seen_act
---------------------------------------

0 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
1 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
2 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
3 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
4 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
5 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
6 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
7 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
8 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
9 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
10 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
11 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
12 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
13 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
14 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
15 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
16 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
17 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
18 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
19 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
20 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
21 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
22 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
23 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
24 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
25 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
26 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
27 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
28 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
29 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
30 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
31 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
32 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
33 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
34 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
35 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
36 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
37 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
38 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
39 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
40 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
41 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
42 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
43 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
44 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
45 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
46 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
47 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
48 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
49 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
50 | expected:'cat_2' | got='cat_1 | full: [' cat_1']'
51 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
52 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
53 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
54 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
55 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
56 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
57 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
58 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
59 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
60 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
61 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
62 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
63 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
64 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
65 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
66 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
67 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
68 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
69 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
70 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
71 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
72 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
73 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
74 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
75 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
76 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
77 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
78 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
79 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
80 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
81 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
82 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
83 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
84 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
85 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
86 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
87 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
88 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
89 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
90 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
91 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
92 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
93 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
94 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
95 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
96 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
97 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
98 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
99 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
100 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
101 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
102 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
103 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
104 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
105 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
106 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
107 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
108 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
109 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
110 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
111 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
112 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
113 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
114 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
115 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
116 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
117 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
118 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
119 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
120 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
121 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
122 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
123 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
124 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
125 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
126 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
127 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
128 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
129 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
130 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
131 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
132 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
133 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
134 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
135 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
136 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
137 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
138 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
139 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
140 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
141 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
142 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
143 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
144 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
145 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
146 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
147 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
148 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
149 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
150 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
151 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
152 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
153 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
154 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
155 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
156 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
157 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
158 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
159 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
160 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
161 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
162 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
163 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
164 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
165 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
166 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
167 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
168 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
169 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
170 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
171 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
172 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
173 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
174 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
175 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
176 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
177 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
178 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
179 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
180 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
181 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
182 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
183 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
184 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
185 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
186 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
187 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
188 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
189 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
190 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
191 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
192 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
193 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
194 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
195 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
196 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
197 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
198 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
199 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
---------------------------------------
Summary for Split 'test_seen_obj_seen_act':
 results: {'correct': {'cat_1': 6, 'cat_2': 99}, 'incorrect': {'cat_1': 94, 'cat_2': 1}}
 accuracy: 52.50%

---------------------------------------
  test split name: test_seen_obj_unseen_act
---------------------------------------

0 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
1 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
2 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
3 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
4 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
5 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
6 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
7 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
8 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
9 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
10 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
11 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
12 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
13 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
14 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
15 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
16 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
17 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
18 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
19 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
20 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
21 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
22 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
23 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
24 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
25 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
26 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
27 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
28 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
29 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
30 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
31 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
32 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
33 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
34 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
35 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
36 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
37 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
38 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
39 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
40 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
41 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
42 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
43 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
44 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
45 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
46 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
47 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
48 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
49 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
50 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
51 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
52 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
53 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
54 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
55 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
56 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
57 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
58 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
59 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
60 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
61 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
62 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
63 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
64 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
65 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
66 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
67 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
68 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
69 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
70 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
71 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
72 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
73 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
74 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
75 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
76 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
77 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
78 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
79 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
80 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
81 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
82 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
83 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
84 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
85 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
86 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
87 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
88 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
89 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
90 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
91 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
92 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
93 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
94 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
95 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
96 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
97 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
98 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
99 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
100 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
101 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
102 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
103 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
104 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
105 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
106 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
107 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
108 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
109 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
110 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
111 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
112 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
113 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
114 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
115 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
116 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
117 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
118 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
119 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
120 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
121 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
122 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
123 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
124 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
125 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
126 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
127 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
128 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
129 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
130 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
131 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
132 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
133 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
134 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
135 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
136 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
137 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
138 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
139 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
140 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
141 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
142 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
143 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
144 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
145 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
146 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
147 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
148 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
149 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
150 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
151 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
152 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
153 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
154 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
155 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
156 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
157 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
158 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
159 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
160 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
161 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
162 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
163 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
164 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
165 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
166 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
167 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
168 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
169 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
170 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
171 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
172 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
173 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
174 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
175 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
176 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
177 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
178 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
179 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
180 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
181 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
182 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
183 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
184 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
185 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
186 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
187 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
188 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
189 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
190 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
191 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
192 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
193 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
194 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
195 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
196 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
197 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
198 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
199 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
---------------------------------------
Summary for Split 'test_seen_obj_unseen_act':
 results: {'correct': {'cat_1': 9, 'cat_2': 100}, 'incorrect': {'cat_1': 91, 'cat_2': 0}}
 accuracy: 54.50%

---------------------------------------
  test split name: test_unseen_obj_seen_act
---------------------------------------

0 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
1 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
2 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
3 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
4 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
5 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
6 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
7 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
8 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
9 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
10 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
11 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
12 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
13 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
14 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
15 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
16 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
17 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
18 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
19 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
20 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
21 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
22 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
23 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
24 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
25 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
26 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
27 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
28 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
29 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
30 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
31 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
32 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
33 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
34 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
35 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
36 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
37 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
38 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
39 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
40 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
41 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
42 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
43 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
44 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
45 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
46 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
47 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
48 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
49 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
50 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
51 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
52 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
53 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
54 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
55 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
56 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
57 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
58 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
59 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
60 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
61 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
62 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
63 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
64 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
65 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
66 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
67 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
68 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
69 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
70 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
71 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
72 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
73 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
74 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
75 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
76 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
77 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
78 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
79 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
80 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
81 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
82 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
83 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
84 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
85 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
86 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
87 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
88 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
89 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
90 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
91 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
92 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
93 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
94 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
95 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
96 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
97 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
98 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
99 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
100 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
101 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
102 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
103 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
104 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
105 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
106 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
107 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
108 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
109 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
110 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
111 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
112 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
113 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
114 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
115 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
116 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
117 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
118 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
119 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
120 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
121 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
122 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
123 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
124 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
125 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
126 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
127 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
128 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
129 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
130 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
131 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
132 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
133 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
134 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
135 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
136 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
137 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
138 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
139 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
140 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
141 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
142 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
143 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
144 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
145 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
146 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
147 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
148 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
149 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
150 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
151 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
152 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
153 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
154 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
155 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
156 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
157 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
158 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
159 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
160 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
161 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
162 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
163 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
164 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
165 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
166 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
167 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
168 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
169 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
170 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
171 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
172 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
173 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
174 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
175 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
176 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
177 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
178 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
179 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
180 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
181 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
182 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
183 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
184 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
185 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
186 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
187 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
188 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
189 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
190 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
191 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
192 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
193 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
194 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
195 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
196 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
197 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
198 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
199 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
---------------------------------------
Summary for Split 'test_unseen_obj_seen_act':
 results: {'correct': {'cat_1': 7, 'cat_2': 100}, 'incorrect': {'cat_1': 93, 'cat_2': 0}}
 accuracy: 53.50%

---------------------------------------
  test split name: test_unseen_obj_unseen_act
---------------------------------------

0 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
1 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
2 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
3 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
4 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
5 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
6 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
7 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
8 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
9 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
10 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
11 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
12 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
13 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
14 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
15 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
16 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
17 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
18 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
19 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
20 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
21 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
22 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
23 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
24 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
25 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
26 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
27 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
28 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
29 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
30 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
31 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
32 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
33 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
34 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
35 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
36 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
37 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
38 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
39 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
40 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
41 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
42 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
43 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
44 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
45 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
46 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
47 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
48 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
49 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
50 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
51 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
52 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
53 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
54 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
55 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
56 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
57 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
58 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
59 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
60 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
61 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
62 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
63 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
64 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
65 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
66 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
67 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n\n**Reasoning:**\n\nThe rule appears to be whether or not the person in the image is actively adjusting or tying their tie. All the images in `cat_2` show someone in the process of tying or adjusting their tie. The images in `cat_1` show people with their ties already tied, or in poses where they are not actively adjusting it.\n\nThe test image shows a wall of ties, not a person adjusting a tie. Therefore, it belongs to `cat_1`.']'
68 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
69 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
70 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
71 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
72 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
73 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
74 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
75 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
76 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
77 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
78 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
79 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
80 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
81 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
82 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
83 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
84 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
85 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
86 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
87 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
88 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
89 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
90 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
91 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
92 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
93 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
94 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
95 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
96 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
97 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
98 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
99 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
100 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
101 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
102 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
103 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
104 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
105 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
106 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
107 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
108 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
109 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
110 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
111 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
112 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
113 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
114 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
115 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
116 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
117 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
118 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
119 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
120 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
121 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
122 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
123 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
124 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
125 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
126 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
127 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
128 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
129 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
130 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
131 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
132 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
133 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
134 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
135 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
136 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
137 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
138 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
139 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
140 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
141 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
142 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
143 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
144 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
145 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
146 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
147 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
148 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
149 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
150 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
151 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
152 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
153 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
154 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
155 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
156 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
157 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
158 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
159 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
160 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
161 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
162 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
163 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
164 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
165 | expected:'cat_1' | got='cat_1 | full: [' cat_1']'
166 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
167 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
168 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
169 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
170 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
171 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
172 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
173 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
174 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
175 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
176 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
177 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
178 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
179 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
180 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
181 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
182 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
183 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
184 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
185 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
186 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
187 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
188 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
189 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
190 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
191 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
192 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
193 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
194 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
195 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
196 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
197 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
198 | expected:'cat_2' | got='cat_2 | full: [' cat_2']'
199 | expected:'cat_1' | got='cat_2 | full: [' cat_2']'
---------------------------------------
Summary for Split 'test_unseen_obj_unseen_act':
 results: {'correct': {'cat_1': 14, 'cat_2': 100}, 'incorrect': {'cat_1': 86, 'cat_2': 0}}
 accuracy: 57.00%

---------------------------------------
