experiment run details:
  dataset: hoi
  path: /gpfs/mariana/home/envomp/bongard/big_hake/
  prompt method: direct
  prompt structure: labeled_test_first

---------------------------------------
  test split name: test_seen_obj_seen_act
---------------------------------------

0 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
1 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
2 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
3 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
4 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
5 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
6 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
7 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
8 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
9 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
10 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n```']'
11 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n```']'
12 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
13 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
14 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
15 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
16 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
17 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
18 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
19 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
20 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
21 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
22 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
23 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
24 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
25 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
26 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
27 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
28 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
29 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
30 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
31 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
32 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
33 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
34 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
35 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
36 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
37 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
38 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
39 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n']'
40 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
41 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
42 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
43 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
44 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
45 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
46 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
47 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
48 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
49 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n']'
50 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
51 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
52 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
53 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
54 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
55 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
56 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
57 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
58 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
59 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
60 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
61 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
62 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n```']'
63 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n```']'
64 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
65 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
66 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
67 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
68 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
69 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
70 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
71 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
72 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
73 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
74 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
75 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
76 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
77 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
78 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
79 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
80 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
81 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
82 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
83 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
84 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
85 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
86 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
87 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
88 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
89 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
90 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
91 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
92 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
93 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
94 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
95 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
96 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n```']'
97 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
98 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
99 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
100 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
101 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
102 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
103 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
104 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
105 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
106 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
107 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
108 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
109 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
110 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
111 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
112 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
113 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
114 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
115 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
116 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
117 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
118 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
119 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
120 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
121 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
122 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
123 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
124 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
125 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
126 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
127 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
128 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
129 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
130 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
131 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
132 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
133 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
134 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
135 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
136 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
137 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
138 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
139 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
140 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
141 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
142 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
143 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
144 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
145 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
146 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
147 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
148 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
149 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
150 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
151 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
152 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
153 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
154 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n```']'
155 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n```']'
156 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
157 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
158 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
159 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
160 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
161 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
162 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
163 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
164 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
165 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
166 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
167 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
168 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
169 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
170 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
171 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
172 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
173 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
174 | expected:'cat_2' | got='cat_1 | full: [' cat_1\n```']'
175 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
176 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
177 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
178 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
179 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
180 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
181 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
182 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
183 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
184 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
185 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
186 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
187 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n']'
188 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
189 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
190 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
191 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
192 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
193 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
194 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
195 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
196 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
197 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
198 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
199 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
---------------------------------------
Summary for Split 'test_seen_obj_seen_act':
 results: {'correct': {'cat_1': 6, 'cat_2': 99}, 'incorrect': {'cat_1': 94, 'cat_2': 1}}
 accuracy: 52.50%

---------------------------------------
  test split name: test_seen_obj_unseen_act
---------------------------------------

0 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
1 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
2 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
3 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
4 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
5 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
6 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
7 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n']'
8 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
9 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
10 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
11 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n']'
12 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
13 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
14 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
15 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
16 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
17 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
18 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n```']'
19 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n```']'
20 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
21 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
22 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
23 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n']'
24 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
25 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n```']'
26 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
27 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
28 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
29 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
30 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
31 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
32 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
33 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
34 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
35 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
36 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
37 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
38 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
39 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
40 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
41 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
42 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
43 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
44 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
45 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
46 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
47 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
48 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
49 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
50 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
51 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
52 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
53 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n```']'
54 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n```']'
55 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
56 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
57 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
58 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
59 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
60 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
61 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
62 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
63 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
64 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
65 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
66 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
67 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
68 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
69 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
70 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
71 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
72 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
73 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n']'
74 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
75 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
76 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
77 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
78 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
79 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
80 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n```']'
81 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
82 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
83 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
84 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
85 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
86 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
87 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
88 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
89 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
90 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
91 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
92 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
93 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
94 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
95 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
96 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
97 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
98 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
99 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
100 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
101 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
102 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
103 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
104 | expected:'cat_2' | got='cat_1 | full: [' cat_1\n']'
105 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
106 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
107 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n']'
108 | expected:'cat_2' | got='cat_1 | full: [' cat_1\n']'
109 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
110 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
111 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
112 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
113 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
114 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
115 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n']'
116 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
117 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
118 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
119 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
120 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
121 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
122 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
123 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
124 | expected:'cat_2' | got='cat_2 | full: [' cat_2\nThe test image shows people in a swan-shaped paddle boat on a lake, which is similar to the cat_2 images showing people in various small boats on the water.\n']'
125 | expected:'cat_1' | got='cat_2 | full: [' cat_2\nThe test image shows a sailboat on a calm body of water, which is similar to the cat_2 images that depict people in small boats or kayaks on water.\n']'
126 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
127 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
128 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
129 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
130 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
131 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n']'
132 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
133 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
134 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
135 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
136 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
137 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
138 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
139 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n```']'
140 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
141 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
142 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
143 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
144 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
145 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
146 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
147 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n']'
148 | expected:'cat_2' | got='cat_1 | full: [' cat_1\n```']'
149 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
150 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
151 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
152 | expected:'cat_2' | got='cat_1 | full: [' cat_1\n```']'
153 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
154 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
155 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n']'
156 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
157 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
158 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
159 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
160 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
161 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
162 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
163 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
164 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
165 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
166 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
167 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
168 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
169 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
170 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
171 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
172 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
173 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
174 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
175 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
176 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
177 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
178 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
179 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
180 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
181 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
182 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
183 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
184 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
185 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
186 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
187 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
188 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
189 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
190 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
191 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
192 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
193 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
194 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
195 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
196 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
197 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
198 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
199 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
---------------------------------------
Summary for Split 'test_seen_obj_unseen_act':
 results: {'correct': {'cat_1': 14, 'cat_2': 96}, 'incorrect': {'cat_1': 86, 'cat_2': 4}}
 accuracy: 55.00%

---------------------------------------
  test split name: test_unseen_obj_seen_act
---------------------------------------

0 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
1 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
2 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
3 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
4 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
5 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
6 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
7 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
8 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
9 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
10 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
11 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
12 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
13 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
14 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
15 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
16 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
17 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
18 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
19 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
20 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
21 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
22 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
23 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
24 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
25 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
26 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
27 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
28 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
29 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
30 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
31 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
32 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
33 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
34 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
35 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
36 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
37 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
38 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
39 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
40 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
41 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
42 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
43 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
44 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
45 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
46 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
47 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
48 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
49 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
50 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
51 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
52 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n```']'
53 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
54 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
55 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
56 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
57 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
58 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
59 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
60 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
61 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
62 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
63 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
64 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
65 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
66 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
67 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
68 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
69 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
70 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
71 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
72 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
73 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
74 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
75 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
76 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
77 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
78 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
79 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
80 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
81 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
82 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
83 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
84 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
85 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
86 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
87 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
88 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
89 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
90 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
91 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
92 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
93 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
94 | expected:'cat_2' | got='cat_1 | full: [' cat_1\n```']'
95 | expected:'cat_1' | got='cat_1 | full: [' cat_1\nThe test image shows a red sports car parked on the street, which does not fit the theme of the cat_2 images that all feature people sitting on benches in various locations. Therefore, the test image should be categorized as cat_1.\n']'
96 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
97 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
98 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
99 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
100 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
101 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
102 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
103 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
104 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
105 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
106 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
107 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
108 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n```']'
109 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
110 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
111 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
112 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
113 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
114 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
115 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
116 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
117 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
118 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
119 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
120 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
121 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
122 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
123 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
124 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
125 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
126 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
127 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
128 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
129 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
130 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
131 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
132 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
133 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
134 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
135 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
136 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
137 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
138 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
139 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
140 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
141 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
142 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
143 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
144 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
145 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
146 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
147 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
148 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
149 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
150 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
151 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
152 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
153 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
154 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
155 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
156 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
157 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
158 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
159 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
160 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
161 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
162 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
163 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
164 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
165 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
166 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
167 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
168 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
169 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
170 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
171 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
172 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
173 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
174 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
175 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n```']'
176 | expected:'cat_2' | got='cat_1 | full: [' cat_1\n```']'
177 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
178 | expected:'cat_2' | got='cat_1 | full: [' cat_1\n```']'
179 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
180 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
181 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
182 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
183 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
184 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
185 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
186 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
187 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
188 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
189 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
190 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
191 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
192 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
193 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
194 | expected:'cat_2' | got='cat_2 | full: [' cat_2\nThe test image shows a person giving a speech at a podium in a formal setting, which is similar to the cat_2 images showing people in formal settings or events.\n']'
195 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
196 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
197 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
198 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
199 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
---------------------------------------
Summary for Split 'test_unseen_obj_seen_act':
 results: {'correct': {'cat_1': 5, 'cat_2': 97}, 'incorrect': {'cat_1': 95, 'cat_2': 3}}
 accuracy: 51.00%

---------------------------------------
  test split name: test_unseen_obj_unseen_act
---------------------------------------

0 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
1 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
2 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
3 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
4 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
5 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
6 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
7 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
8 | expected:'cat_2' | got='cat_1 | full: [' cat_1\n```']'
9 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
10 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
11 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
12 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
13 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
14 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
15 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
16 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
17 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
18 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
19 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
20 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
21 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
22 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
23 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
24 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
25 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
26 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
27 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
28 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
29 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
30 | expected:'cat_2' | got='cat_1 | full: [' cat_1\n```']'
31 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
32 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
33 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
34 | expected:'cat_2' | got='cat_1 | full: [' cat_1\n```']'
35 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
36 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
37 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
38 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
39 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
40 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
41 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
42 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
43 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
44 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
45 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
46 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
47 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
48 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
49 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
50 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
51 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
52 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
53 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
54 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
55 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
56 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
57 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
58 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
59 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
60 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
61 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
62 | expected:'cat_2' | got='cat_1 | full: [' cat_1\n```']'
63 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
64 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
65 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
66 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
67 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
68 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
69 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
70 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
71 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
72 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
73 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
74 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
75 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
76 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
77 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
78 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
79 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
80 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
81 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
82 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
83 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
84 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
85 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
86 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
87 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
88 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
89 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
90 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
91 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
92 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
93 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
94 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
95 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
96 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
97 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
98 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
99 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
100 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
101 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
102 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
103 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
104 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
105 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
106 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
107 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
108 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
109 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
110 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
111 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
112 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
113 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
114 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
115 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
116 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
117 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
118 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
119 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
120 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
121 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
122 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
123 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
124 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
125 | expected:'cat_1' | got='cat_1 | full: [' cat_1\nThe test image shows a woman and a child petting a sheep, which does not match the common theme of shearing sheep in the cat_2 images. Therefore, it belongs to cat_1.\n']'
126 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
127 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
128 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
129 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
130 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
131 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
132 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
133 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
134 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
135 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
136 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
137 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
138 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
139 | expected:'cat_1' | got='cat_1 | full: [' cat_1\nThe test image shows a man holding a sandwich, which does not fit the theme of picking or holding apples seen in the cat_2 images. Therefore, it belongs to cat_1.\n']'
140 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
141 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
142 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
143 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
144 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
145 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
146 | expected:'cat_2' | got='cat_1 | full: [' cat_1\n```']'
147 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
148 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
149 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
150 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
151 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
152 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
153 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
154 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
155 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
156 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
157 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
158 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
159 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
160 | expected:'cat_2' | got='cat_1 | full: [' cat_1\n```']'
161 | expected:'cat_1' | got='cat_1 | full: [' cat_1\n```']'
162 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
163 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
164 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
165 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
166 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
167 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
168 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
169 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
170 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
171 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
172 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
173 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
174 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
175 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
176 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
177 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
178 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
179 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
180 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
181 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
182 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
183 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
184 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
185 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
186 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
187 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
188 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
189 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
190 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
191 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
192 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
193 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
194 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
195 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
196 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
197 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
198 | expected:'cat_2' | got='cat_2 | full: [' cat_2\n']'
199 | expected:'cat_1' | got='cat_2 | full: [' cat_2\n']'
---------------------------------------
Summary for Split 'test_unseen_obj_unseen_act':
 results: {'correct': {'cat_1': 16, 'cat_2': 94}, 'incorrect': {'cat_1': 84, 'cat_2': 6}}
 accuracy: 55.00%

---------------------------------------
