--- eval_baseline_on_HOI_ VQA Evaluation ---
  Model: phi
  Total Samples: 8000

---------------------------------------
0 | expected:'C' | got:'C' | concept: 'greet person'
1 | expected:'A' | got:'A' | concept: 'greet person'
2 | expected:'C' | got:'C' | concept: 'greet person'
3 | expected:'D' | got:'C' | concept: 'greet person'
4 | expected:'A' | got:'D' | concept: 'hug person'
5 | expected:'B' | got:'B' | concept: 'hug person'
6 | expected:'B' | got:'B' | concept: 'hug person'
7 | expected:'A' | got:'A' | concept: 'hug person'
8 | expected:'B' | got:'B' | concept: 'kiss person'
9 | expected:'A' | got:'A' | concept: 'kiss person'
10 | expected:'A' | got:'A' | concept: 'kiss person'
11 | expected:'C' | got:'C' | concept: 'kiss person'
12 | expected:'C' | got:'C' | concept: 'kiss horse'
13 | expected:'B' | got:'B' | concept: 'kiss horse'
14 | expected:'D' | got:'D' | concept: 'kiss horse'
15 | expected:'D' | got:'D' | concept: 'kiss horse'
16 | expected:'C' | got:'C' | concept: 'board train'
17 | expected:'C' | got:'C' | concept: 'board train'
18 | expected:'B' | got:'B' | concept: 'board train'
19 | expected:'C' | got:'C' | concept: 'board train'
20 | expected:'A' | got:'A' | concept: 'sit_inside bus'
21 | expected:'B' | got:'B' | concept: 'sit_inside bus'
22 | expected:'B' | got:'A' | concept: 'sit_inside bus'
23 | expected:'C' | got:'C' | concept: 'sit_inside bus'
24 | expected:'A' | got:'A' | concept: 'drive train'
25 | expected:'C' | got:'C' | concept: 'drive train'
26 | expected:'B' | got:'B' | concept: 'drive train'
27 | expected:'C' | got:'A' | concept: 'drive train'
28 | expected:'A' | got:'A' | concept: 'board bus'
29 | expected:'D' | got:'D' | concept: 'board bus'
30 | expected:'B' | got:'B' | concept: 'board bus'
31 | expected:'B' | got:'B' | concept: 'board bus'
32 | expected:'A' | got:'A' | concept: 'wash apple'
33 | expected:'B' | got:'B' | concept: 'wash apple'
34 | expected:'B' | got:'A' | concept: 'wash apple'
35 | expected:'A' | got:'A' | concept: 'wash apple'
36 | expected:'D' | got:'A' | concept: 'wash car'
37 | expected:'B' | got:'A' | concept: 'wash car'
38 | expected:'B' | got:'A' | concept: 'wash car'
39 | expected:'D' | got:'D' | concept: 'wash car'
40 | expected:'C' | got:'A' | concept: 'wash dog'
41 | expected:'B' | got:'A' | concept: 'wash dog'
42 | expected:'B' | got:'A' | concept: 'wash dog'
43 | expected:'A' | got:'A' | concept: 'wash dog'
44 | expected:'A' | got:'A' | concept: 'wash motorcycle'
45 | expected:'B' | got:'A' | concept: 'wash motorcycle'
46 | expected:'D' | got:'A' | concept: 'wash motorcycle'
47 | expected:'C' | got:'A' | concept: 'wash motorcycle'
48 | expected:'A' | got:'B' | concept: 'blow cake'
49 | expected:'C' | got:'A' | concept: 'blow cake'
50 | expected:'A' | got:'A' | concept: 'blow cake'
51 | expected:'D' | got:'C' | concept: 'blow cake'
52 | expected:'A' | got:'A' | concept: 'eat cake'
53 | expected:'B' | got:'B' | concept: 'eat cake'
54 | expected:'A' | got:'A' | concept: 'eat cake'
55 | expected:'B' | got:'B' | concept: 'eat cake'
56 | expected:'A' | got:'C' | concept: 'hold cake'
57 | expected:'A' | got:'C' | concept: 'hold cake'
58 | expected:'C' | got:'C' | concept: 'hold cake'
59 | expected:'B' | got:'B' | concept: 'hold cake'
60 | expected:'D' | got:'D' | concept: 'cut cake'
61 | expected:'D' | got:'D' | concept: 'cut cake'
62 | expected:'D' | got:'D' | concept: 'cut cake'
63 | expected:'A' | got:'A' | concept: 'cut cake'
64 | expected:'C' | got:'C' | concept: 'read book'
65 | expected:'A' | got:'A' | concept: 'read book'
66 | expected:'B' | got:'B' | concept: 'read book'
67 | expected:'D' | got:'A' | concept: 'read book'
68 | expected:'B' | got:'B' | concept: 'read laptop'
69 | expected:'B' | got:'C' | concept: 'read laptop'
70 | expected:'B' | got:'A' | concept: 'read laptop'
71 | expected:'D' | got:'B' | concept: 'read laptop'
72 | expected:'A' | got:'A' | concept: 'repair laptop'
73 | expected:'A' | got:'A' | concept: 'repair laptop'
74 | expected:'A' | got:'A' | concept: 'repair laptop'
75 | expected:'D' | got:'A' | concept: 'repair laptop'
76 | expected:'A' | got:'A' | concept: 'type_on laptop'
77 | expected:'C' | got:'C' | concept: 'type_on laptop'
78 | expected:'B' | got:'B' | concept: 'type_on laptop'
79 | expected:'B' | got:'B' | concept: 'type_on laptop'
80 | expected:'A' | got:'A' | concept: 'ride snowboard'
81 | expected:'B' | got:'B' | concept: 'ride snowboard'
82 | expected:'B' | got:'B' | concept: 'ride snowboard'
83 | expected:'A' | got:'A' | concept: 'ride snowboard'
84 | expected:'D' | got:'A' | concept: 'carry suitcase'
85 | expected:'A' | got:'A' | concept: 'carry suitcase'
86 | expected:'A' | got:'A' | concept: 'carry suitcase'
87 | expected:'D' | got:'A' | concept: 'carry suitcase'
88 | expected:'D' | got:'B' | concept: 'carry snowboard'
89 | expected:'A' | got:'A' | concept: 'carry snowboard'
90 | expected:'D' | got:'D' | concept: 'carry snowboard'
91 | expected:'D' | got:'D' | concept: 'carry snowboard'
92 | expected:'D' | got:'C' | concept: 'grind snowboard'
93 | expected:'D' | got:'D' | concept: 'grind snowboard'
94 | expected:'B' | got:'B' | concept: 'grind snowboard'
95 | expected:'B' | got:'A' | concept: 'grind snowboard'
96 | expected:'D' | got:'D' | concept: 'feed horse'
97 | expected:'D' | got:'D' | concept: 'feed horse'
98 | expected:'B' | got:'B' | concept: 'feed horse'
99 | expected:'C' | got:'C' | concept: 'feed horse'
100 | expected:'A' | got:'A' | concept: 'walk horse'
101 | expected:'A' | got:'A' | concept: 'walk horse'
102 | expected:'B' | got:'C' | concept: 'walk horse'
103 | expected:'A' | got:'A' | concept: 'walk horse'
104 | expected:'A' | got:'A' | concept: 'jump horse'
105 | expected:'B' | got:'B' | concept: 'jump horse'
106 | expected:'A' | got:'A' | concept: 'jump horse'
107 | expected:'A' | got:'A' | concept: 'jump horse'
108 | expected:'A' | got:'A' | concept: 'feed sheep'
109 | expected:'A' | got:'A' | concept: 'feed sheep'
110 | expected:'A' | got:'A' | concept: 'feed sheep'
111 | expected:'A' | got:'A' | concept: 'feed sheep'
112 | expected:'D' | got:'A' | concept: 'hold laptop'
113 | expected:'D' | got:'D' | concept: 'hold laptop'
114 | expected:'A' | got:'A' | concept: 'hold laptop'
115 | expected:'A' | got:'A' | concept: 'hold laptop'
116 | expected:'D' | got:'A' | concept: 'hold umbrella'
117 | expected:'C' | got:'C' | concept: 'hold umbrella'
118 | expected:'D' | got:'A' | concept: 'hold umbrella'
119 | expected:'B' | got:'B' | concept: 'hold umbrella'
120 | expected:'B' | got:'B' | concept: 'hold donut'
121 | expected:'C' | got:'C' | concept: 'hold donut'
122 | expected:'C' | got:'C' | concept: 'hold donut'
123 | expected:'C' | got:'C' | concept: 'hold donut'
124 | expected:'D' | got:'A' | concept: 'type_on laptop'
125 | expected:'C' | got:'C' | concept: 'type_on laptop'
126 | expected:'A' | got:'A' | concept: 'type_on laptop'
127 | expected:'A' | got:'A' | concept: 'type_on laptop'
128 | expected:'C' | got:'C' | concept: 'hold kite'
129 | expected:'D' | got:'D' | concept: 'hold kite'
130 | expected:'A' | got:'A' | concept: 'hold kite'
131 | expected:'C' | got:'C' | concept: 'hold kite'
132 | expected:'B' | got:'B' | concept: 'hold keyboard'
133 | expected:'D' | got:'D' | concept: 'hold keyboard'
134 | expected:'C' | got:'C' | concept: 'hold keyboard'
135 | expected:'A' | got:'A' | concept: 'hold keyboard'
136 | expected:'A' | got:'A' | concept: 'hold laptop'
137 | expected:'D' | got:'D' | concept: 'hold laptop'
138 | expected:'C' | got:'C' | concept: 'hold laptop'
139 | expected:'B' | got:'A' | concept: 'hold laptop'
140 | expected:'B' | got:'B' | concept: 'hold hot_dog'
141 | expected:'B' | got:'B' | concept: 'hold hot_dog'
142 | expected:'C' | got:'C' | concept: 'hold hot_dog'
143 | expected:'A' | got:'A' | concept: 'hold hot_dog'
144 | expected:'A' | got:'A' | concept: 'hold knife'
145 | expected:'C' | got:'C' | concept: 'hold knife'
146 | expected:'C' | got:'C' | concept: 'hold knife'
147 | expected:'A' | got:'A' | concept: 'hold knife'
148 | expected:'D' | got:'D' | concept: 'hold frisbee'
149 | expected:'C' | got:'C' | concept: 'hold frisbee'
150 | expected:'C' | got:'C' | concept: 'hold frisbee'
151 | expected:'D' | got:'D' | concept: 'hold frisbee'
152 | expected:'C' | got:'C' | concept: 'hold dog'
153 | expected:'B' | got:'B' | concept: 'hold dog'
154 | expected:'B' | got:'B' | concept: 'hold dog'
155 | expected:'A' | got:'A' | concept: 'hold dog'
156 | expected:'D' | got:'D' | concept: 'hold banana'
157 | expected:'C' | got:'C' | concept: 'hold banana'
158 | expected:'D' | got:'A' | concept: 'hold banana'
159 | expected:'A' | got:'A' | concept: 'hold banana'
160 | expected:'D' | got:'D' | concept: 'sit_on train'
161 | expected:'A' | got:'A' | concept: 'sit_on train'
162 | expected:'D' | got:'D' | concept: 'sit_on train'
163 | expected:'A' | got:'A' | concept: 'sit_on train'
164 | expected:'B' | got:'B' | concept: 'drive train'
165 | expected:'D' | got:'D' | concept: 'drive train'
166 | expected:'C' | got:'C' | concept: 'drive train'
167 | expected:'A' | got:'A' | concept: 'drive train'
168 | expected:'A' | got:'A' | concept: 'drive car'
169 | expected:'D' | got:'D' | concept: 'drive car'
170 | expected:'A' | got:'A' | concept: 'drive car'
171 | expected:'B' | got:'B' | concept: 'drive car'
172 | expected:'B' | got:'B' | concept: 'drive boat'
173 | expected:'B' | got:'B' | concept: 'drive boat'
174 | expected:'D' | got:'D' | concept: 'drive boat'
175 | expected:'D' | got:'D' | concept: 'drive boat'
176 | expected:'C' | got:'C' | concept: 'row boat'
177 | expected:'A' | got:'A' | concept: 'row boat'
178 | expected:'C' | got:'C' | concept: 'row boat'
179 | expected:'A' | got:'D' | concept: 'row boat'
180 | expected:'D' | got:'D' | concept: 'ride boat'
181 | expected:'C' | got:'C' | concept: 'ride boat'
182 | expected:'B' | got:'B' | concept: 'ride boat'
183 | expected:'C' | got:'D' | concept: 'ride boat'
184 | expected:'C' | got:'C' | concept: 'sail boat'
185 | expected:'B' | got:'B' | concept: 'sail boat'
186 | expected:'B' | got:'B' | concept: 'sail boat'
187 | expected:'B' | got:'B' | concept: 'sail boat'
188 | expected:'A' | got:'A' | concept: 'stand_on boat'
189 | expected:'A' | got:'A' | concept: 'stand_on boat'
190 | expected:'A' | got:'B' | concept: 'stand_on boat'
191 | expected:'D' | got:'B' | concept: 'stand_on boat'
192 | expected:'A' | got:'A' | concept: 'carry keyboard'
193 | expected:'A' | got:'A' | concept: 'carry keyboard'
194 | expected:'A' | got:'C' | concept: 'carry keyboard'
195 | expected:'D' | got:'A' | concept: 'carry keyboard'
196 | expected:'A' | got:'A' | concept: 'carry surfboard'
197 | expected:'A' | got:'A' | concept: 'carry surfboard'
198 | expected:'C' | got:'C' | concept: 'carry surfboard'
199 | expected:'B' | got:'B' | concept: 'carry surfboard'
200 | expected:'C' | got:'C' | concept: 'type_on keyboard'
201 | expected:'B' | got:'B' | concept: 'type_on keyboard'
202 | expected:'A' | got:'A' | concept: 'type_on keyboard'
203 | expected:'C' | got:'C' | concept: 'type_on keyboard'
204 | expected:'D' | got:'A' | concept: 'clean keyboard'
205 | expected:'B' | got:'B' | concept: 'clean keyboard'
206 | expected:'B' | got:'B' | concept: 'clean keyboard'
207 | expected:'A' | got:'A' | concept: 'clean keyboard'
208 | expected:'A' | got:'C' | concept: 'hold scissors'
209 | expected:'D' | got:'D' | concept: 'hold scissors'
210 | expected:'C' | got:'C' | concept: 'hold scissors'
211 | expected:'C' | got:'C' | concept: 'hold scissors'
212 | expected:'A' | got:'A' | concept: 'hold skateboard'
213 | expected:'D' | got:'D' | concept: 'hold skateboard'
214 | expected:'B' | got:'B' | concept: 'hold skateboard'
215 | expected:'A' | got:'A' | concept: 'hold skateboard'
216 | expected:'A' | got:'A' | concept: 'sit_on skateboard'
217 | expected:'B' | got:'D' | concept: 'sit_on skateboard'
218 | expected:'A' | got:'D' | concept: 'sit_on skateboard'
219 | expected:'A' | got:'A' | concept: 'sit_on skateboard'
220 | expected:'B' | got:'B' | concept: 'hold tennis_racket'
221 | expected:'A' | got:'A' | concept: 'hold tennis_racket'
222 | expected:'C' | got:'C' | concept: 'hold tennis_racket'
223 | expected:'D' | got:'D' | concept: 'hold tennis_racket'
224 | expected:'A' | got:'A' | concept: 'hold apple'
225 | expected:'B' | got:'B' | concept: 'hold apple'
226 | expected:'B' | got:'B' | concept: 'hold apple'
227 | expected:'A' | got:'A' | concept: 'hold apple'
228 | expected:'C' | got:'C' | concept: 'hold bird'
229 | expected:'C' | got:'C' | concept: 'hold bird'
230 | expected:'A' | got:'A' | concept: 'hold bird'
231 | expected:'C' | got:'C' | concept: 'hold bird'
232 | expected:'D' | got:'C' | concept: 'hold cake'
233 | expected:'B' | got:'A' | concept: 'hold cake'
234 | expected:'A' | got:'INVALID' | concept: 'hold cake'
235 | expected:'A' | got:'B' | concept: 'hold cake'
236 | expected:'B' | got:'B' | concept: 'hold sandwich'
237 | expected:'C' | got:'C' | concept: 'hold sandwich'
238 | expected:'C' | got:'C' | concept: 'hold sandwich'
239 | expected:'A' | got:'A' | concept: 'hold sandwich'
240 | expected:'A' | got:'A' | concept: 'pet dog'
241 | expected:'B' | got:'B' | concept: 'pet dog'
242 | expected:'D' | got:'D' | concept: 'pet dog'
243 | expected:'B' | got:'B' | concept: 'pet dog'
244 | expected:'B' | got:'B' | concept: 'pet horse'
245 | expected:'D' | got:'D' | concept: 'pet horse'
246 | expected:'B' | got:'B' | concept: 'pet horse'
247 | expected:'C' | got:'C' | concept: 'pet horse'
248 | expected:'B' | got:'A' | concept: 'wash dog'
249 | expected:'C' | got:'A' | concept: 'wash dog'
250 | expected:'C' | got:'C' | concept: 'wash dog'
251 | expected:'D' | got:'A' | concept: 'wash dog'
252 | expected:'B' | got:'B' | concept: 'walk dog'
253 | expected:'B' | got:'B' | concept: 'walk dog'
254 | expected:'D' | got:'D' | concept: 'walk dog'
255 | expected:'D' | got:'D' | concept: 'walk dog'
256 | expected:'C' | got:'D' | concept: 'hold oven'
257 | expected:'C' | got:'B' | concept: 'hold oven'
258 | expected:'D' | got:'C' | concept: 'hold oven'
259 | expected:'A' | got:'C' | concept: 'hold oven'
260 | expected:'A' | got:'D' | concept: 'clean oven'
261 | expected:'B' | got:'B' | concept: 'clean oven'
262 | expected:'A' | got:'C' | concept: 'clean oven'
263 | expected:'A' | got:'D' | concept: 'clean oven'
264 | expected:'A' | got:'C' | concept: 'open oven'
265 | expected:'C' | got:'B' | concept: 'open oven'
266 | expected:'C' | got:'C' | concept: 'open oven'
267 | expected:'D' | got:'D' | concept: 'open oven'
268 | expected:'C' | got:'C' | concept: 'operate oven'
269 | expected:'D' | got:'D' | concept: 'operate oven'
270 | expected:'A' | got:'C' | concept: 'operate oven'
271 | expected:'B' | got:'D' | concept: 'operate oven'
272 | expected:'A' | got:'A' | concept: 'load truck'
273 | expected:'D' | got:'D' | concept: 'load truck'
274 | expected:'A' | got:'A' | concept: 'load truck'
275 | expected:'A' | got:'A' | concept: 'load truck'
276 | expected:'C' | got:'C' | concept: 'repair bicycle'
277 | expected:'A' | got:'A' | concept: 'repair bicycle'
278 | expected:'B' | got:'B' | concept: 'repair bicycle'
279 | expected:'D' | got:'D' | concept: 'repair bicycle'
280 | expected:'A' | got:'D' | concept: 'sit_on truck'
281 | expected:'A' | got:'INVALID' | concept: 'sit_on truck'
282 | expected:'B' | got:'B' | concept: 'sit_on truck'
283 | expected:'A' | got:'D' | concept: 'sit_on truck'
284 | expected:'A' | got:'A' | concept: 'repair truck'
285 | expected:'B' | got:'B' | concept: 'repair truck'
286 | expected:'B' | got:'B' | concept: 'repair truck'
287 | expected:'D' | got:'D' | concept: 'repair truck'
288 | expected:'D' | got:'A' | concept: 'operate microwave'
289 | expected:'C' | got:'C' | concept: 'operate microwave'
290 | expected:'D' | got:'C' | concept: 'operate microwave'
291 | expected:'D' | got:'A' | concept: 'operate microwave'
292 | expected:'B' | got:'C' | concept: 'open microwave'
293 | expected:'C' | got:'C' | concept: 'open microwave'
294 | expected:'B' | got:'B' | concept: 'open microwave'
295 | expected:'A' | got:'A' | concept: 'open microwave'
296 | expected:'B' | got:'B' | concept: 'operate oven'
297 | expected:'D' | got:'A' | concept: 'operate oven'
298 | expected:'D' | got:'A' | concept: 'operate oven'
299 | expected:'C' | got:'C' | concept: 'operate oven'
300 | expected:'B' | got:'B' | concept: 'clean microwave'
301 | expected:'B' | got:'B' | concept: 'clean microwave'
302 | expected:'B' | got:'B' | concept: 'clean microwave'
303 | expected:'A' | got:'A' | concept: 'clean microwave'
304 | expected:'B' | got:'B' | concept: 'ride motorcycle'
305 | expected:'D' | got:'D' | concept: 'ride motorcycle'
306 | expected:'C' | got:'C' | concept: 'ride motorcycle'
307 | expected:'A' | got:'A' | concept: 'ride motorcycle'
308 | expected:'C' | got:'C' | concept: 'ride skateboard'
309 | expected:'C' | got:'C' | concept: 'ride skateboard'
310 | expected:'A' | got:'A' | concept: 'ride skateboard'
311 | expected:'D' | got:'D' | concept: 'ride skateboard'
312 | expected:'C' | got:'C' | concept: 'ride surfboard'
313 | expected:'C' | got:'C' | concept: 'ride surfboard'
314 | expected:'D' | got:'D' | concept: 'ride surfboard'
315 | expected:'C' | got:'C' | concept: 'ride surfboard'
316 | expected:'D' | got:'D' | concept: 'ride elephant'
317 | expected:'A' | got:'A' | concept: 'ride elephant'
318 | expected:'D' | got:'D' | concept: 'ride elephant'
319 | expected:'D' | got:'D' | concept: 'ride elephant'
320 | expected:'C' | got:'C' | concept: 'jump snowboard'
321 | expected:'A' | got:'A' | concept: 'jump snowboard'
322 | expected:'B' | got:'B' | concept: 'jump snowboard'
323 | expected:'A' | got:'A' | concept: 'jump snowboard'
324 | expected:'B' | got:'B' | concept: 'carry skateboard'
325 | expected:'B' | got:'B' | concept: 'carry skateboard'
326 | expected:'A' | got:'A' | concept: 'carry skateboard'
327 | expected:'B' | got:'B' | concept: 'carry skateboard'
328 | expected:'C' | got:'C' | concept: 'carry snowboard'
329 | expected:'D' | got:'A' | concept: 'carry snowboard'
330 | expected:'B' | got:'B' | concept: 'carry snowboard'
331 | expected:'D' | got:'D' | concept: 'carry snowboard'
332 | expected:'C' | got:'C' | concept: 'carry keyboard'
333 | expected:'D' | got:'A' | concept: 'carry keyboard'
334 | expected:'D' | got:'A' | concept: 'carry keyboard'
335 | expected:'B' | got:'B' | concept: 'carry keyboard'
336 | expected:'B' | got:'C' | concept: 'jump surfboard'
337 | expected:'C' | got:'C' | concept: 'jump surfboard'
338 | expected:'D' | got:'A' | concept: 'jump surfboard'
339 | expected:'B' | got:'C' | concept: 'jump surfboard'
340 | expected:'C' | got:'C' | concept: 'ride surfboard'
341 | expected:'C' | got:'C' | concept: 'ride surfboard'
342 | expected:'B' | got:'B' | concept: 'ride surfboard'
343 | expected:'B' | got:'B' | concept: 'ride surfboard'
344 | expected:'C' | got:'C' | concept: 'ride motorcycle'
345 | expected:'A' | got:'A' | concept: 'ride motorcycle'
346 | expected:'A' | got:'A' | concept: 'ride motorcycle'
347 | expected:'B' | got:'B' | concept: 'ride motorcycle'
348 | expected:'A' | got:'A' | concept: 'ride snowboard'
349 | expected:'A' | got:'A' | concept: 'ride snowboard'
350 | expected:'D' | got:'D' | concept: 'ride snowboard'
351 | expected:'B' | got:'B' | concept: 'ride snowboard'
352 | expected:'C' | got:'C' | concept: 'ride boat'
353 | expected:'D' | got:'B' | concept: 'ride boat'
354 | expected:'B' | got:'A' | concept: 'ride boat'
355 | expected:'C' | got:'C' | concept: 'ride boat'
356 | expected:'C' | got:'C' | concept: 'row boat'
357 | expected:'B' | got:'B' | concept: 'row boat'
358 | expected:'C' | got:'C' | concept: 'row boat'
359 | expected:'B' | got:'B' | concept: 'row boat'
360 | expected:'A' | got:'D' | concept: 'stand_on boat'
361 | expected:'C' | got:'D' | concept: 'stand_on boat'
362 | expected:'D' | got:'D' | concept: 'stand_on boat'
363 | expected:'B' | got:'D' | concept: 'stand_on boat'
364 | expected:'C' | got:'C' | concept: 'sail boat'
365 | expected:'A' | got:'C' | concept: 'sail boat'
366 | expected:'C' | got:'C' | concept: 'sail boat'
367 | expected:'A' | got:'A' | concept: 'sail boat'
368 | expected:'D' | got:'A' | concept: 'hold sports_ball'
369 | expected:'A' | got:'A' | concept: 'hold sports_ball'
370 | expected:'A' | got:'C' | concept: 'hold sports_ball'
371 | expected:'D' | got:'D' | concept: 'hold sports_ball'
372 | expected:'D' | got:'A' | concept: 'hold mouse'
373 | expected:'B' | got:'B' | concept: 'hold mouse'
374 | expected:'A' | got:'A' | concept: 'hold mouse'
375 | expected:'A' | got:'C' | concept: 'hold mouse'
376 | expected:'D' | got:'C' | concept: 'use mouse'
377 | expected:'A' | got:'A' | concept: 'use mouse'
378 | expected:'C' | got:'C' | concept: 'use mouse'
379 | expected:'C' | got:'C' | concept: 'use mouse'
380 | expected:'D' | got:'B' | concept: 'hold frisbee'
381 | expected:'A' | got:'A' | concept: 'hold frisbee'
382 | expected:'B' | got:'B' | concept: 'hold frisbee'
383 | expected:'D' | got:'B' | concept: 'hold frisbee'
384 | expected:'B' | got:'B' | concept: 'feed horse'
385 | expected:'B' | got:'B' | concept: 'feed horse'
386 | expected:'A' | got:'A' | concept: 'feed horse'
387 | expected:'C' | got:'C' | concept: 'feed horse'
388 | expected:'B' | got:'B' | concept: 'feed elephant'
389 | expected:'C' | got:'C' | concept: 'feed elephant'
390 | expected:'C' | got:'C' | concept: 'feed elephant'
391 | expected:'A' | got:'A' | concept: 'feed elephant'
392 | expected:'D' | got:'D' | concept: 'feed sheep'
393 | expected:'D' | got:'D' | concept: 'feed sheep'
394 | expected:'A' | got:'A' | concept: 'feed sheep'
395 | expected:'A' | got:'A' | concept: 'feed sheep'
396 | expected:'C' | got:'A' | concept: 'feed giraffe'
397 | expected:'B' | got:'B' | concept: 'feed giraffe'
398 | expected:'C' | got:'A' | concept: 'feed giraffe'
399 | expected:'B' | got:'B' | concept: 'feed giraffe'
400 | expected:'B' | got:'B' | concept: 'clean keyboard'
401 | expected:'D' | got:'A' | concept: 'clean keyboard'
402 | expected:'C' | got:'C' | concept: 'clean keyboard'
403 | expected:'B' | got:'B' | concept: 'clean keyboard'
404 | expected:'D' | got:'A' | concept: 'operate oven'
405 | expected:'D' | got:'D' | concept: 'operate oven'
406 | expected:'A' | got:'A' | concept: 'operate oven'
407 | expected:'C' | got:'C' | concept: 'operate oven'
408 | expected:'A' | got:'B' | concept: 'clean microwave'
409 | expected:'D' | got:'A' | concept: 'clean microwave'
410 | expected:'B' | got:'B' | concept: 'clean microwave'
411 | expected:'C' | got:'C' | concept: 'clean microwave'
412 | expected:'D' | got:'A' | concept: 'clean oven'
413 | expected:'C' | got:'C' | concept: 'clean oven'
414 | expected:'B' | got:'B' | concept: 'clean oven'
415 | expected:'B' | got:'B' | concept: 'clean oven'
416 | expected:'C' | got:'C' | concept: 'wash apple'
417 | expected:'A' | got:'A' | concept: 'wash apple'
418 | expected:'B' | got:'B' | concept: 'wash apple'
419 | expected:'A' | got:'A' | concept: 'wash apple'
420 | expected:'D' | got:'D' | concept: 'peel_or_cut apple'
421 | expected:'C' | got:'C' | concept: 'peel_or_cut apple'
422 | expected:'A' | got:'A' | concept: 'peel_or_cut apple'
423 | expected:'A' | got:'A' | concept: 'peel_or_cut apple'
424 | expected:'A' | got:'A' | concept: 'smell apple'
425 | expected:'D' | got:'D' | concept: 'smell apple'
426 | expected:'D' | got:'D' | concept: 'smell apple'
427 | expected:'D' | got:'D' | concept: 'smell apple'
428 | expected:'B' | got:'B' | concept: 'eat apple'
429 | expected:'C' | got:'C' | concept: 'eat apple'
430 | expected:'D' | got:'D' | concept: 'eat apple'
431 | expected:'A' | got:'A' | concept: 'eat apple'
432 | expected:'D' | got:'C' | concept: 'throw frisbee'
433 | expected:'A' | got:'D' | concept: 'throw frisbee'
434 | expected:'A' | got:'A' | concept: 'throw frisbee'
435 | expected:'B' | got:'B' | concept: 'throw frisbee'
436 | expected:'D' | got:'C' | concept: 'hold frisbee'
437 | expected:'C' | got:'C' | concept: 'hold frisbee'
438 | expected:'C' | got:'B' | concept: 'hold frisbee'
439 | expected:'C' | got:'C' | concept: 'hold frisbee'
440 | expected:'D' | got:'D' | concept: 'catch frisbee'
441 | expected:'A' | got:'D' | concept: 'catch frisbee'
442 | expected:'A' | got:'A' | concept: 'catch frisbee'
443 | expected:'B' | got:'D' | concept: 'catch frisbee'
444 | expected:'D' | got:'D' | concept: 'hold sheep'
445 | expected:'D' | got:'D' | concept: 'hold sheep'
446 | expected:'B' | got:'B' | concept: 'hold sheep'
447 | expected:'B' | got:'B' | concept: 'hold sheep'
448 | expected:'C' | got:'A' | concept: 'dribble sports_ball'
449 | expected:'C' | got:'B' | concept: 'dribble sports_ball'
450 | expected:'D' | got:'D' | concept: 'dribble sports_ball'
451 | expected:'D' | got:'D' | concept: 'dribble sports_ball'
452 | expected:'A' | got:'A' | concept: 'kick sports_ball'
453 | expected:'B' | got:'B' | concept: 'kick sports_ball'
454 | expected:'C' | got:'C' | concept: 'kick sports_ball'
455 | expected:'A' | got:'A' | concept: 'kick sports_ball'
456 | expected:'C' | got:'C' | concept: 'serve sports_ball'
457 | expected:'D' | got:'D' | concept: 'serve sports_ball'
458 | expected:'B' | got:'B' | concept: 'serve sports_ball'
459 | expected:'A' | got:'A' | concept: 'serve sports_ball'
460 | expected:'D' | got:'D' | concept: 'block sports_ball'
461 | expected:'C' | got:'C' | concept: 'block sports_ball'
462 | expected:'D' | got:'D' | concept: 'block sports_ball'
463 | expected:'D' | got:'B' | concept: 'block sports_ball'
464 | expected:'B' | got:'B' | concept: 'hold vase'
465 | expected:'D' | got:'A' | concept: 'hold vase'
466 | expected:'A' | got:'A' | concept: 'hold vase'
467 | expected:'D' | got:'D' | concept: 'hold vase'
468 | expected:'B' | got:'C' | concept: 'hold carrot'
469 | expected:'B' | got:'INVALID' | concept: 'hold carrot'
470 | expected:'B' | got:'B' | concept: 'hold carrot'
471 | expected:'D' | got:'A' | concept: 'hold carrot'
472 | expected:'B' | got:'B' | concept: 'hold hot_dog'
473 | expected:'C' | got:'C' | concept: 'hold hot_dog'
474 | expected:'A' | got:'A' | concept: 'hold hot_dog'
475 | expected:'A' | got:'A' | concept: 'hold hot_dog'
476 | expected:'C' | got:'C' | concept: 'hold cell_phone'
477 | expected:'A' | got:'A' | concept: 'hold cell_phone'
478 | expected:'B' | got:'B' | concept: 'hold cell_phone'
479 | expected:'C' | got:'C' | concept: 'hold cell_phone'
480 | expected:'D' | got:'A' | concept: 'wash dog'
481 | expected:'C' | got:'A' | concept: 'wash dog'
482 | expected:'A' | got:'A' | concept: 'wash dog'
483 | expected:'A' | got:'A' | concept: 'wash dog'
484 | expected:'D' | got:'A' | concept: 'wash motorcycle'
485 | expected:'B' | got:'A' | concept: 'wash motorcycle'
486 | expected:'C' | got:'A' | concept: 'wash motorcycle'
487 | expected:'D' | got:'A' | concept: 'wash motorcycle'
488 | expected:'D' | got:'A' | concept: 'wash car'
489 | expected:'B' | got:'A' | concept: 'wash car'
490 | expected:'B' | got:'A' | concept: 'wash car'
491 | expected:'D' | got:'A' | concept: 'wash car'
492 | expected:'D' | got:'A' | concept: 'wash apple'
493 | expected:'D' | got:'A' | concept: 'wash apple'
494 | expected:'D' | got:'A' | concept: 'wash apple'
495 | expected:'C' | got:'A' | concept: 'wash apple'
496 | expected:'A' | got:'A' | concept: 'eat orange'
497 | expected:'C' | got:'C' | concept: 'eat orange'
498 | expected:'D' | got:'D' | concept: 'eat orange'
499 | expected:'D' | got:'D' | concept: 'eat orange'
500 | expected:'A' | got:'C' | concept: 'hold orange'
501 | expected:'A' | got:'B' | concept: 'hold orange'
502 | expected:'C' | got:'C' | concept: 'hold orange'
503 | expected:'D' | got:'A' | concept: 'hold orange'
504 | expected:'D' | got:'B' | concept: 'squeeze orange'
505 | expected:'B' | got:'B' | concept: 'squeeze orange'
506 | expected:'C' | got:'C' | concept: 'squeeze orange'
507 | expected:'C' | got:'D' | concept: 'squeeze orange'
508 | expected:'A' | got:'D' | concept: 'peel orange'
509 | expected:'B' | got:'D' | concept: 'peel orange'
510 | expected:'A' | got:'D' | concept: 'peel orange'
511 | expected:'B' | got:'D' | concept: 'peel orange'
512 | expected:'D' | got:'B' | concept: 'eat apple'
513 | expected:'D' | got:'D' | concept: 'eat apple'
514 | expected:'B' | got:'C' | concept: 'eat apple'
515 | expected:'A' | got:'C' | concept: 'eat apple'
516 | expected:'C' | got:'A' | concept: 'wash apple'
517 | expected:'D' | got:'D' | concept: 'wash apple'
518 | expected:'A' | got:'A' | concept: 'wash apple'
519 | expected:'B' | got:'A' | concept: 'wash apple'
520 | expected:'B' | got:'B' | concept: 'hold_and_about_to_eat apple'
521 | expected:'C' | got:'C' | concept: 'hold_and_about_to_eat apple'
522 | expected:'B' | got:'D' | concept: 'hold_and_about_to_eat apple'
523 | expected:'B' | got:'B' | concept: 'hold_and_about_to_eat apple'
524 | expected:'D' | got:'D' | concept: 'peel_or_cut apple'
525 | expected:'B' | got:'B' | concept: 'peel_or_cut apple'
526 | expected:'C' | got:'C' | concept: 'peel_or_cut apple'
527 | expected:'D' | got:'D' | concept: 'peel_or_cut apple'
528 | expected:'A' | got:'C' | concept: 'inspect bicycle'
529 | expected:'D' | got:'D' | concept: 'inspect bicycle'
530 | expected:'C' | got:'C' | concept: 'inspect bicycle'
531 | expected:'D' | got:'B' | concept: 'inspect bicycle'
532 | expected:'B' | got:'B' | concept: 'repair bicycle'
533 | expected:'C' | got:'C' | concept: 'repair bicycle'
534 | expected:'B' | got:'B' | concept: 'repair bicycle'
535 | expected:'C' | got:'C' | concept: 'repair bicycle'
536 | expected:'B' | got:'B' | concept: 'jump snowboard'
537 | expected:'D' | got:'D' | concept: 'jump snowboard'
538 | expected:'D' | got:'D' | concept: 'jump snowboard'
539 | expected:'A' | got:'A' | concept: 'jump snowboard'
540 | expected:'B' | got:'B' | concept: 'jump bicycle'
541 | expected:'D' | got:'D' | concept: 'jump bicycle'
542 | expected:'D' | got:'D' | concept: 'jump bicycle'
543 | expected:'C' | got:'C' | concept: 'jump bicycle'
544 | expected:'A' | got:'A' | concept: 'cut_with knife'
545 | expected:'C' | got:'C' | concept: 'cut_with knife'
546 | expected:'B' | got:'B' | concept: 'cut_with knife'
547 | expected:'D' | got:'D' | concept: 'cut_with knife'
548 | expected:'D' | got:'C' | concept: 'stick knife'
549 | expected:'A' | got:'D' | concept: 'stick knife'
550 | expected:'A' | got:'D' | concept: 'stick knife'
551 | expected:'A' | got:'C' | concept: 'stick knife'
552 | expected:'B' | got:'B' | concept: 'lick knife'
553 | expected:'C' | got:'C' | concept: 'lick knife'
554 | expected:'A' | got:'A' | concept: 'lick knife'
555 | expected:'A' | got:'A' | concept: 'lick knife'
556 | expected:'C' | got:'C' | concept: 'hold knife'
557 | expected:'A' | got:'A' | concept: 'hold knife'
558 | expected:'A' | got:'C' | concept: 'hold knife'
559 | expected:'B' | got:'B' | concept: 'hold knife'
560 | expected:'D' | got:'D' | concept: 'eat donut'
561 | expected:'D' | got:'D' | concept: 'eat donut'
562 | expected:'A' | got:'A' | concept: 'eat donut'
563 | expected:'B' | got:'A' | concept: 'eat donut'
564 | expected:'C' | got:'C' | concept: 'eat hot_dog'
565 | expected:'D' | got:'A' | concept: 'eat hot_dog'
566 | expected:'D' | got:'D' | concept: 'eat hot_dog'
567 | expected:'B' | got:'C' | concept: 'eat hot_dog'
568 | expected:'A' | got:'A' | concept: 'eat apple'
569 | expected:'C' | got:'C' | concept: 'eat apple'
570 | expected:'C' | got:'C' | concept: 'eat apple'
571 | expected:'D' | got:'C' | concept: 'eat apple'
572 | expected:'B' | got:'B' | concept: 'pick apple'
573 | expected:'A' | got:'A' | concept: 'pick apple'
574 | expected:'C' | got:'C' | concept: 'pick apple'
575 | expected:'C' | got:'C' | concept: 'pick apple'
576 | expected:'C' | got:'C' | concept: 'sit_on motorcycle'
577 | expected:'A' | got:'A' | concept: 'sit_on motorcycle'
578 | expected:'A' | got:'A' | concept: 'sit_on motorcycle'
579 | expected:'C' | got:'C' | concept: 'sit_on motorcycle'
580 | expected:'B' | got:'B' | concept: 'sit_on toilet'
581 | expected:'A' | got:'A' | concept: 'sit_on toilet'
582 | expected:'A' | got:'A' | concept: 'sit_on toilet'
583 | expected:'B' | got:'B' | concept: 'sit_on toilet'
584 | expected:'D' | got:'D' | concept: 'sit_on airplane'
585 | expected:'D' | got:'D' | concept: 'sit_on airplane'
586 | expected:'A' | got:'D' | concept: 'sit_on airplane'
587 | expected:'D' | got:'D' | concept: 'sit_on airplane'
588 | expected:'B' | got:'B' | concept: 'sit_on chair'
589 | expected:'B' | got:'B' | concept: 'sit_on chair'
590 | expected:'A' | got:'A' | concept: 'sit_on chair'
591 | expected:'A' | got:'A' | concept: 'sit_on chair'
592 | expected:'A' | got:'A' | concept: 'sit_on couch'
593 | expected:'A' | got:'A' | concept: 'sit_on couch'
594 | expected:'C' | got:'C' | concept: 'sit_on couch'
595 | expected:'C' | got:'C' | concept: 'sit_on couch'
596 | expected:'A' | got:'A' | concept: 'sit_on bench'
597 | expected:'D' | got:'D' | concept: 'sit_on bench'
598 | expected:'A' | got:'A' | concept: 'sit_on bench'
599 | expected:'D' | got:'D' | concept: 'sit_on bench'
600 | expected:'B' | got:'B' | concept: 'lie_on bench'
601 | expected:'D' | got:'D' | concept: 'lie_on bench'
602 | expected:'A' | got:'D' | concept: 'lie_on bench'
603 | expected:'D' | got:'B' | concept: 'lie_on bench'
604 | expected:'C' | got:'C' | concept: 'sit_on truck'
605 | expected:'C' | got:'C' | concept: 'sit_on truck'
606 | expected:'D' | got:'D' | concept: 'sit_on truck'
607 | expected:'C' | got:'C' | concept: 'sit_on truck'
608 | expected:'B' | got:'B' | concept: 'clean oven'
609 | expected:'C' | got:'C' | concept: 'clean oven'
610 | expected:'C' | got:'C' | concept: 'clean oven'
611 | expected:'D' | got:'C' | concept: 'clean oven'
612 | expected:'C' | got:'C' | concept: 'clean microwave'
613 | expected:'D' | got:'D' | concept: 'clean microwave'
614 | expected:'A' | got:'A' | concept: 'clean microwave'
615 | expected:'D' | got:'D' | concept: 'clean microwave'
616 | expected:'C' | got:'C' | concept: 'clean toilet'
617 | expected:'C' | got:'C' | concept: 'clean toilet'
618 | expected:'B' | got:'B' | concept: 'clean toilet'
619 | expected:'D' | got:'D' | concept: 'clean toilet'
620 | expected:'D' | got:'A' | concept: 'clean keyboard'
621 | expected:'D' | got:'A' | concept: 'clean keyboard'
622 | expected:'B' | got:'B' | concept: 'clean keyboard'
623 | expected:'D' | got:'D' | concept: 'clean keyboard'
624 | expected:'D' | got:'D' | concept: 'feed bird'
625 | expected:'A' | got:'A' | concept: 'feed bird'
626 | expected:'B' | got:'B' | concept: 'feed bird'
627 | expected:'A' | got:'A' | concept: 'feed bird'
628 | expected:'B' | got:'B' | concept: 'hold banana'
629 | expected:'D' | got:'A' | concept: 'hold banana'
630 | expected:'A' | got:'A' | concept: 'hold banana'
631 | expected:'D' | got:'A' | concept: 'hold banana'
632 | expected:'B' | got:'B' | concept: 'release bird'
633 | expected:'D' | got:'D' | concept: 'release bird'
634 | expected:'A' | got:'D' | concept: 'release bird'
635 | expected:'A' | got:'A' | concept: 'release bird'
636 | expected:'A' | got:'A' | concept: 'hold bird'
637 | expected:'C' | got:'C' | concept: 'hold bird'
638 | expected:'B' | got:'B' | concept: 'hold bird'
639 | expected:'B' | got:'B' | concept: 'hold bird'
640 | expected:'C' | got:'C' | concept: 'hug dog'
641 | expected:'C' | got:'C' | concept: 'hug dog'
642 | expected:'B' | got:'B' | concept: 'hug dog'
643 | expected:'C' | got:'C' | concept: 'hug dog'
644 | expected:'D' | got:'D' | concept: 'hug horse'
645 | expected:'D' | got:'D' | concept: 'hug horse'
646 | expected:'A' | got:'A' | concept: 'hug horse'
647 | expected:'B' | got:'B' | concept: 'hug horse'
648 | expected:'C' | got:'A' | concept: 'hug cat'
649 | expected:'C' | got:'C' | concept: 'hug cat'
650 | expected:'C' | got:'C' | concept: 'hug cat'
651 | expected:'D' | got:'A' | concept: 'hug cat'
652 | expected:'C' | got:'C' | concept: 'hug person'
653 | expected:'B' | got:'B' | concept: 'hug person'
654 | expected:'D' | got:'D' | concept: 'hug person'
655 | expected:'A' | got:'A' | concept: 'hug person'
656 | expected:'C' | got:'C' | concept: 'sit_on truck'
657 | expected:'C' | got:'C' | concept: 'sit_on truck'
658 | expected:'C' | got:'C' | concept: 'sit_on truck'
659 | expected:'D' | got:'D' | concept: 'sit_on truck'
660 | expected:'B' | got:'B' | concept: 'repair bicycle'
661 | expected:'B' | got:'B' | concept: 'repair bicycle'
662 | expected:'D' | got:'A' | concept: 'repair bicycle'
663 | expected:'B' | got:'B' | concept: 'repair bicycle'
664 | expected:'C' | got:'A' | concept: 'repair truck'
665 | expected:'A' | got:'A' | concept: 'repair truck'
666 | expected:'D' | got:'A' | concept: 'repair truck'
667 | expected:'C' | got:'C' | concept: 'repair truck'
668 | expected:'B' | got:'B' | concept: 'load truck'
669 | expected:'B' | got:'B' | concept: 'load truck'
670 | expected:'B' | got:'C' | concept: 'load truck'
671 | expected:'D' | got:'A' | concept: 'load truck'
672 | expected:'C' | got:'C' | concept: 'clean toilet'
673 | expected:'A' | got:'A' | concept: 'clean toilet'
674 | expected:'D' | got:'D' | concept: 'clean toilet'
675 | expected:'C' | got:'C' | concept: 'clean toilet'
676 | expected:'C' | got:'C' | concept: 'sit_on airplane'
677 | expected:'A' | got:'A' | concept: 'sit_on airplane'
678 | expected:'B' | got:'B' | concept: 'sit_on airplane'
679 | expected:'C' | got:'C' | concept: 'sit_on airplane'
680 | expected:'A' | got:'A' | concept: 'sit_on train'
681 | expected:'B' | got:'B' | concept: 'sit_on train'
682 | expected:'D' | got:'D' | concept: 'sit_on train'
683 | expected:'A' | got:'A' | concept: 'sit_on train'
684 | expected:'C' | got:'C' | concept: 'sit_on toilet'
685 | expected:'C' | got:'C' | concept: 'sit_on toilet'
686 | expected:'A' | got:'A' | concept: 'sit_on toilet'
687 | expected:'D' | got:'D' | concept: 'sit_on toilet'
688 | expected:'B' | got:'B' | concept: 'cut pizza'
689 | expected:'C' | got:'C' | concept: 'cut pizza'
690 | expected:'C' | got:'C' | concept: 'cut pizza'
691 | expected:'D' | got:'D' | concept: 'cut pizza'
692 | expected:'A' | got:'C' | concept: 'make pizza'
693 | expected:'B' | got:'B' | concept: 'make pizza'
694 | expected:'C' | got:'C' | concept: 'make pizza'
695 | expected:'D' | got:'D' | concept: 'make pizza'
696 | expected:'D' | got:'D' | concept: 'hold pizza'
697 | expected:'D' | got:'D' | concept: 'hold pizza'
698 | expected:'D' | got:'D' | concept: 'hold pizza'
699 | expected:'B' | got:'B' | concept: 'hold pizza'
700 | expected:'A' | got:'A' | concept: 'make vase'
701 | expected:'A' | got:'A' | concept: 'make vase'
702 | expected:'A' | got:'A' | concept: 'make vase'
703 | expected:'B' | got:'B' | concept: 'make vase'
704 | expected:'B' | got:'B' | concept: 'sail boat'
705 | expected:'C' | got:'C' | concept: 'sail boat'
706 | expected:'A' | got:'D' | concept: 'sail boat'
707 | expected:'B' | got:'B' | concept: 'sail boat'
708 | expected:'A' | got:'D' | concept: 'stand_on boat'
709 | expected:'A' | got:'C' | concept: 'stand_on boat'
710 | expected:'C' | got:'C' | concept: 'stand_on boat'
711 | expected:'D' | got:'A' | concept: 'stand_on boat'
712 | expected:'D' | got:'D' | concept: 'row boat'
713 | expected:'B' | got:'C' | concept: 'row boat'
714 | expected:'D' | got:'D' | concept: 'row boat'
715 | expected:'A' | got:'A' | concept: 'row boat'
716 | expected:'B' | got:'D' | concept: 'ride boat'
717 | expected:'A' | got:'A' | concept: 'ride boat'
718 | expected:'A' | got:'D' | concept: 'ride boat'
719 | expected:'D' | got:'D' | concept: 'ride boat'
720 | expected:'B' | got:'A' | concept: 'carry keyboard'
721 | expected:'C' | got:'C' | concept: 'carry keyboard'
722 | expected:'D' | got:'A' | concept: 'carry keyboard'
723 | expected:'D' | got:'A' | concept: 'carry keyboard'
724 | expected:'A' | got:'A' | concept: 'carry handbag'
725 | expected:'D' | got:'D' | concept: 'carry handbag'
726 | expected:'C' | got:'C' | concept: 'carry handbag'
727 | expected:'D' | got:'A' | concept: 'carry handbag'
728 | expected:'D' | got:'D' | concept: 'carry snowboard'
729 | expected:'D' | got:'A' | concept: 'carry snowboard'
730 | expected:'A' | got:'A' | concept: 'carry snowboard'
731 | expected:'A' | got:'A' | concept: 'carry snowboard'
732 | expected:'D' | got:'D' | concept: 'carry surfboard'
733 | expected:'A' | got:'A' | concept: 'carry surfboard'
734 | expected:'B' | got:'B' | concept: 'carry surfboard'
735 | expected:'B' | got:'B' | concept: 'carry surfboard'
736 | expected:'C' | got:'C' | concept: 'repair laptop'
737 | expected:'B' | got:'B' | concept: 'repair laptop'
738 | expected:'B' | got:'B' | concept: 'repair laptop'
739 | expected:'C' | got:'C' | concept: 'repair laptop'
740 | expected:'B' | got:'A' | concept: 'read laptop'
741 | expected:'A' | got:'C' | concept: 'read laptop'
742 | expected:'C' | got:'C' | concept: 'read laptop'
743 | expected:'B' | got:'B' | concept: 'read laptop'
744 | expected:'C' | got:'A' | concept: 'type_on keyboard'
745 | expected:'D' | got:'C' | concept: 'type_on keyboard'
746 | expected:'D' | got:'B' | concept: 'type_on keyboard'
747 | expected:'D' | got:'D' | concept: 'type_on keyboard'
748 | expected:'A' | got:'A' | concept: 'type_on laptop'
749 | expected:'A' | got:'A' | concept: 'type_on laptop'
750 | expected:'A' | got:'A' | concept: 'type_on laptop'
751 | expected:'A' | got:'A' | concept: 'type_on laptop'
752 | expected:'D' | got:'D' | concept: 'serve sports_ball'
753 | expected:'D' | got:'D' | concept: 'serve sports_ball'
754 | expected:'C' | got:'C' | concept: 'serve sports_ball'
755 | expected:'D' | got:'D' | concept: 'serve sports_ball'
756 | expected:'D' | got:'D' | concept: 'kick sports_ball'
757 | expected:'A' | got:'A' | concept: 'kick sports_ball'
758 | expected:'A' | got:'A' | concept: 'kick sports_ball'
759 | expected:'C' | got:'C' | concept: 'kick sports_ball'
760 | expected:'C' | got:'A' | concept: 'spin sports_ball'
761 | expected:'C' | got:'D' | concept: 'spin sports_ball'
762 | expected:'D' | got:'B' | concept: 'spin sports_ball'
763 | expected:'A' | got:'D' | concept: 'spin sports_ball'
764 | expected:'C' | got:'C' | concept: 'hold sports_ball'
765 | expected:'A' | got:'INVALID' | concept: 'hold sports_ball'
766 | expected:'A' | got:'A' | concept: 'hold sports_ball'
767 | expected:'D' | got:'B' | concept: 'hold sports_ball'
768 | expected:'D' | got:'D' | concept: 'hold sports_ball'
769 | expected:'A' | got:'C' | concept: 'hold sports_ball'
770 | expected:'D' | got:'A' | concept: 'hold sports_ball'
771 | expected:'A' | got:'A' | concept: 'hold sports_ball'
772 | expected:'A' | got:'A' | concept: 'hold sandwich'
773 | expected:'D' | got:'D' | concept: 'hold sandwich'
774 | expected:'C' | got:'C' | concept: 'hold sandwich'
775 | expected:'A' | got:'A' | concept: 'hold sandwich'
776 | expected:'C' | got:'C' | concept: 'hold remote'
777 | expected:'C' | got:'C' | concept: 'hold remote'
778 | expected:'B' | got:'B' | concept: 'hold remote'
779 | expected:'B' | got:'B' | concept: 'hold remote'
780 | expected:'A' | got:'A' | concept: 'hold bird'
781 | expected:'D' | got:'D' | concept: 'hold bird'
782 | expected:'C' | got:'C' | concept: 'hold bird'
783 | expected:'D' | got:'D' | concept: 'hold bird'
784 | expected:'A' | got:'C' | concept: 'block sports_ball'
785 | expected:'D' | got:'D' | concept: 'block sports_ball'
786 | expected:'C' | got:'C' | concept: 'block sports_ball'
787 | expected:'D' | got:'D' | concept: 'block sports_ball'
788 | expected:'D' | got:'D' | concept: 'dribble sports_ball'
789 | expected:'D' | got:'D' | concept: 'dribble sports_ball'
790 | expected:'A' | got:'A' | concept: 'dribble sports_ball'
791 | expected:'C' | got:'C' | concept: 'dribble sports_ball'
792 | expected:'D' | got:'A' | concept: 'hold sports_ball'
793 | expected:'C' | got:'C' | concept: 'hold sports_ball'
794 | expected:'D' | got:'D' | concept: 'hold sports_ball'
795 | expected:'C' | got:'C' | concept: 'hold sports_ball'
796 | expected:'C' | got:'D' | concept: 'spin sports_ball'
797 | expected:'B' | got:'D' | concept: 'spin sports_ball'
798 | expected:'C' | got:'C' | concept: 'spin sports_ball'
799 | expected:'C' | got:'B' | concept: 'spin sports_ball'
800 | expected:'D' | got:'D' | concept: 'sit_on train'
801 | expected:'C' | got:'B' | concept: 'sit_on train'
802 | expected:'A' | got:'A' | concept: 'sit_on train'
803 | expected:'C' | got:'C' | concept: 'sit_on train'
804 | expected:'D' | got:'D' | concept: 'sit_on airplane'
805 | expected:'B' | got:'B' | concept: 'sit_on airplane'
806 | expected:'A' | got:'A' | concept: 'sit_on airplane'
807 | expected:'D' | got:'D' | concept: 'sit_on airplane'
808 | expected:'B' | got:'B' | concept: 'sit_on bed'
809 | expected:'C' | got:'C' | concept: 'sit_on bed'
810 | expected:'D' | got:'D' | concept: 'sit_on bed'
811 | expected:'C' | got:'C' | concept: 'sit_on bed'
812 | expected:'D' | got:'D' | concept: 'direct airplane'
813 | expected:'D' | got:'D' | concept: 'direct airplane'
814 | expected:'C' | got:'C' | concept: 'direct airplane'
815 | expected:'D' | got:'D' | concept: 'direct airplane'
816 | expected:'B' | got:'B' | concept: 'adjust_or_tie tie'
817 | expected:'A' | got:'A' | concept: 'adjust_or_tie tie'
818 | expected:'D' | got:'C' | concept: 'adjust_or_tie tie'
819 | expected:'B' | got:'B' | concept: 'adjust_or_tie tie'
820 | expected:'D' | got:'D' | concept: 'help_adjust_or_tie tie'
821 | expected:'D' | got:'D' | concept: 'help_adjust_or_tie tie'
822 | expected:'D' | got:'D' | concept: 'help_adjust_or_tie tie'
823 | expected:'B' | got:'B' | concept: 'help_adjust_or_tie tie'
824 | expected:'A' | got:'A' | concept: 'wear backpack'
825 | expected:'A' | got:'C' | concept: 'wear backpack'
826 | expected:'C' | got:'C' | concept: 'wear backpack'
827 | expected:'B' | got:'B' | concept: 'wear backpack'
828 | expected:'C' | got:'A' | concept: 'wear tie'
829 | expected:'B' | got:'B' | concept: 'wear tie'
830 | expected:'C' | got:'C' | concept: 'wear tie'
831 | expected:'A' | got:'A' | concept: 'wear tie'
832 | expected:'A' | got:'A' | concept: 'inspect surfboard'
833 | expected:'D' | got:'D' | concept: 'inspect surfboard'
834 | expected:'A' | got:'A' | concept: 'inspect surfboard'
835 | expected:'C' | got:'C' | concept: 'inspect surfboard'
836 | expected:'C' | got:'C' | concept: 'ride surfboard'
837 | expected:'D' | got:'D' | concept: 'ride surfboard'
838 | expected:'C' | got:'C' | concept: 'ride surfboard'
839 | expected:'D' | got:'D' | concept: 'ride surfboard'
840 | expected:'B' | got:'A' | concept: 'jump surfboard'
841 | expected:'B' | got:'D' | concept: 'jump surfboard'
842 | expected:'C' | got:'C' | concept: 'jump surfboard'
843 | expected:'D' | got:'D' | concept: 'jump surfboard'
844 | expected:'C' | got:'C' | concept: 'inspect bicycle'
845 | expected:'D' | got:'D' | concept: 'inspect bicycle'
846 | expected:'B' | got:'B' | concept: 'inspect bicycle'
847 | expected:'A' | got:'A' | concept: 'inspect bicycle'
848 | expected:'B' | got:'B' | concept: 'hold mouse'
849 | expected:'B' | got:'B' | concept: 'hold mouse'
850 | expected:'B' | got:'B' | concept: 'hold mouse'
851 | expected:'A' | got:'A' | concept: 'hold mouse'
852 | expected:'A' | got:'A' | concept: 'hold backpack'
853 | expected:'B' | got:'B' | concept: 'hold backpack'
854 | expected:'A' | got:'A' | concept: 'hold backpack'
855 | expected:'C' | got:'C' | concept: 'hold backpack'
856 | expected:'D' | got:'D' | concept: 'hold hot_dog'
857 | expected:'C' | got:'C' | concept: 'hold hot_dog'
858 | expected:'C' | got:'C' | concept: 'hold hot_dog'
859 | expected:'B' | got:'B' | concept: 'hold hot_dog'
860 | expected:'D' | got:'INVALID' | concept: 'hold kite'
861 | expected:'B' | got:'B' | concept: 'hold kite'
862 | expected:'B' | got:'B' | concept: 'hold kite'
863 | expected:'B' | got:'B' | concept: 'hold kite'
864 | expected:'B' | got:'B' | concept: 'hold pizza'
865 | expected:'D' | got:'A' | concept: 'hold pizza'
866 | expected:'D' | got:'A' | concept: 'hold pizza'
867 | expected:'A' | got:'A' | concept: 'hold pizza'
868 | expected:'C' | got:'A' | concept: 'hold sandwich'
869 | expected:'A' | got:'A' | concept: 'hold sandwich'
870 | expected:'C' | got:'C' | concept: 'hold sandwich'
871 | expected:'B' | got:'B' | concept: 'hold sandwich'
872 | expected:'A' | got:'A' | concept: 'hold cell_phone'
873 | expected:'A' | got:'A' | concept: 'hold cell_phone'
874 | expected:'B' | got:'B' | concept: 'hold cell_phone'
875 | expected:'A' | got:'A' | concept: 'hold cell_phone'
876 | expected:'A' | got:'A' | concept: 'hold bottle'
877 | expected:'D' | got:'B' | concept: 'hold bottle'
878 | expected:'B' | got:'B' | concept: 'hold bottle'
879 | expected:'C' | got:'C' | concept: 'hold bottle'
880 | expected:'B' | got:'B' | concept: 'hold hot_dog'
881 | expected:'A' | got:'A' | concept: 'hold hot_dog'
882 | expected:'A' | got:'B' | concept: 'hold hot_dog'
883 | expected:'C' | got:'B' | concept: 'hold hot_dog'
884 | expected:'A' | got:'A' | concept: 'hold person'
885 | expected:'B' | got:'B' | concept: 'hold person'
886 | expected:'B' | got:'B' | concept: 'hold person'
887 | expected:'C' | got:'C' | concept: 'hold person'
888 | expected:'B' | got:'B' | concept: 'hold book'
889 | expected:'C' | got:'C' | concept: 'hold book'
890 | expected:'D' | got:'D' | concept: 'hold book'
891 | expected:'B' | got:'B' | concept: 'hold book'
892 | expected:'B' | got:'B' | concept: 'hold bicycle'
893 | expected:'B' | got:'B' | concept: 'hold bicycle'
894 | expected:'C' | got:'C' | concept: 'hold bicycle'
895 | expected:'D' | got:'D' | concept: 'hold bicycle'
896 | expected:'B' | got:'B' | concept: 'peel orange'
897 | expected:'C' | got:'C' | concept: 'peel orange'
898 | expected:'D' | got:'D' | concept: 'peel orange'
899 | expected:'D' | got:'D' | concept: 'peel orange'
900 | expected:'C' | got:'C' | concept: 'hold orange'
901 | expected:'D' | got:'C' | concept: 'hold orange'
902 | expected:'B' | got:'C' | concept: 'hold orange'
903 | expected:'B' | got:'B' | concept: 'hold orange'
904 | expected:'B' | got:'B' | concept: 'eat orange'
905 | expected:'B' | got:'D' | concept: 'eat orange'
906 | expected:'A' | got:'D' | concept: 'eat orange'
907 | expected:'D' | got:'D' | concept: 'eat orange'
908 | expected:'C' | got:'C' | concept: 'squeeze orange'
909 | expected:'B' | got:'B' | concept: 'squeeze orange'
910 | expected:'B' | got:'B' | concept: 'squeeze orange'
911 | expected:'B' | got:'B' | concept: 'squeeze orange'
912 | expected:'D' | got:'A' | concept: 'repair truck'
913 | expected:'D' | got:'A' | concept: 'repair truck'
914 | expected:'B' | got:'B' | concept: 'repair truck'
915 | expected:'C' | got:'D' | concept: 'repair truck'
916 | expected:'C' | got:'C' | concept: 'sit_on bed'
917 | expected:'B' | got:'B' | concept: 'sit_on bed'
918 | expected:'D' | got:'D' | concept: 'sit_on bed'
919 | expected:'A' | got:'A' | concept: 'sit_on bed'
920 | expected:'B' | got:'B' | concept: 'load truck'
921 | expected:'A' | got:'A' | concept: 'load truck'
922 | expected:'A' | got:'A' | concept: 'load truck'
923 | expected:'C' | got:'C' | concept: 'load truck'
924 | expected:'B' | got:'A' | concept: 'sit_on truck'
925 | expected:'B' | got:'B' | concept: 'sit_on truck'
926 | expected:'A' | got:'A' | concept: 'sit_on truck'
927 | expected:'A' | got:'D' | concept: 'sit_on truck'
928 | expected:'D' | got:'D' | concept: 'sit_on toilet'
929 | expected:'A' | got:'A' | concept: 'sit_on toilet'
930 | expected:'A' | got:'A' | concept: 'sit_on toilet'
931 | expected:'D' | got:'D' | concept: 'sit_on toilet'
932 | expected:'B' | got:'B' | concept: 'clean oven'
933 | expected:'C' | got:'C' | concept: 'clean oven'
934 | expected:'C' | got:'C' | concept: 'clean oven'
935 | expected:'B' | got:'B' | concept: 'clean oven'
936 | expected:'C' | got:'C' | concept: 'clean horse'
937 | expected:'B' | got:'B' | concept: 'clean horse'
938 | expected:'C' | got:'C' | concept: 'clean horse'
939 | expected:'C' | got:'C' | concept: 'clean horse'
940 | expected:'D' | got:'D' | concept: 'clean toilet'
941 | expected:'D' | got:'D' | concept: 'clean toilet'
942 | expected:'A' | got:'A' | concept: 'clean toilet'
943 | expected:'B' | got:'B' | concept: 'clean toilet'
944 | expected:'B' | got:'D' | concept: 'throw frisbee'
945 | expected:'C' | got:'C' | concept: 'throw frisbee'
946 | expected:'C' | got:'B' | concept: 'throw frisbee'
947 | expected:'A' | got:'C' | concept: 'throw frisbee'
948 | expected:'D' | got:'C' | concept: 'catch frisbee'
949 | expected:'D' | got:'D' | concept: 'catch frisbee'
950 | expected:'D' | got:'D' | concept: 'catch frisbee'
951 | expected:'C' | got:'C' | concept: 'catch frisbee'
952 | expected:'D' | got:'D' | concept: 'hold knife'
953 | expected:'B' | got:'B' | concept: 'hold knife'
954 | expected:'C' | got:'C' | concept: 'hold knife'
955 | expected:'C' | got:'C' | concept: 'hold knife'
956 | expected:'B' | got:'B' | concept: 'hold frisbee'
957 | expected:'C' | got:'D' | concept: 'hold frisbee'
958 | expected:'A' | got:'D' | concept: 'hold frisbee'
959 | expected:'B' | got:'D' | concept: 'hold frisbee'
960 | expected:'C' | got:'C' | concept: 'hold vase'
961 | expected:'C' | got:'C' | concept: 'hold vase'
962 | expected:'A' | got:'A' | concept: 'hold vase'
963 | expected:'C' | got:'C' | concept: 'hold vase'
964 | expected:'D' | got:'D' | concept: 'hold backpack'
965 | expected:'B' | got:'B' | concept: 'hold backpack'
966 | expected:'C' | got:'C' | concept: 'hold backpack'
967 | expected:'D' | got:'A' | concept: 'hold backpack'
968 | expected:'A' | got:'A' | concept: 'hold horse'
969 | expected:'B' | got:'B' | concept: 'hold horse'
970 | expected:'A' | got:'A' | concept: 'hold horse'
971 | expected:'D' | got:'D' | concept: 'hold horse'
972 | expected:'A' | got:'A' | concept: 'hold spoon'
973 | expected:'C' | got:'C' | concept: 'hold spoon'
974 | expected:'A' | got:'A' | concept: 'hold spoon'
975 | expected:'C' | got:'C' | concept: 'hold spoon'
976 | expected:'A' | got:'A' | concept: 'ride skateboard'
977 | expected:'C' | got:'A' | concept: 'ride skateboard'
978 | expected:'A' | got:'C' | concept: 'ride skateboard'
979 | expected:'A' | got:'A' | concept: 'ride skateboard'
980 | expected:'A' | got:'A' | concept: 'grind skateboard'
981 | expected:'B' | got:'B' | concept: 'grind skateboard'
982 | expected:'C' | got:'C' | concept: 'grind skateboard'
983 | expected:'A' | got:'A' | concept: 'grind skateboard'
984 | expected:'B' | got:'B' | concept: 'hold skateboard'
985 | expected:'B' | got:'B' | concept: 'hold skateboard'
986 | expected:'C' | got:'C' | concept: 'hold skateboard'
987 | expected:'A' | got:'A' | concept: 'hold skateboard'
988 | expected:'D' | got:'D' | concept: 'sit_on skateboard'
989 | expected:'C' | got:'C' | concept: 'sit_on skateboard'
990 | expected:'C' | got:'C' | concept: 'sit_on skateboard'
991 | expected:'A' | got:'C' | concept: 'sit_on skateboard'
992 | expected:'A' | got:'A' | concept: 'sit_on truck'
993 | expected:'C' | got:'C' | concept: 'sit_on truck'
994 | expected:'C' | got:'C' | concept: 'sit_on truck'
995 | expected:'B' | got:'B' | concept: 'sit_on truck'
996 | expected:'B' | got:'B' | concept: 'sit_on toilet'
997 | expected:'D' | got:'D' | concept: 'sit_on toilet'
998 | expected:'B' | got:'B' | concept: 'sit_on toilet'
999 | expected:'A' | got:'A' | concept: 'sit_on toilet'
1000 | expected:'B' | got:'B' | concept: 'sit_on skateboard'
1001 | expected:'C' | got:'C' | concept: 'sit_on skateboard'
1002 | expected:'B' | got:'B' | concept: 'sit_on skateboard'
1003 | expected:'A' | got:'A' | concept: 'sit_on skateboard'
1004 | expected:'C' | got:'C' | concept: 'sit_on motorcycle'
1005 | expected:'D' | got:'D' | concept: 'sit_on motorcycle'
1006 | expected:'D' | got:'D' | concept: 'sit_on motorcycle'
1007 | expected:'B' | got:'B' | concept: 'sit_on motorcycle'
1008 | expected:'D' | got:'A' | concept: 'repair laptop'
1009 | expected:'D' | got:'A' | concept: 'repair laptop'
1010 | expected:'A' | got:'A' | concept: 'repair laptop'
1011 | expected:'D' | got:'A' | concept: 'repair laptop'
1012 | expected:'A' | got:'A' | concept: 'type_on laptop'
1013 | expected:'A' | got:'A' | concept: 'type_on laptop'
1014 | expected:'B' | got:'B' | concept: 'type_on laptop'
1015 | expected:'C' | got:'C' | concept: 'type_on laptop'
1016 | expected:'D' | got:'A' | concept: 'read book'
1017 | expected:'A' | got:'A' | concept: 'read book'
1018 | expected:'C' | got:'A' | concept: 'read book'
1019 | expected:'B' | got:'B' | concept: 'read book'
1020 | expected:'D' | got:'B' | concept: 'read laptop'
1021 | expected:'C' | got:'A' | concept: 'read laptop'
1022 | expected:'C' | got:'A' | concept: 'read laptop'
1023 | expected:'D' | got:'B' | concept: 'read laptop'
1024 | expected:'C' | got:'D' | concept: 'straddle bicycle'
1025 | expected:'C' | got:'B' | concept: 'straddle bicycle'
1026 | expected:'A' | got:'A' | concept: 'straddle bicycle'
1027 | expected:'B' | got:'B' | concept: 'straddle bicycle'
1028 | expected:'D' | got:'D' | concept: 'jump bicycle'
1029 | expected:'B' | got:'B' | concept: 'jump bicycle'
1030 | expected:'C' | got:'B' | concept: 'jump bicycle'
1031 | expected:'B' | got:'B' | concept: 'jump bicycle'
1032 | expected:'B' | got:'B' | concept: 'straddle motorcycle'
1033 | expected:'C' | got:'C' | concept: 'straddle motorcycle'
1034 | expected:'B' | got:'B' | concept: 'straddle motorcycle'
1035 | expected:'A' | got:'A' | concept: 'straddle motorcycle'
1036 | expected:'C' | got:'C' | concept: 'inspect bicycle'
1037 | expected:'B' | got:'B' | concept: 'inspect bicycle'
1038 | expected:'A' | got:'A' | concept: 'inspect bicycle'
1039 | expected:'D' | got:'D' | concept: 'inspect bicycle'
1040 | expected:'B' | got:'B' | concept: 'jump skateboard'
1041 | expected:'D' | got:'D' | concept: 'jump skateboard'
1042 | expected:'A' | got:'A' | concept: 'jump skateboard'
1043 | expected:'B' | got:'B' | concept: 'jump skateboard'
1044 | expected:'A' | got:'A' | concept: 'jump skis'
1045 | expected:'A' | got:'A' | concept: 'jump skis'
1046 | expected:'A' | got:'A' | concept: 'jump skis'
1047 | expected:'A' | got:'A' | concept: 'jump skis'
1048 | expected:'A' | got:'A' | concept: 'jump surfboard'
1049 | expected:'A' | got:'A' | concept: 'jump surfboard'
1050 | expected:'C' | got:'C' | concept: 'jump surfboard'
1051 | expected:'C' | got:'C' | concept: 'jump surfboard'
1052 | expected:'C' | got:'C' | concept: 'jump bicycle'
1053 | expected:'A' | got:'D' | concept: 'jump bicycle'
1054 | expected:'A' | got:'A' | concept: 'jump bicycle'
1055 | expected:'C' | got:'C' | concept: 'jump bicycle'
1056 | expected:'D' | got:'D' | concept: 'block sports_ball'
1057 | expected:'C' | got:'D' | concept: 'block sports_ball'
1058 | expected:'C' | got:'B' | concept: 'block sports_ball'
1059 | expected:'B' | got:'B' | concept: 'block sports_ball'
1060 | expected:'D' | got:'B' | concept: 'dribble sports_ball'
1061 | expected:'C' | got:'B' | concept: 'dribble sports_ball'
1062 | expected:'C' | got:'C' | concept: 'dribble sports_ball'
1063 | expected:'C' | got:'B' | concept: 'dribble sports_ball'
1064 | expected:'B' | got:'B' | concept: 'kick sports_ball'
1065 | expected:'D' | got:'D' | concept: 'kick sports_ball'
1066 | expected:'B' | got:'B' | concept: 'kick sports_ball'
1067 | expected:'D' | got:'D' | concept: 'kick sports_ball'
1068 | expected:'C' | got:'A' | concept: 'hold sports_ball'
1069 | expected:'D' | got:'D' | concept: 'hold sports_ball'
1070 | expected:'C' | got:'D' | concept: 'hold sports_ball'
1071 | expected:'A' | got:'C' | concept: 'hold sports_ball'
1072 | expected:'A' | got:'A' | concept: 'feed horse'
1073 | expected:'B' | got:'B' | concept: 'feed horse'
1074 | expected:'A' | got:'A' | concept: 'feed horse'
1075 | expected:'D' | got:'D' | concept: 'feed horse'
1076 | expected:'B' | got:'B' | concept: 'kiss person'
1077 | expected:'D' | got:'D' | concept: 'kiss person'
1078 | expected:'B' | got:'B' | concept: 'kiss person'
1079 | expected:'D' | got:'D' | concept: 'kiss person'
1080 | expected:'B' | got:'B' | concept: 'jump horse'
1081 | expected:'C' | got:'C' | concept: 'jump horse'
1082 | expected:'D' | got:'D' | concept: 'jump horse'
1083 | expected:'A' | got:'A' | concept: 'jump horse'
1084 | expected:'C' | got:'C' | concept: 'kiss horse'
1085 | expected:'D' | got:'D' | concept: 'kiss horse'
1086 | expected:'C' | got:'C' | concept: 'kiss horse'
1087 | expected:'A' | got:'A' | concept: 'kiss horse'
1088 | expected:'D' | got:'D' | concept: 'throw frisbee'
1089 | expected:'C' | got:'C' | concept: 'throw frisbee'
1090 | expected:'A' | got:'D' | concept: 'throw frisbee'
1091 | expected:'A' | got:'D' | concept: 'throw frisbee'
1092 | expected:'A' | got:'A' | concept: 'catch frisbee'
1093 | expected:'D' | got:'D' | concept: 'catch frisbee'
1094 | expected:'A' | got:'D' | concept: 'catch frisbee'
1095 | expected:'D' | got:'B' | concept: 'catch frisbee'
1096 | expected:'B' | got:'C' | concept: 'hold frisbee'
1097 | expected:'A' | got:'B' | concept: 'hold frisbee'
1098 | expected:'D' | got:'D' | concept: 'hold frisbee'
1099 | expected:'C' | got:'C' | concept: 'hold frisbee'
1100 | expected:'A' | got:'A' | concept: 'hold scissors'
1101 | expected:'C' | got:'C' | concept: 'hold scissors'
1102 | expected:'B' | got:'B' | concept: 'hold scissors'
1103 | expected:'A' | got:'A' | concept: 'hold scissors'
1104 | expected:'B' | got:'A' | concept: 'eat_at dining_table'
1105 | expected:'D' | got:'D' | concept: 'eat_at dining_table'
1106 | expected:'A' | got:'A' | concept: 'eat_at dining_table'
1107 | expected:'B' | got:'C' | concept: 'eat_at dining_table'
1108 | expected:'A' | got:'A' | concept: 'cut pizza'
1109 | expected:'C' | got:'C' | concept: 'cut pizza'
1110 | expected:'B' | got:'B' | concept: 'cut pizza'
1111 | expected:'D' | got:'D' | concept: 'cut pizza'
1112 | expected:'B' | got:'B' | concept: 'jump snowboard'
1113 | expected:'C' | got:'C' | concept: 'jump snowboard'
1114 | expected:'D' | got:'A' | concept: 'jump snowboard'
1115 | expected:'D' | got:'D' | concept: 'jump snowboard'
1116 | expected:'D' | got:'D' | concept: 'sit_at dining_table'
1117 | expected:'A' | got:'A' | concept: 'sit_at dining_table'
1118 | expected:'A' | got:'B' | concept: 'sit_at dining_table'
1119 | expected:'C' | got:'C' | concept: 'sit_at dining_table'
1120 | expected:'C' | got:'C' | concept: 'make pizza'
1121 | expected:'B' | got:'B' | concept: 'make pizza'
1122 | expected:'B' | got:'B' | concept: 'make pizza'
1123 | expected:'B' | got:'B' | concept: 'make pizza'
1124 | expected:'A' | got:'A' | concept: 'cut pizza'
1125 | expected:'B' | got:'A' | concept: 'cut pizza'
1126 | expected:'B' | got:'B' | concept: 'cut pizza'
1127 | expected:'D' | got:'D' | concept: 'cut pizza'
1128 | expected:'C' | got:'C' | concept: 'eat pizza'
1129 | expected:'C' | got:'C' | concept: 'eat pizza'
1130 | expected:'B' | got:'B' | concept: 'eat pizza'
1131 | expected:'D' | got:'D' | concept: 'eat pizza'
1132 | expected:'C' | got:'D' | concept: 'hold pizza'
1133 | expected:'A' | got:'A' | concept: 'hold pizza'
1134 | expected:'D' | got:'D' | concept: 'hold pizza'
1135 | expected:'B' | got:'B' | concept: 'hold pizza'
1136 | expected:'B' | got:'B' | concept: 'repair laptop'
1137 | expected:'C' | got:'C' | concept: 'repair laptop'
1138 | expected:'A' | got:'A' | concept: 'repair laptop'
1139 | expected:'A' | got:'A' | concept: 'repair laptop'
1140 | expected:'A' | got:'A' | concept: 'read book'
1141 | expected:'C' | got:'C' | concept: 'read book'
1142 | expected:'D' | got:'A' | concept: 'read book'
1143 | expected:'A' | got:'A' | concept: 'read book'
1144 | expected:'A' | got:'B' | concept: 'read laptop'
1145 | expected:'B' | got:'B' | concept: 'read laptop'
1146 | expected:'C' | got:'C' | concept: 'read laptop'
1147 | expected:'B' | got:'B' | concept: 'read laptop'
1148 | expected:'B' | got:'B' | concept: 'hold laptop'
1149 | expected:'D' | got:'A' | concept: 'hold laptop'
1150 | expected:'A' | got:'A' | concept: 'hold laptop'
1151 | expected:'A' | got:'A' | concept: 'hold laptop'
1152 | expected:'C' | got:'C' | concept: 'feed horse'
1153 | expected:'B' | got:'B' | concept: 'feed horse'
1154 | expected:'D' | got:'D' | concept: 'feed horse'
1155 | expected:'A' | got:'A' | concept: 'feed horse'
1156 | expected:'D' | got:'C' | concept: 'inspect motorcycle'
1157 | expected:'B' | got:'B' | concept: 'inspect motorcycle'
1158 | expected:'C' | got:'C' | concept: 'inspect motorcycle'
1159 | expected:'C' | got:'C' | concept: 'inspect motorcycle'
1160 | expected:'D' | got:'D' | concept: 'direct airplane'
1161 | expected:'B' | got:'B' | concept: 'direct airplane'
1162 | expected:'A' | got:'A' | concept: 'direct airplane'
1163 | expected:'B' | got:'B' | concept: 'direct airplane'
1164 | expected:'C' | got:'C' | concept: 'eat orange'
1165 | expected:'B' | got:'B' | concept: 'eat orange'
1166 | expected:'B' | got:'B' | concept: 'eat orange'
1167 | expected:'A' | got:'A' | concept: 'eat orange'
1168 | expected:'D' | got:'C' | concept: 'release bird'
1169 | expected:'C' | got:'C' | concept: 'release bird'
1170 | expected:'B' | got:'B' | concept: 'release bird'
1171 | expected:'C' | got:'C' | concept: 'release bird'
1172 | expected:'C' | got:'C' | concept: 'hold kite'
1173 | expected:'C' | got:'C' | concept: 'hold kite'
1174 | expected:'D' | got:'D' | concept: 'hold kite'
1175 | expected:'C' | got:'C' | concept: 'hold kite'
1176 | expected:'B' | got:'B' | concept: 'hold bird'
1177 | expected:'A' | got:'A' | concept: 'hold bird'
1178 | expected:'A' | got:'A' | concept: 'hold bird'
1179 | expected:'B' | got:'C' | concept: 'hold bird'
1180 | expected:'D' | got:'C' | concept: 'feed bird'
1181 | expected:'B' | got:'B' | concept: 'feed bird'
1182 | expected:'C' | got:'C' | concept: 'feed bird'
1183 | expected:'D' | got:'D' | concept: 'feed bird'
1184 | expected:'A' | got:'A' | concept: 'walk dog'
1185 | expected:'A' | got:'A' | concept: 'walk dog'
1186 | expected:'C' | got:'C' | concept: 'walk dog'
1187 | expected:'A' | got:'A' | concept: 'walk dog'
1188 | expected:'D' | got:'D' | concept: 'kiss dog'
1189 | expected:'D' | got:'D' | concept: 'kiss dog'
1190 | expected:'A' | got:'A' | concept: 'kiss dog'
1191 | expected:'C' | got:'C' | concept: 'kiss dog'
1192 | expected:'D' | got:'A' | concept: 'train dog'
1193 | expected:'C' | got:'C' | concept: 'train dog'
1194 | expected:'C' | got:'D' | concept: 'train dog'
1195 | expected:'C' | got:'C' | concept: 'train dog'
1196 | expected:'A' | got:'A' | concept: 'hug dog'
1197 | expected:'B' | got:'B' | concept: 'hug dog'
1198 | expected:'B' | got:'B' | concept: 'hug dog'
1199 | expected:'A' | got:'D' | concept: 'hug dog'
1200 | expected:'D' | got:'A' | concept: 'load truck'
1201 | expected:'B' | got:'B' | concept: 'load truck'
1202 | expected:'A' | got:'A' | concept: 'load truck'
1203 | expected:'A' | got:'A' | concept: 'load truck'
1204 | expected:'C' | got:'C' | concept: 'repair truck'
1205 | expected:'B' | got:'B' | concept: 'repair truck'
1206 | expected:'D' | got:'D' | concept: 'repair truck'
1207 | expected:'B' | got:'B' | concept: 'repair truck'
1208 | expected:'B' | got:'B' | concept: 'repair laptop'
1209 | expected:'A' | got:'A' | concept: 'repair laptop'
1210 | expected:'B' | got:'B' | concept: 'repair laptop'
1211 | expected:'B' | got:'B' | concept: 'repair laptop'
1212 | expected:'B' | got:'B' | concept: 'sit_on truck'
1213 | expected:'A' | got:'A' | concept: 'sit_on truck'
1214 | expected:'C' | got:'C' | concept: 'sit_on truck'
1215 | expected:'B' | got:'B' | concept: 'sit_on truck'
1216 | expected:'B' | got:'C' | concept: 'cut_with scissors'
1217 | expected:'D' | got:'D' | concept: 'cut_with scissors'
1218 | expected:'B' | got:'A' | concept: 'cut_with scissors'
1219 | expected:'C' | got:'C' | concept: 'cut_with scissors'
1220 | expected:'C' | got:'D' | concept: 'hold scissors'
1221 | expected:'D' | got:'C' | concept: 'hold scissors'
1222 | expected:'B' | got:'C' | concept: 'hold scissors'
1223 | expected:'D' | got:'D' | concept: 'hold scissors'
1224 | expected:'D' | got:'A' | concept: 'hold wine_glass'
1225 | expected:'A' | got:'A' | concept: 'hold wine_glass'
1226 | expected:'A' | got:'A' | concept: 'hold wine_glass'
1227 | expected:'B' | got:'B' | concept: 'hold wine_glass'
1228 | expected:'B' | got:'B' | concept: 'cut_with knife'
1229 | expected:'B' | got:'B' | concept: 'cut_with knife'
1230 | expected:'D' | got:'D' | concept: 'cut_with knife'
1231 | expected:'C' | got:'D' | concept: 'cut_with knife'
1232 | expected:'D' | got:'D' | concept: 'ride skateboard'
1233 | expected:'C' | got:'C' | concept: 'ride skateboard'
1234 | expected:'D' | got:'D' | concept: 'ride skateboard'
1235 | expected:'B' | got:'B' | concept: 'ride skateboard'
1236 | expected:'A' | got:'A' | concept: 'ride skis'
1237 | expected:'C' | got:'C' | concept: 'ride skis'
1238 | expected:'A' | got:'A' | concept: 'ride skis'
1239 | expected:'C' | got:'C' | concept: 'ride skis'
1240 | expected:'A' | got:'A' | concept: 'ride snowboard'
1241 | expected:'D' | got:'D' | concept: 'ride snowboard'
1242 | expected:'A' | got:'A' | concept: 'ride snowboard'
1243 | expected:'A' | got:'A' | concept: 'ride snowboard'
1244 | expected:'C' | got:'C' | concept: 'ride horse'
1245 | expected:'D' | got:'D' | concept: 'ride horse'
1246 | expected:'D' | got:'D' | concept: 'ride horse'
1247 | expected:'C' | got:'C' | concept: 'ride horse'
1248 | expected:'D' | got:'D' | concept: 'repair laptop'
1249 | expected:'C' | got:'C' | concept: 'repair laptop'
1250 | expected:'D' | got:'A' | concept: 'repair laptop'
1251 | expected:'C' | got:'C' | concept: 'repair laptop'
1252 | expected:'C' | got:'C' | concept: 'read laptop'
1253 | expected:'B' | got:'B' | concept: 'read laptop'
1254 | expected:'A' | got:'A' | concept: 'read laptop'
1255 | expected:'A' | got:'A' | concept: 'read laptop'
1256 | expected:'A' | got:'A' | concept: 'repair bicycle'
1257 | expected:'D' | got:'A' | concept: 'repair bicycle'
1258 | expected:'C' | got:'C' | concept: 'repair bicycle'
1259 | expected:'C' | got:'A' | concept: 'repair bicycle'
1260 | expected:'C' | got:'C' | concept: 'hold laptop'
1261 | expected:'C' | got:'C' | concept: 'hold laptop'
1262 | expected:'A' | got:'A' | concept: 'hold laptop'
1263 | expected:'C' | got:'B' | concept: 'hold laptop'
1264 | expected:'D' | got:'D' | concept: 'block sports_ball'
1265 | expected:'A' | got:'C' | concept: 'block sports_ball'
1266 | expected:'B' | got:'A' | concept: 'block sports_ball'
1267 | expected:'A' | got:'A' | concept: 'block sports_ball'
1268 | expected:'D' | got:'A' | concept: 'dribble sports_ball'
1269 | expected:'D' | got:'C' | concept: 'dribble sports_ball'
1270 | expected:'D' | got:'B' | concept: 'dribble sports_ball'
1271 | expected:'C' | got:'B' | concept: 'dribble sports_ball'
1272 | expected:'C' | got:'D' | concept: 'spin sports_ball'
1273 | expected:'A' | got:'A' | concept: 'spin sports_ball'
1274 | expected:'D' | got:'A' | concept: 'spin sports_ball'
1275 | expected:'C' | got:'D' | concept: 'spin sports_ball'
1276 | expected:'C' | got:'C' | concept: 'kick sports_ball'
1277 | expected:'A' | got:'A' | concept: 'kick sports_ball'
1278 | expected:'B' | got:'B' | concept: 'kick sports_ball'
1279 | expected:'A' | got:'A' | concept: 'kick sports_ball'
1280 | expected:'A' | got:'A' | concept: 'greet person'
1281 | expected:'B' | got:'B' | concept: 'greet person'
1282 | expected:'B' | got:'D' | concept: 'greet person'
1283 | expected:'D' | got:'D' | concept: 'greet person'
1284 | expected:'C' | got:'C' | concept: 'hug person'
1285 | expected:'A' | got:'C' | concept: 'hug person'
1286 | expected:'C' | got:'C' | concept: 'hug person'
1287 | expected:'C' | got:'C' | concept: 'hug person'
1288 | expected:'B' | got:'B' | concept: 'hold person'
1289 | expected:'A' | got:'A' | concept: 'hold person'
1290 | expected:'D' | got:'D' | concept: 'hold person'
1291 | expected:'C' | got:'C' | concept: 'hold person'
1292 | expected:'C' | got:'C' | concept: 'kiss person'
1293 | expected:'D' | got:'A' | concept: 'kiss person'
1294 | expected:'B' | got:'B' | concept: 'kiss person'
1295 | expected:'A' | got:'A' | concept: 'kiss person'
1296 | expected:'A' | got:'A' | concept: 'walk dog'
1297 | expected:'A' | got:'A' | concept: 'walk dog'
1298 | expected:'C' | got:'C' | concept: 'walk dog'
1299 | expected:'D' | got:'D' | concept: 'walk dog'
1300 | expected:'C' | got:'C' | concept: 'walk bicycle'
1301 | expected:'D' | got:'A' | concept: 'walk bicycle'
1302 | expected:'C' | got:'C' | concept: 'walk bicycle'
1303 | expected:'B' | got:'B' | concept: 'walk bicycle'
1304 | expected:'B' | got:'B' | concept: 'walk horse'
1305 | expected:'B' | got:'B' | concept: 'walk horse'
1306 | expected:'D' | got:'D' | concept: 'walk horse'
1307 | expected:'D' | got:'A' | concept: 'walk horse'
1308 | expected:'B' | got:'C' | concept: 'walk cow'
1309 | expected:'C' | got:'C' | concept: 'walk cow'
1310 | expected:'D' | got:'A' | concept: 'walk cow'
1311 | expected:'D' | got:'A' | concept: 'walk cow'
1312 | expected:'A' | got:'A' | concept: 'kiss person'
1313 | expected:'D' | got:'D' | concept: 'kiss person'
1314 | expected:'A' | got:'A' | concept: 'kiss person'
1315 | expected:'C' | got:'C' | concept: 'kiss person'
1316 | expected:'B' | got:'B' | concept: 'hug cat'
1317 | expected:'C' | got:'B' | concept: 'hug cat'
1318 | expected:'D' | got:'A' | concept: 'hug cat'
1319 | expected:'B' | got:'B' | concept: 'hug cat'
1320 | expected:'D' | got:'D' | concept: 'hug person'
1321 | expected:'C' | got:'C' | concept: 'hug person'
1322 | expected:'D' | got:'D' | concept: 'hug person'
1323 | expected:'B' | got:'C' | concept: 'hug person'
1324 | expected:'C' | got:'C' | concept: 'hold person'
1325 | expected:'C' | got:'C' | concept: 'hold person'
1326 | expected:'D' | got:'D' | concept: 'hold person'
1327 | expected:'C' | got:'C' | concept: 'hold person'
1328 | expected:'B' | got:'B' | concept: 'open oven'
1329 | expected:'C' | got:'A' | concept: 'open oven'
1330 | expected:'C' | got:'A' | concept: 'open oven'
1331 | expected:'C' | got:'C' | concept: 'open oven'
1332 | expected:'A' | got:'A' | concept: 'inspect oven'
1333 | expected:'D' | got:'A' | concept: 'inspect oven'
1334 | expected:'D' | got:'C' | concept: 'inspect oven'
1335 | expected:'A' | got:'C' | concept: 'inspect oven'
1336 | expected:'B' | got:'B' | concept: 'clean oven'
1337 | expected:'C' | got:'D' | concept: 'clean oven'
1338 | expected:'D' | got:'D' | concept: 'clean oven'
1339 | expected:'B' | got:'B' | concept: 'clean oven'
1340 | expected:'C' | got:'C' | concept: 'clean keyboard'
1341 | expected:'D' | got:'A' | concept: 'clean keyboard'
1342 | expected:'B' | got:'B' | concept: 'clean keyboard'
1343 | expected:'C' | got:'C' | concept: 'clean keyboard'
1344 | expected:'C' | got:'C' | concept: 'jump skateboard'
1345 | expected:'C' | got:'C' | concept: 'jump skateboard'
1346 | expected:'D' | got:'D' | concept: 'jump skateboard'
1347 | expected:'A' | got:'A' | concept: 'jump skateboard'
1348 | expected:'B' | got:'B' | concept: 'jump skis'
1349 | expected:'C' | got:'C' | concept: 'jump skis'
1350 | expected:'C' | got:'D' | concept: 'jump skis'
1351 | expected:'D' | got:'D' | concept: 'jump skis'
1352 | expected:'D' | got:'D' | concept: 'ride skis'
1353 | expected:'C' | got:'C' | concept: 'ride skis'
1354 | expected:'A' | got:'A' | concept: 'ride skis'
1355 | expected:'A' | got:'A' | concept: 'ride skis'
1356 | expected:'A' | got:'A' | concept: 'jump horse'
1357 | expected:'D' | got:'D' | concept: 'jump horse'
1358 | expected:'D' | got:'D' | concept: 'jump horse'
1359 | expected:'C' | got:'C' | concept: 'jump horse'
1360 | expected:'D' | got:'D' | concept: 'sit_on bench'
1361 | expected:'A' | got:'B' | concept: 'sit_on bench'
1362 | expected:'A' | got:'C' | concept: 'sit_on bench'
1363 | expected:'C' | got:'C' | concept: 'sit_on bench'
1364 | expected:'A' | got:'A' | concept: 'sit_on bed'
1365 | expected:'D' | got:'D' | concept: 'sit_on bed'
1366 | expected:'B' | got:'D' | concept: 'sit_on bed'
1367 | expected:'B' | got:'B' | concept: 'sit_on bed'
1368 | expected:'D' | got:'D' | concept: 'sit_on_with_multiple_person bench'
1369 | expected:'A' | got:'A' | concept: 'sit_on_with_multiple_person bench'
1370 | expected:'A' | got:'C' | concept: 'sit_on_with_multiple_person bench'
1371 | expected:'B' | got:'B' | concept: 'sit_on_with_multiple_person bench'
1372 | expected:'A' | got:'A' | concept: 'sit_on skateboard'
1373 | expected:'D' | got:'D' | concept: 'sit_on skateboard'
1374 | expected:'D' | got:'D' | concept: 'sit_on skateboard'
1375 | expected:'B' | got:'C' | concept: 'sit_on skateboard'
1376 | expected:'B' | got:'B' | concept: 'lie_on couch'
1377 | expected:'A' | got:'D' | concept: 'lie_on couch'
1378 | expected:'B' | got:'B' | concept: 'lie_on couch'
1379 | expected:'A' | got:'A' | concept: 'lie_on couch'
1380 | expected:'D' | got:'B' | concept: 'lie_on bench'
1381 | expected:'D' | got:'C' | concept: 'lie_on bench'
1382 | expected:'A' | got:'C' | concept: 'lie_on bench'
1383 | expected:'B' | got:'B' | concept: 'lie_on bench'
1384 | expected:'C' | got:'C' | concept: 'lie_on bed'
1385 | expected:'C' | got:'C' | concept: 'lie_on bed'
1386 | expected:'B' | got:'B' | concept: 'lie_on bed'
1387 | expected:'C' | got:'C' | concept: 'lie_on bed'
1388 | expected:'A' | got:'A' | concept: 'sit_on bench'
1389 | expected:'B' | got:'B' | concept: 'sit_on bench'
1390 | expected:'B' | got:'B' | concept: 'sit_on bench'
1391 | expected:'D' | got:'D' | concept: 'sit_on bench'
1392 | expected:'A' | got:'A' | concept: 'inspect oven'
1393 | expected:'C' | got:'B' | concept: 'inspect oven'
1394 | expected:'D' | got:'C' | concept: 'inspect oven'
1395 | expected:'C' | got:'C' | concept: 'inspect oven'
1396 | expected:'A' | got:'A' | concept: 'clean oven'
1397 | expected:'C' | got:'C' | concept: 'clean oven'
1398 | expected:'A' | got:'A' | concept: 'clean oven'
1399 | expected:'A' | got:'A' | concept: 'clean oven'
1400 | expected:'C' | got:'C' | concept: 'clean microwave'
1401 | expected:'C' | got:'D' | concept: 'clean microwave'
1402 | expected:'C' | got:'C' | concept: 'clean microwave'
1403 | expected:'D' | got:'C' | concept: 'clean microwave'
1404 | expected:'D' | got:'A' | concept: 'operate oven'
1405 | expected:'A' | got:'C' | concept: 'operate oven'
1406 | expected:'A' | got:'A' | concept: 'operate oven'
1407 | expected:'C' | got:'C' | concept: 'operate oven'
1408 | expected:'D' | got:'A' | concept: 'adjust_or_tie tie'
1409 | expected:'A' | got:'A' | concept: 'adjust_or_tie tie'
1410 | expected:'D' | got:'A' | concept: 'adjust_or_tie tie'
1411 | expected:'D' | got:'D' | concept: 'adjust_or_tie tie'
1412 | expected:'C' | got:'C' | concept: 'wear backpack'
1413 | expected:'A' | got:'B' | concept: 'wear backpack'
1414 | expected:'C' | got:'C' | concept: 'wear backpack'
1415 | expected:'A' | got:'A' | concept: 'wear backpack'
1416 | expected:'D' | got:'B' | concept: 'wear tie'
1417 | expected:'C' | got:'A' | concept: 'wear tie'
1418 | expected:'A' | got:'C' | concept: 'wear tie'
1419 | expected:'C' | got:'C' | concept: 'wear tie'
1420 | expected:'B' | got:'B' | concept: 'hold backpack'
1421 | expected:'D' | got:'C' | concept: 'hold backpack'
1422 | expected:'C' | got:'C' | concept: 'hold backpack'
1423 | expected:'A' | got:'A' | concept: 'hold backpack'
1424 | expected:'B' | got:'B' | concept: 'type_on keyboard'
1425 | expected:'D' | got:'A' | concept: 'type_on keyboard'
1426 | expected:'D' | got:'A' | concept: 'type_on keyboard'
1427 | expected:'B' | got:'B' | concept: 'type_on keyboard'
1428 | expected:'C' | got:'C' | concept: 'type_on laptop'
1429 | expected:'B' | got:'B' | concept: 'type_on laptop'
1430 | expected:'B' | got:'C' | concept: 'type_on laptop'
1431 | expected:'B' | got:'B' | concept: 'type_on laptop'
1432 | expected:'A' | got:'A' | concept: 'clean toilet'
1433 | expected:'D' | got:'D' | concept: 'clean toilet'
1434 | expected:'A' | got:'A' | concept: 'clean toilet'
1435 | expected:'C' | got:'C' | concept: 'clean toilet'
1436 | expected:'A' | got:'C' | concept: 'clean keyboard'
1437 | expected:'D' | got:'A' | concept: 'clean keyboard'
1438 | expected:'D' | got:'B' | concept: 'clean keyboard'
1439 | expected:'B' | got:'A' | concept: 'clean keyboard'
1440 | expected:'D' | got:'D' | concept: 'kiss dog'
1441 | expected:'C' | got:'C' | concept: 'kiss dog'
1442 | expected:'C' | got:'C' | concept: 'kiss dog'
1443 | expected:'C' | got:'C' | concept: 'kiss dog'
1444 | expected:'C' | got:'C' | concept: 'train dog'
1445 | expected:'A' | got:'A' | concept: 'train dog'
1446 | expected:'A' | got:'A' | concept: 'train dog'
1447 | expected:'B' | got:'B' | concept: 'train dog'
1448 | expected:'C' | got:'D' | concept: 'hug dog'
1449 | expected:'B' | got:'B' | concept: 'hug dog'
1450 | expected:'B' | got:'C' | concept: 'hug dog'
1451 | expected:'B' | got:'B' | concept: 'hug dog'
1452 | expected:'B' | got:'B' | concept: 'hold dog'
1453 | expected:'C' | got:'A' | concept: 'hold dog'
1454 | expected:'A' | got:'D' | concept: 'hold dog'
1455 | expected:'D' | got:'A' | concept: 'hold dog'
1456 | expected:'D' | got:'C' | concept: 'hold_and_about_to_eat banana'
1457 | expected:'B' | got:'B' | concept: 'hold_and_about_to_eat banana'
1458 | expected:'C' | got:'A' | concept: 'hold_and_about_to_eat banana'
1459 | expected:'B' | got:'B' | concept: 'hold_and_about_to_eat banana'
1460 | expected:'C' | got:'A' | concept: 'peel banana'
1461 | expected:'C' | got:'C' | concept: 'peel banana'
1462 | expected:'A' | got:'D' | concept: 'peel banana'
1463 | expected:'A' | got:'C' | concept: 'peel banana'
1464 | expected:'C' | got:'A' | concept: 'hold banana'
1465 | expected:'B' | got:'A' | concept: 'hold banana'
1466 | expected:'C' | got:'D' | concept: 'hold banana'
1467 | expected:'D' | got:'B' | concept: 'hold banana'
1468 | expected:'D' | got:'B' | concept: 'eat banana'
1469 | expected:'A' | got:'C' | concept: 'eat banana'
1470 | expected:'A' | got:'D' | concept: 'eat banana'
1471 | expected:'D' | got:'B' | concept: 'eat banana'
1472 | expected:'C' | got:'C' | concept: 'hold person'
1473 | expected:'C' | got:'C' | concept: 'hold person'
1474 | expected:'B' | got:'C' | concept: 'hold person'
1475 | expected:'B' | got:'B' | concept: 'hold person'
1476 | expected:'D' | got:'D' | concept: 'hug person'
1477 | expected:'C' | got:'C' | concept: 'hug person'
1478 | expected:'A' | got:'C' | concept: 'hug person'
1479 | expected:'A' | got:'D' | concept: 'hug person'
1480 | expected:'A' | got:'C' | concept: 'greet person'
1481 | expected:'B' | got:'D' | concept: 'greet person'
1482 | expected:'A' | got:'A' | concept: 'greet person'
1483 | expected:'B' | got:'D' | concept: 'greet person'
1484 | expected:'D' | got:'D' | concept: 'kiss person'
1485 | expected:'A' | got:'A' | concept: 'kiss person'
1486 | expected:'D' | got:'D' | concept: 'kiss person'
1487 | expected:'B' | got:'B' | concept: 'kiss person'
1488 | expected:'A' | got:'A' | concept: 'carry surfboard'
1489 | expected:'B' | got:'B' | concept: 'carry surfboard'
1490 | expected:'D' | got:'D' | concept: 'carry surfboard'
1491 | expected:'B' | got:'B' | concept: 'carry surfboard'
1492 | expected:'D' | got:'B' | concept: 'drag suitcase'
1493 | expected:'D' | got:'A' | concept: 'drag suitcase'
1494 | expected:'A' | got:'C' | concept: 'drag suitcase'
1495 | expected:'B' | got:'D' | concept: 'drag suitcase'
1496 | expected:'A' | got:'A' | concept: 'carry suitcase'
1497 | expected:'D' | got:'D' | concept: 'carry suitcase'
1498 | expected:'D' | got:'D' | concept: 'carry suitcase'
1499 | expected:'A' | got:'A' | concept: 'carry suitcase'
1500 | expected:'D' | got:'A' | concept: 'carry handbag'
1501 | expected:'C' | got:'C' | concept: 'carry handbag'
1502 | expected:'A' | got:'A' | concept: 'carry handbag'
1503 | expected:'D' | got:'A' | concept: 'carry handbag'
1504 | expected:'B' | got:'B' | concept: 'hold toothbrush'
1505 | expected:'D' | got:'B' | concept: 'hold toothbrush'
1506 | expected:'D' | got:'D' | concept: 'hold toothbrush'
1507 | expected:'A' | got:'A' | concept: 'hold toothbrush'
1508 | expected:'D' | got:'D' | concept: 'hold fork'
1509 | expected:'D' | got:'D' | concept: 'hold fork'
1510 | expected:'B' | got:'B' | concept: 'hold fork'
1511 | expected:'A' | got:'A' | concept: 'hold fork'
1512 | expected:'C' | got:'C' | concept: 'hold handbag'
1513 | expected:'B' | got:'B' | concept: 'hold handbag'
1514 | expected:'A' | got:'A' | concept: 'hold handbag'
1515 | expected:'D' | got:'A' | concept: 'hold handbag'
1516 | expected:'D' | got:'D' | concept: 'hold bird'
1517 | expected:'C' | got:'B' | concept: 'hold bird'
1518 | expected:'C' | got:'C' | concept: 'hold bird'
1519 | expected:'A' | got:'A' | concept: 'hold bird'
1520 | expected:'A' | got:'A' | concept: 'eat donut'
1521 | expected:'D' | got:'D' | concept: 'eat donut'
1522 | expected:'B' | got:'B' | concept: 'eat donut'
1523 | expected:'B' | got:'B' | concept: 'eat donut'
1524 | expected:'D' | got:'D' | concept: 'eat apple'
1525 | expected:'D' | got:'D' | concept: 'eat apple'
1526 | expected:'A' | got:'A' | concept: 'eat apple'
1527 | expected:'D' | got:'D' | concept: 'eat apple'
1528 | expected:'A' | got:'A' | concept: 'eat pizza'
1529 | expected:'D' | got:'INVALID' | concept: 'eat pizza'
1530 | expected:'A' | got:'A' | concept: 'eat pizza'
1531 | expected:'B' | got:'B' | concept: 'eat pizza'
1532 | expected:'B' | got:'B' | concept: 'eat hot_dog'
1533 | expected:'D' | got:'D' | concept: 'eat hot_dog'
1534 | expected:'C' | got:'C' | concept: 'eat hot_dog'
1535 | expected:'A' | got:'A' | concept: 'eat hot_dog'
1536 | expected:'C' | got:'C' | concept: 'hug person'
1537 | expected:'B' | got:'B' | concept: 'hug person'
1538 | expected:'D' | got:'D' | concept: 'hug person'
1539 | expected:'B' | got:'B' | concept: 'hug person'
1540 | expected:'B' | got:'B' | concept: 'kiss person'
1541 | expected:'D' | got:'D' | concept: 'kiss person'
1542 | expected:'C' | got:'C' | concept: 'kiss person'
1543 | expected:'B' | got:'B' | concept: 'kiss person'
1544 | expected:'C' | got:'C' | concept: 'hug horse'
1545 | expected:'D' | got:'C' | concept: 'hug horse'
1546 | expected:'C' | got:'D' | concept: 'hug horse'
1547 | expected:'A' | got:'A' | concept: 'hug horse'
1548 | expected:'A' | got:'A' | concept: 'greet person'
1549 | expected:'B' | got:'B' | concept: 'greet person'
1550 | expected:'D' | got:'D' | concept: 'greet person'
1551 | expected:'A' | got:'A' | concept: 'greet person'
1552 | expected:'D' | got:'D' | concept: 'hold scissors'
1553 | expected:'A' | got:'A' | concept: 'hold scissors'
1554 | expected:'A' | got:'A' | concept: 'hold scissors'
1555 | expected:'B' | got:'B' | concept: 'hold scissors'
1556 | expected:'D' | got:'D' | concept: 'hold horse'
1557 | expected:'D' | got:'D' | concept: 'hold horse'
1558 | expected:'B' | got:'B' | concept: 'hold horse'
1559 | expected:'B' | got:'B' | concept: 'hold horse'
1560 | expected:'A' | got:'A' | concept: 'hold bottle'
1561 | expected:'C' | got:'C' | concept: 'hold bottle'
1562 | expected:'B' | got:'B' | concept: 'hold bottle'
1563 | expected:'D' | got:'B' | concept: 'hold bottle'
1564 | expected:'C' | got:'C' | concept: 'hold spoon'
1565 | expected:'D' | got:'C' | concept: 'hold spoon'
1566 | expected:'C' | got:'C' | concept: 'hold spoon'
1567 | expected:'B' | got:'D' | concept: 'hold spoon'
1568 | expected:'D' | got:'B' | concept: 'feed bird'
1569 | expected:'D' | got:'B' | concept: 'feed bird'
1570 | expected:'B' | got:'B' | concept: 'feed bird'
1571 | expected:'A' | got:'A' | concept: 'feed bird'
1572 | expected:'D' | got:'C' | concept: 'feed sheep'
1573 | expected:'D' | got:'C' | concept: 'feed sheep'
1574 | expected:'D' | got:'B' | concept: 'feed sheep'
1575 | expected:'A' | got:'A' | concept: 'feed sheep'
1576 | expected:'A' | got:'A' | concept: 'shear sheep'
1577 | expected:'C' | got:'C' | concept: 'shear sheep'
1578 | expected:'C' | got:'C' | concept: 'shear sheep'
1579 | expected:'A' | got:'A' | concept: 'shear sheep'
1580 | expected:'A' | got:'A' | concept: 'pet sheep'
1581 | expected:'D' | got:'D' | concept: 'pet sheep'
1582 | expected:'C' | got:'C' | concept: 'pet sheep'
1583 | expected:'C' | got:'C' | concept: 'pet sheep'
1584 | expected:'D' | got:'D' | concept: 'hold horse'
1585 | expected:'B' | got:'B' | concept: 'hold horse'
1586 | expected:'C' | got:'C' | concept: 'hold horse'
1587 | expected:'A' | got:'A' | concept: 'hold horse'
1588 | expected:'A' | got:'A' | concept: 'hold scissors'
1589 | expected:'C' | got:'C' | concept: 'hold scissors'
1590 | expected:'D' | got:'D' | concept: 'hold scissors'
1591 | expected:'A' | got:'A' | concept: 'hold scissors'
1592 | expected:'B' | got:'B' | concept: 'hold sandwich'
1593 | expected:'D' | got:'D' | concept: 'hold sandwich'
1594 | expected:'C' | got:'C' | concept: 'hold sandwich'
1595 | expected:'A' | got:'A' | concept: 'hold sandwich'
1596 | expected:'B' | got:'A' | concept: 'hold wine_glass'
1597 | expected:'D' | got:'A' | concept: 'hold wine_glass'
1598 | expected:'C' | got:'C' | concept: 'hold wine_glass'
1599 | expected:'C' | got:'C' | concept: 'hold wine_glass'
1600 | expected:'A' | got:'A' | concept: 'hold cup'
1601 | expected:'A' | got:'A' | concept: 'hold cup'
1602 | expected:'A' | got:'C' | concept: 'hold cup'
1603 | expected:'D' | got:'C' | concept: 'hold cup'
1604 | expected:'D' | got:'C' | concept: 'hold orange'
1605 | expected:'A' | got:'D' | concept: 'hold orange'
1606 | expected:'D' | got:'D' | concept: 'hold orange'
1607 | expected:'A' | got:'A' | concept: 'hold orange'
1608 | expected:'C' | got:'C' | concept: 'hold wine_glass'
1609 | expected:'B' | got:'B' | concept: 'hold wine_glass'
1610 | expected:'C' | got:'C' | concept: 'hold wine_glass'
1611 | expected:'D' | got:'D' | concept: 'hold wine_glass'
1612 | expected:'D' | got:'D' | concept: 'hold bottle'
1613 | expected:'D' | got:'D' | concept: 'hold bottle'
1614 | expected:'B' | got:'B' | concept: 'hold bottle'
1615 | expected:'B' | got:'C' | concept: 'hold bottle'
1616 | expected:'A' | got:'C' | concept: 'hug person'
1617 | expected:'A' | got:'C' | concept: 'hug person'
1618 | expected:'C' | got:'D' | concept: 'hug person'
1619 | expected:'D' | got:'D' | concept: 'hug person'
1620 | expected:'B' | got:'B' | concept: 'kiss horse'
1621 | expected:'A' | got:'A' | concept: 'kiss horse'
1622 | expected:'C' | got:'C' | concept: 'kiss horse'
1623 | expected:'A' | got:'A' | concept: 'kiss horse'
1624 | expected:'D' | got:'C' | concept: 'kiss dog'
1625 | expected:'B' | got:'B' | concept: 'kiss dog'
1626 | expected:'B' | got:'B' | concept: 'kiss dog'
1627 | expected:'B' | got:'B' | concept: 'kiss dog'
1628 | expected:'D' | got:'D' | concept: 'kiss person'
1629 | expected:'B' | got:'B' | concept: 'kiss person'
1630 | expected:'A' | got:'A' | concept: 'kiss person'
1631 | expected:'C' | got:'C' | concept: 'kiss person'
1632 | expected:'D' | got:'D' | concept: 'kick sports_ball'
1633 | expected:'A' | got:'A' | concept: 'kick sports_ball'
1634 | expected:'C' | got:'C' | concept: 'kick sports_ball'
1635 | expected:'A' | got:'A' | concept: 'kick sports_ball'
1636 | expected:'D' | got:'A' | concept: 'spin sports_ball'
1637 | expected:'C' | got:'A' | concept: 'spin sports_ball'
1638 | expected:'D' | got:'A' | concept: 'spin sports_ball'
1639 | expected:'B' | got:'B' | concept: 'spin sports_ball'
1640 | expected:'B' | got:'B' | concept: 'block sports_ball'
1641 | expected:'C' | got:'D' | concept: 'block sports_ball'
1642 | expected:'D' | got:'D' | concept: 'block sports_ball'
1643 | expected:'C' | got:'C' | concept: 'block sports_ball'
1644 | expected:'C' | got:'C' | concept: 'serve sports_ball'
1645 | expected:'B' | got:'B' | concept: 'serve sports_ball'
1646 | expected:'D' | got:'D' | concept: 'serve sports_ball'
1647 | expected:'B' | got:'B' | concept: 'serve sports_ball'
1648 | expected:'C' | got:'C' | concept: 'hold bottle'
1649 | expected:'A' | got:'B' | concept: 'hold bottle'
1650 | expected:'C' | got:'A' | concept: 'hold bottle'
1651 | expected:'A' | got:'C' | concept: 'hold bottle'
1652 | expected:'C' | got:'C' | concept: 'drink_with bottle'
1653 | expected:'D' | got:'B' | concept: 'drink_with bottle'
1654 | expected:'D' | got:'D' | concept: 'drink_with bottle'
1655 | expected:'B' | got:'B' | concept: 'drink_with bottle'
1656 | expected:'C' | got:'C' | concept: 'drink_with cup'
1657 | expected:'D' | got:'A' | concept: 'drink_with cup'
1658 | expected:'A' | got:'A' | concept: 'drink_with cup'
1659 | expected:'B' | got:'D' | concept: 'drink_with cup'
1660 | expected:'D' | got:'D' | concept: 'hold remote'
1661 | expected:'A' | got:'A' | concept: 'hold remote'
1662 | expected:'A' | got:'A' | concept: 'hold remote'
1663 | expected:'A' | got:'A' | concept: 'hold remote'
1664 | expected:'A' | got:'A' | concept: 'point_at_camera remote'
1665 | expected:'C' | got:'C' | concept: 'point_at_camera remote'
1666 | expected:'D' | got:'D' | concept: 'point_at_camera remote'
1667 | expected:'D' | got:'D' | concept: 'point_at_camera remote'
1668 | expected:'A' | got:'A' | concept: 'direct airplane'
1669 | expected:'C' | got:'C' | concept: 'direct airplane'
1670 | expected:'A' | got:'A' | concept: 'direct airplane'
1671 | expected:'B' | got:'B' | concept: 'direct airplane'
1672 | expected:'B' | got:'B' | concept: 'wash motorcycle'
1673 | expected:'C' | got:'C' | concept: 'wash motorcycle'
1674 | expected:'D' | got:'A' | concept: 'wash motorcycle'
1675 | expected:'D' | got:'D' | concept: 'wash motorcycle'
1676 | expected:'C' | got:'C' | concept: 'jump motorcycle'
1677 | expected:'B' | got:'B' | concept: 'jump motorcycle'
1678 | expected:'C' | got:'C' | concept: 'jump motorcycle'
1679 | expected:'B' | got:'B' | concept: 'jump motorcycle'
1680 | expected:'D' | got:'D' | concept: 'walk horse'
1681 | expected:'B' | got:'A' | concept: 'walk horse'
1682 | expected:'C' | got:'C' | concept: 'walk horse'
1683 | expected:'B' | got:'B' | concept: 'walk horse'
1684 | expected:'B' | got:'B' | concept: 'walk cow'
1685 | expected:'B' | got:'B' | concept: 'walk cow'
1686 | expected:'A' | got:'A' | concept: 'walk cow'
1687 | expected:'A' | got:'A' | concept: 'walk cow'
1688 | expected:'B' | got:'B' | concept: 'pet horse'
1689 | expected:'C' | got:'C' | concept: 'pet horse'
1690 | expected:'C' | got:'C' | concept: 'pet horse'
1691 | expected:'C' | got:'C' | concept: 'pet horse'
1692 | expected:'C' | got:'C' | concept: 'kiss horse'
1693 | expected:'D' | got:'D' | concept: 'kiss horse'
1694 | expected:'A' | got:'C' | concept: 'kiss horse'
1695 | expected:'B' | got:'D' | concept: 'kiss horse'
1696 | expected:'B' | got:'B' | concept: 'sit_on skateboard'
1697 | expected:'C' | got:'C' | concept: 'sit_on skateboard'
1698 | expected:'A' | got:'A' | concept: 'sit_on skateboard'
1699 | expected:'C' | got:'C' | concept: 'sit_on skateboard'
1700 | expected:'B' | got:'B' | concept: 'sit_on truck'
1701 | expected:'D' | got:'D' | concept: 'sit_on truck'
1702 | expected:'A' | got:'A' | concept: 'sit_on truck'
1703 | expected:'A' | got:'A' | concept: 'sit_on truck'
1704 | expected:'C' | got:'C' | concept: 'sit_on bed'
1705 | expected:'D' | got:'D' | concept: 'sit_on bed'
1706 | expected:'A' | got:'C' | concept: 'sit_on bed'
1707 | expected:'D' | got:'B' | concept: 'sit_on bed'
1708 | expected:'B' | got:'B' | concept: 'lie_on bed'
1709 | expected:'B' | got:'B' | concept: 'lie_on bed'
1710 | expected:'C' | got:'C' | concept: 'lie_on bed'
1711 | expected:'D' | got:'B' | concept: 'lie_on bed'
1712 | expected:'A' | got:'A' | concept: 'hold pizza'
1713 | expected:'A' | got:'A' | concept: 'hold pizza'
1714 | expected:'C' | got:'C' | concept: 'hold pizza'
1715 | expected:'D' | got:'D' | concept: 'hold pizza'
1716 | expected:'B' | got:'B' | concept: 'hold orange'
1717 | expected:'A' | got:'A' | concept: 'hold orange'
1718 | expected:'C' | got:'C' | concept: 'hold orange'
1719 | expected:'B' | got:'B' | concept: 'hold orange'
1720 | expected:'A' | got:'A' | concept: 'hold tennis_racket'
1721 | expected:'A' | got:'A' | concept: 'hold tennis_racket'
1722 | expected:'A' | got:'A' | concept: 'hold tennis_racket'
1723 | expected:'B' | got:'B' | concept: 'hold tennis_racket'
1724 | expected:'D' | got:'D' | concept: 'hold umbrella'
1725 | expected:'C' | got:'C' | concept: 'hold umbrella'
1726 | expected:'B' | got:'B' | concept: 'hold umbrella'
1727 | expected:'A' | got:'A' | concept: 'hold umbrella'
1728 | expected:'A' | got:'C' | concept: 'read laptop'
1729 | expected:'C' | got:'C' | concept: 'read laptop'
1730 | expected:'D' | got:'A' | concept: 'read laptop'
1731 | expected:'B' | got:'B' | concept: 'read laptop'
1732 | expected:'B' | got:'B' | concept: 'hold book'
1733 | expected:'B' | got:'B' | concept: 'hold book'
1734 | expected:'B' | got:'B' | concept: 'hold book'
1735 | expected:'A' | got:'A' | concept: 'hold book'
1736 | expected:'C' | got:'C' | concept: 'read book'
1737 | expected:'D' | got:'C' | concept: 'read book'
1738 | expected:'B' | got:'A' | concept: 'read book'
1739 | expected:'A' | got:'C' | concept: 'read book'
1740 | expected:'A' | got:'A' | concept: 'hold banana'
1741 | expected:'C' | got:'C' | concept: 'hold banana'
1742 | expected:'B' | got:'B' | concept: 'hold banana'
1743 | expected:'C' | got:'C' | concept: 'hold banana'
1744 | expected:'A' | got:'C' | concept: 'smell apple'
1745 | expected:'B' | got:'B' | concept: 'smell apple'
1746 | expected:'B' | got:'D' | concept: 'smell apple'
1747 | expected:'D' | got:'A' | concept: 'smell apple'
1748 | expected:'A' | got:'A' | concept: 'wash apple'
1749 | expected:'B' | got:'B' | concept: 'wash apple'
1750 | expected:'C' | got:'C' | concept: 'wash apple'
1751 | expected:'C' | got:'A' | concept: 'wash apple'
1752 | expected:'A' | got:'A' | concept: 'pick apple'
1753 | expected:'C' | got:'C' | concept: 'pick apple'
1754 | expected:'B' | got:'D' | concept: 'pick apple'
1755 | expected:'C' | got:'C' | concept: 'pick apple'
1756 | expected:'C' | got:'C' | concept: 'hold_and_about_to_eat apple'
1757 | expected:'B' | got:'B' | concept: 'hold_and_about_to_eat apple'
1758 | expected:'A' | got:'A' | concept: 'hold_and_about_to_eat apple'
1759 | expected:'A' | got:'A' | concept: 'hold_and_about_to_eat apple'
1760 | expected:'C' | got:'C' | concept: 'feed horse'
1761 | expected:'D' | got:'D' | concept: 'feed horse'
1762 | expected:'D' | got:'D' | concept: 'feed horse'
1763 | expected:'D' | got:'D' | concept: 'feed horse'
1764 | expected:'A' | got:'A' | concept: 'feed giraffe'
1765 | expected:'D' | got:'C' | concept: 'feed giraffe'
1766 | expected:'D' | got:'D' | concept: 'feed giraffe'
1767 | expected:'D' | got:'A' | concept: 'feed giraffe'
1768 | expected:'B' | got:'B' | concept: 'feed sheep'
1769 | expected:'A' | got:'A' | concept: 'feed sheep'
1770 | expected:'B' | got:'A' | concept: 'feed sheep'
1771 | expected:'C' | got:'C' | concept: 'feed sheep'
1772 | expected:'B' | got:'B' | concept: 'feed elephant'
1773 | expected:'A' | got:'A' | concept: 'feed elephant'
1774 | expected:'A' | got:'A' | concept: 'feed elephant'
1775 | expected:'A' | got:'A' | concept: 'feed elephant'
1776 | expected:'C' | got:'D' | concept: 'inspect oven'
1777 | expected:'C' | got:'B' | concept: 'inspect oven'
1778 | expected:'D' | got:'C' | concept: 'inspect oven'
1779 | expected:'D' | got:'C' | concept: 'inspect oven'
1780 | expected:'B' | got:'B' | concept: 'clean oven'
1781 | expected:'A' | got:'A' | concept: 'clean oven'
1782 | expected:'A' | got:'A' | concept: 'clean oven'
1783 | expected:'D' | got:'D' | concept: 'clean oven'
1784 | expected:'A' | got:'A' | concept: 'open microwave'
1785 | expected:'D' | got:'A' | concept: 'open microwave'
1786 | expected:'B' | got:'B' | concept: 'open microwave'
1787 | expected:'C' | got:'C' | concept: 'open microwave'
1788 | expected:'B' | got:'C' | concept: 'open oven'
1789 | expected:'B' | got:'B' | concept: 'open oven'
1790 | expected:'A' | got:'A' | concept: 'open oven'
1791 | expected:'B' | got:'B' | concept: 'open oven'
1792 | expected:'C' | got:'C' | concept: 'hug dog'
1793 | expected:'B' | got:'B' | concept: 'hug dog'
1794 | expected:'C' | got:'C' | concept: 'hug dog'
1795 | expected:'D' | got:'D' | concept: 'hug dog'
1796 | expected:'A' | got:'A' | concept: 'wash dog'
1797 | expected:'D' | got:'D' | concept: 'wash dog'
1798 | expected:'A' | got:'A' | concept: 'wash dog'
1799 | expected:'D' | got:'D' | concept: 'wash dog'
1800 | expected:'C' | got:'C' | concept: 'walk dog'
1801 | expected:'A' | got:'A' | concept: 'walk dog'
1802 | expected:'D' | got:'D' | concept: 'walk dog'
1803 | expected:'A' | got:'A' | concept: 'walk dog'
1804 | expected:'C' | got:'C' | concept: 'kiss dog'
1805 | expected:'D' | got:'D' | concept: 'kiss dog'
1806 | expected:'A' | got:'A' | concept: 'kiss dog'
1807 | expected:'C' | got:'C' | concept: 'kiss dog'
1808 | expected:'D' | got:'A' | concept: 'hold wine_glass'
1809 | expected:'B' | got:'B' | concept: 'hold wine_glass'
1810 | expected:'A' | got:'A' | concept: 'hold wine_glass'
1811 | expected:'D' | got:'D' | concept: 'hold wine_glass'
1812 | expected:'C' | got:'C' | concept: 'hold handbag'
1813 | expected:'B' | got:'A' | concept: 'hold handbag'
1814 | expected:'A' | got:'A' | concept: 'hold handbag'
1815 | expected:'D' | got:'A' | concept: 'hold handbag'
1816 | expected:'B' | got:'B' | concept: 'hold toothbrush'
1817 | expected:'A' | got:'A' | concept: 'hold toothbrush'
1818 | expected:'B' | got:'B' | concept: 'hold toothbrush'
1819 | expected:'C' | got:'C' | concept: 'hold toothbrush'
1820 | expected:'C' | got:'A' | concept: 'hold knife'
1821 | expected:'B' | got:'B' | concept: 'hold knife'
1822 | expected:'B' | got:'B' | concept: 'hold knife'
1823 | expected:'C' | got:'C' | concept: 'hold knife'
1824 | expected:'B' | got:'B' | concept: 'catch frisbee'
1825 | expected:'D' | got:'A' | concept: 'catch frisbee'
1826 | expected:'B' | got:'B' | concept: 'catch frisbee'
1827 | expected:'A' | got:'A' | concept: 'catch frisbee'
1828 | expected:'C' | got:'C' | concept: 'drag suitcase'
1829 | expected:'C' | got:'C' | concept: 'drag suitcase'
1830 | expected:'B' | got:'B' | concept: 'drag suitcase'
1831 | expected:'D' | got:'D' | concept: 'drag suitcase'
1832 | expected:'B' | got:'D' | concept: 'throw frisbee'
1833 | expected:'A' | got:'C' | concept: 'throw frisbee'
1834 | expected:'B' | got:'B' | concept: 'throw frisbee'
1835 | expected:'B' | got:'C' | concept: 'throw frisbee'
1836 | expected:'C' | got:'C' | concept: 'hold knife'
1837 | expected:'A' | got:'A' | concept: 'hold knife'
1838 | expected:'D' | got:'D' | concept: 'hold knife'
1839 | expected:'B' | got:'B' | concept: 'hold knife'
1840 | expected:'C' | got:'C' | concept: 'read_like cell_phone'
1841 | expected:'C' | got:'D' | concept: 'read_like cell_phone'
1842 | expected:'B' | got:'A' | concept: 'read_like cell_phone'
1843 | expected:'B' | got:'C' | concept: 'read_like cell_phone'
1844 | expected:'C' | got:'C' | concept: 'hold skateboard'
1845 | expected:'B' | got:'B' | concept: 'hold skateboard'
1846 | expected:'A' | got:'A' | concept: 'hold skateboard'
1847 | expected:'B' | got:'B' | concept: 'hold skateboard'
1848 | expected:'D' | got:'D' | concept: 'hold cell_phone'
1849 | expected:'D' | got:'C' | concept: 'hold cell_phone'
1850 | expected:'D' | got:'C' | concept: 'hold cell_phone'
1851 | expected:'A' | got:'D' | concept: 'hold cell_phone'
1852 | expected:'B' | got:'B' | concept: 'talk_on_or_listen_to cell_phone'
1853 | expected:'A' | got:'A' | concept: 'talk_on_or_listen_to cell_phone'
1854 | expected:'A' | got:'A' | concept: 'talk_on_or_listen_to cell_phone'
1855 | expected:'B' | got:'B' | concept: 'talk_on_or_listen_to cell_phone'
1856 | expected:'C' | got:'C' | concept: 'hold remote'
1857 | expected:'D' | got:'D' | concept: 'hold remote'
1858 | expected:'A' | got:'A' | concept: 'hold remote'
1859 | expected:'D' | got:'D' | concept: 'hold remote'
1860 | expected:'B' | got:'B' | concept: 'hold scissors'
1861 | expected:'B' | got:'B' | concept: 'hold scissors'
1862 | expected:'B' | got:'C' | concept: 'hold scissors'
1863 | expected:'D' | got:'D' | concept: 'hold scissors'
1864 | expected:'C' | got:'C' | concept: 'hold dog'
1865 | expected:'A' | got:'A' | concept: 'hold dog'
1866 | expected:'A' | got:'A' | concept: 'hold dog'
1867 | expected:'B' | got:'B' | concept: 'hold dog'
1868 | expected:'D' | got:'D' | concept: 'hold tennis_racket'
1869 | expected:'D' | got:'D' | concept: 'hold tennis_racket'
1870 | expected:'C' | got:'C' | concept: 'hold tennis_racket'
1871 | expected:'C' | got:'C' | concept: 'hold tennis_racket'
1872 | expected:'C' | got:'C' | concept: 'pet cat'
1873 | expected:'D' | got:'A' | concept: 'pet cat'
1874 | expected:'B' | got:'B' | concept: 'pet cat'
1875 | expected:'C' | got:'C' | concept: 'pet cat'
1876 | expected:'C' | got:'A' | concept: 'hold sheep'
1877 | expected:'B' | got:'B' | concept: 'hold sheep'
1878 | expected:'D' | got:'D' | concept: 'hold sheep'
1879 | expected:'A' | got:'C' | concept: 'hold sheep'
1880 | expected:'C' | got:'D' | concept: 'pet sheep'
1881 | expected:'C' | got:'C' | concept: 'pet sheep'
1882 | expected:'C' | got:'C' | concept: 'pet sheep'
1883 | expected:'B' | got:'B' | concept: 'pet sheep'
1884 | expected:'B' | got:'B' | concept: 'shear sheep'
1885 | expected:'A' | got:'D' | concept: 'shear sheep'
1886 | expected:'B' | got:'B' | concept: 'shear sheep'
1887 | expected:'B' | got:'B' | concept: 'shear sheep'
1888 | expected:'D' | got:'D' | concept: 'sit_on chair'
1889 | expected:'B' | got:'B' | concept: 'sit_on chair'
1890 | expected:'D' | got:'D' | concept: 'sit_on chair'
1891 | expected:'B' | got:'B' | concept: 'sit_on chair'
1892 | expected:'A' | got:'A' | concept: 'stand_on chair'
1893 | expected:'D' | got:'D' | concept: 'stand_on chair'
1894 | expected:'B' | got:'B' | concept: 'stand_on chair'
1895 | expected:'B' | got:'C' | concept: 'stand_on chair'
1896 | expected:'A' | got:'A' | concept: 'stand_on boat'
1897 | expected:'D' | got:'D' | concept: 'stand_on boat'
1898 | expected:'A' | got:'A' | concept: 'stand_on boat'
1899 | expected:'A' | got:'A' | concept: 'stand_on boat'
1900 | expected:'A' | got:'B' | concept: 'lie_on_like chair'
1901 | expected:'D' | got:'A' | concept: 'lie_on_like chair'
1902 | expected:'B' | got:'C' | concept: 'lie_on_like chair'
1903 | expected:'D' | got:'D' | concept: 'lie_on_like chair'
1904 | expected:'B' | got:'B' | concept: 'hold knife'
1905 | expected:'A' | got:'C' | concept: 'hold knife'
1906 | expected:'D' | got:'A' | concept: 'hold knife'
1907 | expected:'B' | got:'C' | concept: 'hold knife'
1908 | expected:'B' | got:'C' | concept: 'wield knife'
1909 | expected:'D' | got:'A' | concept: 'wield knife'
1910 | expected:'C' | got:'D' | concept: 'wield knife'
1911 | expected:'C' | got:'D' | concept: 'wield knife'
1912 | expected:'A' | got:'A' | concept: 'cut_with knife'
1913 | expected:'D' | got:'D' | concept: 'cut_with knife'
1914 | expected:'D' | got:'A' | concept: 'cut_with knife'
1915 | expected:'A' | got:'A' | concept: 'cut_with knife'
1916 | expected:'A' | got:'A' | concept: 'lick knife'
1917 | expected:'A' | got:'A' | concept: 'lick knife'
1918 | expected:'D' | got:'INVALID' | concept: 'lick knife'
1919 | expected:'D' | got:'C' | concept: 'lick knife'
1920 | expected:'A' | got:'A' | concept: 'direct airplane'
1921 | expected:'A' | got:'C' | concept: 'direct airplane'
1922 | expected:'C' | got:'C' | concept: 'direct airplane'
1923 | expected:'D' | got:'D' | concept: 'direct airplane'
1924 | expected:'B' | got:'B' | concept: 'sit_inside bus'
1925 | expected:'B' | got:'B' | concept: 'sit_inside bus'
1926 | expected:'D' | got:'D' | concept: 'sit_inside bus'
1927 | expected:'A' | got:'A' | concept: 'sit_inside bus'
1928 | expected:'D' | got:'D' | concept: 'lie_on surfboard'
1929 | expected:'D' | got:'D' | concept: 'lie_on surfboard'
1930 | expected:'A' | got:'A' | concept: 'lie_on surfboard'
1931 | expected:'B' | got:'B' | concept: 'lie_on surfboard'
1932 | expected:'B' | got:'B' | concept: 'point_at_camera remote'
1933 | expected:'A' | got:'A' | concept: 'point_at_camera remote'
1934 | expected:'C' | got:'C' | concept: 'point_at_camera remote'
1935 | expected:'B' | got:'B' | concept: 'point_at_camera remote'
1936 | expected:'B' | got:'B' | concept: 'walk dog'
1937 | expected:'B' | got:'B' | concept: 'walk dog'
1938 | expected:'A' | got:'A' | concept: 'walk dog'
1939 | expected:'C' | got:'C' | concept: 'walk dog'
1940 | expected:'B' | got:'C' | concept: 'kiss horse'
1941 | expected:'C' | got:'C' | concept: 'kiss horse'
1942 | expected:'C' | got:'C' | concept: 'kiss horse'
1943 | expected:'D' | got:'D' | concept: 'kiss horse'
1944 | expected:'D' | got:'D' | concept: 'kiss dog'
1945 | expected:'A' | got:'A' | concept: 'kiss dog'
1946 | expected:'D' | got:'D' | concept: 'kiss dog'
1947 | expected:'A' | got:'A' | concept: 'kiss dog'
1948 | expected:'B' | got:'D' | concept: 'wash dog'
1949 | expected:'B' | got:'B' | concept: 'wash dog'
1950 | expected:'C' | got:'C' | concept: 'wash dog'
1951 | expected:'C' | got:'C' | concept: 'wash dog'
1952 | expected:'B' | got:'B' | concept: 'sit_on couch'
1953 | expected:'C' | got:'C' | concept: 'sit_on couch'
1954 | expected:'D' | got:'D' | concept: 'sit_on couch'
1955 | expected:'A' | got:'A' | concept: 'sit_on couch'
1956 | expected:'D' | got:'D' | concept: 'sit_on bench'
1957 | expected:'A' | got:'A' | concept: 'sit_on bench'
1958 | expected:'A' | got:'A' | concept: 'sit_on bench'
1959 | expected:'D' | got:'D' | concept: 'sit_on bench'
1960 | expected:'D' | got:'D' | concept: 'sit_on truck'
1961 | expected:'B' | got:'B' | concept: 'sit_on truck'
1962 | expected:'D' | got:'D' | concept: 'sit_on truck'
1963 | expected:'B' | got:'B' | concept: 'sit_on truck'
1964 | expected:'A' | got:'A' | concept: 'sit_on skateboard'
1965 | expected:'D' | got:'D' | concept: 'sit_on skateboard'
1966 | expected:'B' | got:'B' | concept: 'sit_on skateboard'
1967 | expected:'D' | got:'D' | concept: 'sit_on skateboard'
1968 | expected:'D' | got:'D' | concept: 'sit_on bed'
1969 | expected:'D' | got:'D' | concept: 'sit_on bed'
1970 | expected:'D' | got:'D' | concept: 'sit_on bed'
1971 | expected:'B' | got:'B' | concept: 'sit_on bed'
1972 | expected:'C' | got:'C' | concept: 'lie_on bench'
1973 | expected:'B' | got:'B' | concept: 'lie_on bench'
1974 | expected:'B' | got:'B' | concept: 'lie_on bench'
1975 | expected:'C' | got:'C' | concept: 'lie_on bench'
1976 | expected:'C' | got:'C' | concept: 'sit_on bench'
1977 | expected:'A' | got:'A' | concept: 'sit_on bench'
1978 | expected:'C' | got:'C' | concept: 'sit_on bench'
1979 | expected:'C' | got:'C' | concept: 'sit_on bench'
1980 | expected:'D' | got:'D' | concept: 'sit_on chair'
1981 | expected:'D' | got:'D' | concept: 'sit_on chair'
1982 | expected:'B' | got:'B' | concept: 'sit_on chair'
1983 | expected:'D' | got:'C' | concept: 'sit_on chair'
1984 | expected:'C' | got:'C' | concept: 'hold sports_ball'
1985 | expected:'C' | got:'C' | concept: 'hold sports_ball'
1986 | expected:'A' | got:'A' | concept: 'hold sports_ball'
1987 | expected:'D' | got:'C' | concept: 'hold sports_ball'
1988 | expected:'D' | got:'D' | concept: 'hold horse'
1989 | expected:'C' | got:'C' | concept: 'hold horse'
1990 | expected:'A' | got:'A' | concept: 'hold horse'
1991 | expected:'B' | got:'A' | concept: 'hold horse'
1992 | expected:'C' | got:'C' | concept: 'hold hot_dog'
1993 | expected:'A' | got:'A' | concept: 'hold hot_dog'
1994 | expected:'B' | got:'B' | concept: 'hold hot_dog'
1995 | expected:'D' | got:'D' | concept: 'hold hot_dog'
1996 | expected:'D' | got:'D' | concept: 'hold person'
1997 | expected:'C' | got:'C' | concept: 'hold person'
1998 | expected:'A' | got:'A' | concept: 'hold person'
1999 | expected:'C' | got:'C' | concept: 'hold person'
2000 | expected:'C' | got:'C' | concept: 'ride skateboard'
2001 | expected:'C' | got:'C' | concept: 'ride skateboard'
2002 | expected:'B' | got:'B' | concept: 'ride skateboard'
2003 | expected:'B' | got:'B' | concept: 'ride skateboard'
2004 | expected:'C' | got:'C' | concept: 'hold hot_dog'
2005 | expected:'A' | got:'A' | concept: 'hold hot_dog'
2006 | expected:'A' | got:'A' | concept: 'hold hot_dog'
2007 | expected:'B' | got:'B' | concept: 'hold hot_dog'
2008 | expected:'D' | got:'D' | concept: 'hold cake'
2009 | expected:'D' | got:'B' | concept: 'hold cake'
2010 | expected:'A' | got:'C' | concept: 'hold cake'
2011 | expected:'D' | got:'A' | concept: 'hold cake'
2012 | expected:'A' | got:'A' | concept: 'hold skateboard'
2013 | expected:'B' | got:'B' | concept: 'hold skateboard'
2014 | expected:'B' | got:'B' | concept: 'hold skateboard'
2015 | expected:'A' | got:'A' | concept: 'hold skateboard'
2016 | expected:'A' | got:'A' | concept: 'ride skateboard'
2017 | expected:'B' | got:'C' | concept: 'ride skateboard'
2018 | expected:'A' | got:'A' | concept: 'ride skateboard'
2019 | expected:'A' | got:'A' | concept: 'ride skateboard'
2020 | expected:'D' | got:'D' | concept: 'hold skateboard'
2021 | expected:'B' | got:'B' | concept: 'hold skateboard'
2022 | expected:'A' | got:'A' | concept: 'hold skateboard'
2023 | expected:'D' | got:'D' | concept: 'hold skateboard'
2024 | expected:'D' | got:'D' | concept: 'jump skateboard'
2025 | expected:'A' | got:'A' | concept: 'jump skateboard'
2026 | expected:'B' | got:'B' | concept: 'jump skateboard'
2027 | expected:'D' | got:'D' | concept: 'jump skateboard'
2028 | expected:'C' | got:'C' | concept: 'ride skis'
2029 | expected:'C' | got:'C' | concept: 'ride skis'
2030 | expected:'A' | got:'A' | concept: 'ride skis'
2031 | expected:'C' | got:'C' | concept: 'ride skis'
2032 | expected:'C' | got:'C' | concept: 'jump skateboard'
2033 | expected:'A' | got:'A' | concept: 'jump skateboard'
2034 | expected:'D' | got:'D' | concept: 'jump skateboard'
2035 | expected:'A' | got:'A' | concept: 'jump skateboard'
2036 | expected:'D' | got:'D' | concept: 'jump snowboard'
2037 | expected:'B' | got:'D' | concept: 'jump snowboard'
2038 | expected:'D' | got:'D' | concept: 'jump snowboard'
2039 | expected:'D' | got:'D' | concept: 'jump snowboard'
2040 | expected:'C' | got:'C' | concept: 'jump bicycle'
2041 | expected:'A' | got:'A' | concept: 'jump bicycle'
2042 | expected:'D' | got:'D' | concept: 'jump bicycle'
2043 | expected:'B' | got:'B' | concept: 'jump bicycle'
2044 | expected:'A' | got:'A' | concept: 'jump skis'
2045 | expected:'C' | got:'A' | concept: 'jump skis'
2046 | expected:'B' | got:'B' | concept: 'jump skis'
2047 | expected:'D' | got:'D' | concept: 'jump skis'
2048 | expected:'D' | got:'D' | concept: 'drive train'
2049 | expected:'D' | got:'D' | concept: 'drive train'
2050 | expected:'B' | got:'B' | concept: 'drive train'
2051 | expected:'C' | got:'C' | concept: 'drive train'
2052 | expected:'D' | got:'D' | concept: 'board train'
2053 | expected:'B' | got:'B' | concept: 'board train'
2054 | expected:'D' | got:'D' | concept: 'board train'
2055 | expected:'A' | got:'A' | concept: 'board train'
2056 | expected:'C' | got:'C' | concept: 'wash car'
2057 | expected:'C' | got:'C' | concept: 'wash car'
2058 | expected:'C' | got:'C' | concept: 'wash car'
2059 | expected:'C' | got:'C' | concept: 'wash car'
2060 | expected:'B' | got:'B' | concept: 'drive car'
2061 | expected:'A' | got:'A' | concept: 'drive car'
2062 | expected:'C' | got:'C' | concept: 'drive car'
2063 | expected:'C' | got:'C' | concept: 'drive car'
2064 | expected:'D' | got:'D' | concept: 'jump bicycle'
2065 | expected:'A' | got:'A' | concept: 'jump bicycle'
2066 | expected:'D' | got:'D' | concept: 'jump bicycle'
2067 | expected:'A' | got:'A' | concept: 'jump bicycle'
2068 | expected:'B' | got:'A' | concept: 'straddle bicycle'
2069 | expected:'A' | got:'D' | concept: 'straddle bicycle'
2070 | expected:'A' | got:'B' | concept: 'straddle bicycle'
2071 | expected:'B' | got:'D' | concept: 'straddle bicycle'
2072 | expected:'C' | got:'C' | concept: 'ride bicycle'
2073 | expected:'B' | got:'B' | concept: 'ride bicycle'
2074 | expected:'C' | got:'C' | concept: 'ride bicycle'
2075 | expected:'D' | got:'D' | concept: 'ride bicycle'
2076 | expected:'B' | got:'D' | concept: 'walk bicycle'
2077 | expected:'C' | got:'C' | concept: 'walk bicycle'
2078 | expected:'B' | got:'B' | concept: 'walk bicycle'
2079 | expected:'B' | got:'D' | concept: 'walk bicycle'
2080 | expected:'C' | got:'C' | concept: 'hold mouse'
2081 | expected:'B' | got:'B' | concept: 'hold mouse'
2082 | expected:'A' | got:'A' | concept: 'hold mouse'
2083 | expected:'C' | got:'C' | concept: 'hold mouse'
2084 | expected:'C' | got:'C' | concept: 'hold wine_glass'
2085 | expected:'B' | got:'B' | concept: 'hold wine_glass'
2086 | expected:'A' | got:'A' | concept: 'hold wine_glass'
2087 | expected:'D' | got:'A' | concept: 'hold wine_glass'
2088 | expected:'A' | got:'A' | concept: 'hold apple'
2089 | expected:'C' | got:'C' | concept: 'hold apple'
2090 | expected:'B' | got:'B' | concept: 'hold apple'
2091 | expected:'B' | got:'B' | concept: 'hold apple'
2092 | expected:'C' | got:'C' | concept: 'hold handbag'
2093 | expected:'A' | got:'A' | concept: 'hold handbag'
2094 | expected:'D' | got:'A' | concept: 'hold handbag'
2095 | expected:'B' | got:'B' | concept: 'hold handbag'
2096 | expected:'B' | got:'D' | concept: 'clean microwave'
2097 | expected:'B' | got:'D' | concept: 'clean microwave'
2098 | expected:'D' | got:'A' | concept: 'clean microwave'
2099 | expected:'B' | got:'B' | concept: 'clean microwave'
2100 | expected:'D' | got:'D' | concept: 'open refrigerator'
2101 | expected:'D' | got:'D' | concept: 'open refrigerator'
2102 | expected:'B' | got:'B' | concept: 'open refrigerator'
2103 | expected:'B' | got:'B' | concept: 'open refrigerator'
2104 | expected:'C' | got:'C' | concept: 'clean refrigerator'
2105 | expected:'A' | got:'A' | concept: 'clean refrigerator'
2106 | expected:'A' | got:'A' | concept: 'clean refrigerator'
2107 | expected:'B' | got:'A' | concept: 'clean refrigerator'
2108 | expected:'B' | got:'B' | concept: 'open microwave'
2109 | expected:'D' | got:'A' | concept: 'open microwave'
2110 | expected:'B' | got:'B' | concept: 'open microwave'
2111 | expected:'D' | got:'D' | concept: 'open microwave'
2112 | expected:'D' | got:'A' | concept: 'stick knife'
2113 | expected:'B' | got:'D' | concept: 'stick knife'
2114 | expected:'C' | got:'B' | concept: 'stick knife'
2115 | expected:'C' | got:'D' | concept: 'stick knife'
2116 | expected:'A' | got:'A' | concept: 'hold knife'
2117 | expected:'C' | got:'C' | concept: 'hold knife'
2118 | expected:'C' | got:'C' | concept: 'hold knife'
2119 | expected:'C' | got:'C' | concept: 'hold knife'
2120 | expected:'B' | got:'B' | concept: 'hold mouse'
2121 | expected:'A' | got:'A' | concept: 'hold mouse'
2122 | expected:'C' | got:'C' | concept: 'hold mouse'
2123 | expected:'B' | got:'B' | concept: 'hold mouse'
2124 | expected:'D' | got:'D' | concept: 'hold sheep'
2125 | expected:'B' | got:'B' | concept: 'hold sheep'
2126 | expected:'B' | got:'B' | concept: 'hold sheep'
2127 | expected:'B' | got:'B' | concept: 'hold sheep'
2128 | expected:'B' | got:'B' | concept: 'clean keyboard'
2129 | expected:'D' | got:'A' | concept: 'clean keyboard'
2130 | expected:'D' | got:'D' | concept: 'clean keyboard'
2131 | expected:'D' | got:'D' | concept: 'clean keyboard'
2132 | expected:'B' | got:'B' | concept: 'inspect oven'
2133 | expected:'D' | got:'C' | concept: 'inspect oven'
2134 | expected:'D' | got:'C' | concept: 'inspect oven'
2135 | expected:'B' | got:'C' | concept: 'inspect oven'
2136 | expected:'A' | got:'A' | concept: 'clean oven'
2137 | expected:'A' | got:'A' | concept: 'clean oven'
2138 | expected:'D' | got:'A' | concept: 'clean oven'
2139 | expected:'D' | got:'D' | concept: 'clean oven'
2140 | expected:'C' | got:'C' | concept: 'clean refrigerator'
2141 | expected:'C' | got:'C' | concept: 'clean refrigerator'
2142 | expected:'D' | got:'D' | concept: 'clean refrigerator'
2143 | expected:'D' | got:'A' | concept: 'clean refrigerator'
2144 | expected:'A' | got:'A' | concept: 'lie_on bench'
2145 | expected:'C' | got:'C' | concept: 'lie_on bench'
2146 | expected:'C' | got:'C' | concept: 'lie_on bench'
2147 | expected:'A' | got:'A' | concept: 'lie_on bench'
2148 | expected:'B' | got:'B' | concept: 'sit_on couch'
2149 | expected:'A' | got:'C' | concept: 'sit_on couch'
2150 | expected:'A' | got:'A' | concept: 'sit_on couch'
2151 | expected:'B' | got:'B' | concept: 'sit_on couch'
2152 | expected:'B' | got:'B' | concept: 'lie_on bed'
2153 | expected:'B' | got:'B' | concept: 'lie_on bed'
2154 | expected:'A' | got:'C' | concept: 'lie_on bed'
2155 | expected:'B' | got:'B' | concept: 'lie_on bed'
2156 | expected:'A' | got:'D' | concept: 'lie_on couch'
2157 | expected:'D' | got:'D' | concept: 'lie_on couch'
2158 | expected:'A' | got:'A' | concept: 'lie_on couch'
2159 | expected:'A' | got:'A' | concept: 'lie_on couch'
2160 | expected:'C' | got:'C' | concept: 'hold bird'
2161 | expected:'D' | got:'D' | concept: 'hold bird'
2162 | expected:'A' | got:'A' | concept: 'hold bird'
2163 | expected:'B' | got:'B' | concept: 'hold bird'
2164 | expected:'D' | got:'D' | concept: 'hold horse'
2165 | expected:'D' | got:'D' | concept: 'hold horse'
2166 | expected:'B' | got:'B' | concept: 'hold horse'
2167 | expected:'C' | got:'C' | concept: 'hold horse'
2168 | expected:'C' | got:'C' | concept: 'hold cell_phone'
2169 | expected:'B' | got:'B' | concept: 'hold cell_phone'
2170 | expected:'D' | got:'D' | concept: 'hold cell_phone'
2171 | expected:'A' | got:'A' | concept: 'hold cell_phone'
2172 | expected:'D' | got:'D' | concept: 'hold vase'
2173 | expected:'C' | got:'C' | concept: 'hold vase'
2174 | expected:'D' | got:'A' | concept: 'hold vase'
2175 | expected:'D' | got:'D' | concept: 'hold vase'
2176 | expected:'A' | got:'A' | concept: 'jump motorcycle'
2177 | expected:'B' | got:'B' | concept: 'jump motorcycle'
2178 | expected:'D' | got:'D' | concept: 'jump motorcycle'
2179 | expected:'B' | got:'B' | concept: 'jump motorcycle'
2180 | expected:'D' | got:'D' | concept: 'inspect motorcycle'
2181 | expected:'A' | got:'A' | concept: 'inspect motorcycle'
2182 | expected:'D' | got:'D' | concept: 'inspect motorcycle'
2183 | expected:'A' | got:'A' | concept: 'inspect motorcycle'
2184 | expected:'D' | got:'D' | concept: 'push motorcycle'
2185 | expected:'C' | got:'C' | concept: 'push motorcycle'
2186 | expected:'C' | got:'C' | concept: 'push motorcycle'
2187 | expected:'A' | got:'D' | concept: 'push motorcycle'
2188 | expected:'D' | got:'D' | concept: 'wash motorcycle'
2189 | expected:'D' | got:'D' | concept: 'wash motorcycle'
2190 | expected:'B' | got:'B' | concept: 'wash motorcycle'
2191 | expected:'D' | got:'D' | concept: 'wash motorcycle'
2192 | expected:'C' | got:'C' | concept: 'kick sports_ball'
2193 | expected:'C' | got:'C' | concept: 'kick sports_ball'
2194 | expected:'A' | got:'A' | concept: 'kick sports_ball'
2195 | expected:'B' | got:'B' | concept: 'kick sports_ball'
2196 | expected:'B' | got:'D' | concept: 'hold sports_ball'
2197 | expected:'B' | got:'D' | concept: 'hold sports_ball'
2198 | expected:'C' | got:'A' | concept: 'hold sports_ball'
2199 | expected:'A' | got:'A' | concept: 'hold sports_ball'
2200 | expected:'B' | got:'B' | concept: 'hold knife'
2201 | expected:'C' | got:'C' | concept: 'hold knife'
2202 | expected:'D' | got:'D' | concept: 'hold knife'
2203 | expected:'C' | got:'C' | concept: 'hold knife'
2204 | expected:'A' | got:'C' | concept: 'block sports_ball'
2205 | expected:'B' | got:'B' | concept: 'block sports_ball'
2206 | expected:'B' | got:'C' | concept: 'block sports_ball'
2207 | expected:'D' | got:'C' | concept: 'block sports_ball'
2208 | expected:'C' | got:'D' | concept: 'jump motorcycle'
2209 | expected:'C' | got:'C' | concept: 'jump motorcycle'
2210 | expected:'A' | got:'A' | concept: 'jump motorcycle'
2211 | expected:'C' | got:'C' | concept: 'jump motorcycle'
2212 | expected:'A' | got:'A' | concept: 'wash motorcycle'
2213 | expected:'C' | got:'C' | concept: 'wash motorcycle'
2214 | expected:'B' | got:'A' | concept: 'wash motorcycle'
2215 | expected:'D' | got:'D' | concept: 'wash motorcycle'
2216 | expected:'D' | got:'D' | concept: 'sit_on motorcycle'
2217 | expected:'A' | got:'A' | concept: 'sit_on motorcycle'
2218 | expected:'A' | got:'A' | concept: 'sit_on motorcycle'
2219 | expected:'D' | got:'D' | concept: 'sit_on motorcycle'
2220 | expected:'A' | got:'A' | concept: 'turn motorcycle'
2221 | expected:'D' | got:'D' | concept: 'turn motorcycle'
2222 | expected:'D' | got:'D' | concept: 'turn motorcycle'
2223 | expected:'C' | got:'C' | concept: 'turn motorcycle'
2224 | expected:'C' | got:'C' | concept: 'clean toilet'
2225 | expected:'B' | got:'B' | concept: 'clean toilet'
2226 | expected:'D' | got:'D' | concept: 'clean toilet'
2227 | expected:'A' | got:'A' | concept: 'clean toilet'
2228 | expected:'B' | got:'B' | concept: 'clean oven'
2229 | expected:'D' | got:'D' | concept: 'clean oven'
2230 | expected:'A' | got:'A' | concept: 'clean oven'
2231 | expected:'B' | got:'B' | concept: 'clean oven'
2232 | expected:'B' | got:'B' | concept: 'clean keyboard'
2233 | expected:'B' | got:'B' | concept: 'clean keyboard'
2234 | expected:'D' | got:'D' | concept: 'clean keyboard'
2235 | expected:'D' | got:'A' | concept: 'clean keyboard'
2236 | expected:'C' | got:'C' | concept: 'clean microwave'
2237 | expected:'D' | got:'D' | concept: 'clean microwave'
2238 | expected:'B' | got:'B' | concept: 'clean microwave'
2239 | expected:'B' | got:'B' | concept: 'clean microwave'
2240 | expected:'A' | got:'A' | concept: 'wash motorcycle'
2241 | expected:'D' | got:'D' | concept: 'wash motorcycle'
2242 | expected:'C' | got:'C' | concept: 'wash motorcycle'
2243 | expected:'C' | got:'C' | concept: 'wash motorcycle'
2244 | expected:'A' | got:'A' | concept: 'adjust_or_tie tie'
2245 | expected:'B' | got:'B' | concept: 'adjust_or_tie tie'
2246 | expected:'A' | got:'A' | concept: 'adjust_or_tie tie'
2247 | expected:'D' | got:'A' | concept: 'adjust_or_tie tie'
2248 | expected:'A' | got:'A' | concept: 'wear tie'
2249 | expected:'C' | got:'C' | concept: 'wear tie'
2250 | expected:'B' | got:'A' | concept: 'wear tie'
2251 | expected:'C' | got:'A' | concept: 'wear tie'
2252 | expected:'B' | got:'B' | concept: 'wear backpack'
2253 | expected:'B' | got:'B' | concept: 'wear backpack'
2254 | expected:'C' | got:'C' | concept: 'wear backpack'
2255 | expected:'C' | got:'C' | concept: 'wear backpack'
2256 | expected:'C' | got:'A' | concept: 'grind snowboard'
2257 | expected:'D' | got:'B' | concept: 'grind snowboard'
2258 | expected:'C' | got:'A' | concept: 'grind snowboard'
2259 | expected:'B' | got:'A' | concept: 'grind snowboard'
2260 | expected:'D' | got:'D' | concept: 'ride snowboard'
2261 | expected:'C' | got:'C' | concept: 'ride snowboard'
2262 | expected:'A' | got:'A' | concept: 'ride snowboard'
2263 | expected:'A' | got:'A' | concept: 'ride snowboard'
2264 | expected:'B' | got:'B' | concept: 'grind skateboard'
2265 | expected:'C' | got:'C' | concept: 'grind skateboard'
2266 | expected:'A' | got:'A' | concept: 'grind skateboard'
2267 | expected:'D' | got:'A' | concept: 'grind skateboard'
2268 | expected:'A' | got:'A' | concept: 'jump snowboard'
2269 | expected:'A' | got:'C' | concept: 'jump snowboard'
2270 | expected:'C' | got:'C' | concept: 'jump snowboard'
2271 | expected:'A' | got:'A' | concept: 'jump snowboard'
2272 | expected:'C' | got:'C' | concept: 'hold vase'
2273 | expected:'D' | got:'A' | concept: 'hold vase'
2274 | expected:'C' | got:'B' | concept: 'hold vase'
2275 | expected:'C' | got:'D' | concept: 'hold vase'
2276 | expected:'B' | got:'B' | concept: 'hold dog'
2277 | expected:'A' | got:'A' | concept: 'hold dog'
2278 | expected:'B' | got:'B' | concept: 'hold dog'
2279 | expected:'D' | got:'D' | concept: 'hold dog'
2280 | expected:'D' | got:'D' | concept: 'hold donut'
2281 | expected:'B' | got:'B' | concept: 'hold donut'
2282 | expected:'C' | got:'C' | concept: 'hold donut'
2283 | expected:'D' | got:'D' | concept: 'hold donut'
2284 | expected:'B' | got:'B' | concept: 'hold sports_ball'
2285 | expected:'A' | got:'A' | concept: 'hold sports_ball'
2286 | expected:'D' | got:'B' | concept: 'hold sports_ball'
2287 | expected:'B' | got:'B' | concept: 'hold sports_ball'
2288 | expected:'D' | got:'D' | concept: 'jump horse'
2289 | expected:'C' | got:'C' | concept: 'jump horse'
2290 | expected:'A' | got:'A' | concept: 'jump horse'
2291 | expected:'C' | got:'D' | concept: 'jump horse'
2292 | expected:'B' | got:'B' | concept: 'jump skateboard'
2293 | expected:'D' | got:'D' | concept: 'jump skateboard'
2294 | expected:'C' | got:'C' | concept: 'jump skateboard'
2295 | expected:'C' | got:'C' | concept: 'jump skateboard'
2296 | expected:'B' | got:'B' | concept: 'jump snowboard'
2297 | expected:'A' | got:'C' | concept: 'jump snowboard'
2298 | expected:'A' | got:'A' | concept: 'jump snowboard'
2299 | expected:'D' | got:'D' | concept: 'jump snowboard'
2300 | expected:'A' | got:'A' | concept: 'ride horse'
2301 | expected:'C' | got:'C' | concept: 'ride horse'
2302 | expected:'A' | got:'A' | concept: 'ride horse'
2303 | expected:'C' | got:'C' | concept: 'ride horse'
2304 | expected:'D' | got:'D' | concept: 'jump motorcycle'
2305 | expected:'D' | got:'D' | concept: 'jump motorcycle'
2306 | expected:'A' | got:'A' | concept: 'jump motorcycle'
2307 | expected:'B' | got:'B' | concept: 'jump motorcycle'
2308 | expected:'A' | got:'A' | concept: 'inspect motorcycle'
2309 | expected:'D' | got:'D' | concept: 'inspect motorcycle'
2310 | expected:'D' | got:'D' | concept: 'inspect motorcycle'
2311 | expected:'A' | got:'A' | concept: 'inspect motorcycle'
2312 | expected:'C' | got:'C' | concept: 'wash motorcycle'
2313 | expected:'A' | got:'A' | concept: 'wash motorcycle'
2314 | expected:'A' | got:'A' | concept: 'wash motorcycle'
2315 | expected:'A' | got:'A' | concept: 'wash motorcycle'
2316 | expected:'B' | got:'B' | concept: 'jump horse'
2317 | expected:'A' | got:'A' | concept: 'jump horse'
2318 | expected:'C' | got:'C' | concept: 'jump horse'
2319 | expected:'D' | got:'D' | concept: 'jump horse'
2320 | expected:'D' | got:'B' | concept: 'hold hot_dog'
2321 | expected:'C' | got:'C' | concept: 'hold hot_dog'
2322 | expected:'C' | got:'A' | concept: 'hold hot_dog'
2323 | expected:'C' | got:'C' | concept: 'hold hot_dog'
2324 | expected:'B' | got:'B' | concept: 'eat hot_dog'
2325 | expected:'A' | got:'A' | concept: 'eat hot_dog'
2326 | expected:'A' | got:'A' | concept: 'eat hot_dog'
2327 | expected:'D' | got:'D' | concept: 'eat hot_dog'
2328 | expected:'C' | got:'C' | concept: 'eat apple'
2329 | expected:'C' | got:'C' | concept: 'eat apple'
2330 | expected:'C' | got:'C' | concept: 'eat apple'
2331 | expected:'A' | got:'A' | concept: 'eat apple'
2332 | expected:'C' | got:'C' | concept: 'eat sandwich'
2333 | expected:'A' | got:'A' | concept: 'eat sandwich'
2334 | expected:'D' | got:'C' | concept: 'eat sandwich'
2335 | expected:'B' | got:'B' | concept: 'eat sandwich'
2336 | expected:'A' | got:'A' | concept: 'lie_on_like chair'
2337 | expected:'B' | got:'B' | concept: 'lie_on_like chair'
2338 | expected:'B' | got:'B' | concept: 'lie_on_like chair'
2339 | expected:'A' | got:'A' | concept: 'lie_on_like chair'
2340 | expected:'C' | got:'C' | concept: 'stand_on chair'
2341 | expected:'D' | got:'D' | concept: 'stand_on chair'
2342 | expected:'D' | got:'A' | concept: 'stand_on chair'
2343 | expected:'A' | got:'A' | concept: 'stand_on chair'
2344 | expected:'C' | got:'C' | concept: 'row boat'
2345 | expected:'D' | got:'D' | concept: 'row boat'
2346 | expected:'D' | got:'D' | concept: 'row boat'
2347 | expected:'C' | got:'D' | concept: 'row boat'
2348 | expected:'A' | got:'A' | concept: 'stand_on boat'
2349 | expected:'C' | got:'C' | concept: 'stand_on boat'
2350 | expected:'B' | got:'A' | concept: 'stand_on boat'
2351 | expected:'B' | got:'B' | concept: 'stand_on boat'
2352 | expected:'B' | got:'B' | concept: 'hold dog'
2353 | expected:'C' | got:'C' | concept: 'hold dog'
2354 | expected:'B' | got:'B' | concept: 'hold dog'
2355 | expected:'C' | got:'C' | concept: 'hold dog'
2356 | expected:'C' | got:'C' | concept: 'hold donut'
2357 | expected:'B' | got:'B' | concept: 'hold donut'
2358 | expected:'C' | got:'C' | concept: 'hold donut'
2359 | expected:'C' | got:'C' | concept: 'hold donut'
2360 | expected:'D' | got:'C' | concept: 'hold cake'
2361 | expected:'D' | got:'INVALID' | concept: 'hold cake'
2362 | expected:'B' | got:'C' | concept: 'hold cake'
2363 | expected:'C' | got:'D' | concept: 'hold cake'
2364 | expected:'B' | got:'B' | concept: 'hold wine_glass'
2365 | expected:'B' | got:'B' | concept: 'hold wine_glass'
2366 | expected:'A' | got:'A' | concept: 'hold wine_glass'
2367 | expected:'B' | got:'B' | concept: 'hold wine_glass'
2368 | expected:'B' | got:'B' | concept: 'train dog'
2369 | expected:'A' | got:'A' | concept: 'train dog'
2370 | expected:'B' | got:'B' | concept: 'train dog'
2371 | expected:'D' | got:'D' | concept: 'train dog'
2372 | expected:'A' | got:'A' | concept: 'control tv'
2373 | expected:'C' | got:'C' | concept: 'control tv'
2374 | expected:'B' | got:'B' | concept: 'control tv'
2375 | expected:'D' | got:'D' | concept: 'control tv'
2376 | expected:'D' | got:'A' | concept: 'watch tv'
2377 | expected:'B' | got:'B' | concept: 'watch tv'
2378 | expected:'B' | got:'B' | concept: 'watch tv'
2379 | expected:'C' | got:'C' | concept: 'watch tv'
2380 | expected:'B' | got:'B' | concept: 'hug person'
2381 | expected:'C' | got:'C' | concept: 'hug person'
2382 | expected:'A' | got:'A' | concept: 'hug person'
2383 | expected:'D' | got:'D' | concept: 'hug person'
2384 | expected:'D' | got:'D' | concept: 'hold vase'
2385 | expected:'D' | got:'A' | concept: 'hold vase'
2386 | expected:'A' | got:'A' | concept: 'hold vase'
2387 | expected:'B' | got:'B' | concept: 'hold vase'
2388 | expected:'C' | got:'D' | concept: 'hold knife'
2389 | expected:'B' | got:'B' | concept: 'hold knife'
2390 | expected:'C' | got:'C' | concept: 'hold knife'
2391 | expected:'C' | got:'C' | concept: 'hold knife'
2392 | expected:'B' | got:'B' | concept: 'hold spoon'
2393 | expected:'D' | got:'D' | concept: 'hold spoon'
2394 | expected:'B' | got:'B' | concept: 'hold spoon'
2395 | expected:'B' | got:'B' | concept: 'hold spoon'
2396 | expected:'A' | got:'A' | concept: 'hold cup'
2397 | expected:'D' | got:'C' | concept: 'hold cup'
2398 | expected:'B' | got:'B' | concept: 'hold cup'
2399 | expected:'A' | got:'A' | concept: 'hold cup'
2400 | expected:'A' | got:'A' | concept: 'ride motorcycle'
2401 | expected:'C' | got:'C' | concept: 'ride motorcycle'
2402 | expected:'D' | got:'D' | concept: 'ride motorcycle'
2403 | expected:'C' | got:'C' | concept: 'ride motorcycle'
2404 | expected:'C' | got:'C' | concept: 'ride skis'
2405 | expected:'B' | got:'B' | concept: 'ride skis'
2406 | expected:'A' | got:'A' | concept: 'ride skis'
2407 | expected:'C' | got:'C' | concept: 'ride skis'
2408 | expected:'A' | got:'A' | concept: 'sit_on motorcycle'
2409 | expected:'C' | got:'B' | concept: 'sit_on motorcycle'
2410 | expected:'C' | got:'C' | concept: 'sit_on motorcycle'
2411 | expected:'D' | got:'B' | concept: 'sit_on motorcycle'
2412 | expected:'A' | got:'C' | concept: 'turn motorcycle'
2413 | expected:'A' | got:'B' | concept: 'turn motorcycle'
2414 | expected:'D' | got:'C' | concept: 'turn motorcycle'
2415 | expected:'C' | got:'C' | concept: 'turn motorcycle'
2416 | expected:'A' | got:'A' | concept: 'hold sandwich'
2417 | expected:'D' | got:'A' | concept: 'hold sandwich'
2418 | expected:'C' | got:'C' | concept: 'hold sandwich'
2419 | expected:'D' | got:'D' | concept: 'hold sandwich'
2420 | expected:'D' | got:'D' | concept: 'jump horse'
2421 | expected:'D' | got:'D' | concept: 'jump horse'
2422 | expected:'C' | got:'C' | concept: 'jump horse'
2423 | expected:'A' | got:'A' | concept: 'jump horse'
2424 | expected:'C' | got:'C' | concept: 'hold bird'
2425 | expected:'D' | got:'D' | concept: 'hold bird'
2426 | expected:'A' | got:'A' | concept: 'hold bird'
2427 | expected:'B' | got:'B' | concept: 'hold bird'
2428 | expected:'D' | got:'D' | concept: 'hold horse'
2429 | expected:'D' | got:'D' | concept: 'hold horse'
2430 | expected:'C' | got:'C' | concept: 'hold horse'
2431 | expected:'A' | got:'A' | concept: 'hold horse'
2432 | expected:'A' | got:'A' | concept: 'hold skateboard'
2433 | expected:'A' | got:'A' | concept: 'hold skateboard'
2434 | expected:'B' | got:'B' | concept: 'hold skateboard'
2435 | expected:'B' | got:'B' | concept: 'hold skateboard'
2436 | expected:'D' | got:'D' | concept: 'hold bird'
2437 | expected:'A' | got:'A' | concept: 'hold bird'
2438 | expected:'A' | got:'A' | concept: 'hold bird'
2439 | expected:'D' | got:'B' | concept: 'hold bird'
2440 | expected:'A' | got:'A' | concept: 'hold toothbrush'
2441 | expected:'A' | got:'A' | concept: 'hold toothbrush'
2442 | expected:'B' | got:'B' | concept: 'hold toothbrush'
2443 | expected:'C' | got:'C' | concept: 'hold toothbrush'
2444 | expected:'D' | got:'D' | concept: 'hold laptop'
2445 | expected:'A' | got:'A' | concept: 'hold laptop'
2446 | expected:'B' | got:'B' | concept: 'hold laptop'
2447 | expected:'C' | got:'C' | concept: 'hold laptop'
2448 | expected:'B' | got:'B' | concept: 'sit_on motorcycle'
2449 | expected:'A' | got:'A' | concept: 'sit_on motorcycle'
2450 | expected:'A' | got:'A' | concept: 'sit_on motorcycle'
2451 | expected:'A' | got:'A' | concept: 'sit_on motorcycle'
2452 | expected:'C' | got:'C' | concept: 'sit_on bench'
2453 | expected:'C' | got:'C' | concept: 'sit_on bench'
2454 | expected:'A' | got:'A' | concept: 'sit_on bench'
2455 | expected:'A' | got:'A' | concept: 'sit_on bench'
2456 | expected:'D' | got:'D' | concept: 'sit_on skateboard'
2457 | expected:'C' | got:'C' | concept: 'sit_on skateboard'
2458 | expected:'D' | got:'D' | concept: 'sit_on skateboard'
2459 | expected:'D' | got:'D' | concept: 'sit_on skateboard'
2460 | expected:'D' | got:'D' | concept: 'sit_on truck'
2461 | expected:'A' | got:'D' | concept: 'sit_on truck'
2462 | expected:'A' | got:'B' | concept: 'sit_on truck'
2463 | expected:'D' | got:'D' | concept: 'sit_on truck'
2464 | expected:'A' | got:'A' | concept: 'hold pizza'
2465 | expected:'A' | got:'A' | concept: 'hold pizza'
2466 | expected:'C' | got:'C' | concept: 'hold pizza'
2467 | expected:'D' | got:'D' | concept: 'hold pizza'
2468 | expected:'C' | got:'C' | concept: 'hold donut'
2469 | expected:'A' | got:'A' | concept: 'hold donut'
2470 | expected:'D' | got:'D' | concept: 'hold donut'
2471 | expected:'B' | got:'B' | concept: 'hold donut'
2472 | expected:'C' | got:'C' | concept: 'hold cell_phone'
2473 | expected:'B' | got:'B' | concept: 'hold cell_phone'
2474 | expected:'D' | got:'D' | concept: 'hold cell_phone'
2475 | expected:'A' | got:'A' | concept: 'hold cell_phone'
2476 | expected:'B' | got:'B' | concept: 'hold spoon'
2477 | expected:'D' | got:'D' | concept: 'hold spoon'
2478 | expected:'A' | got:'A' | concept: 'hold spoon'
2479 | expected:'D' | got:'D' | concept: 'hold spoon'
2480 | expected:'C' | got:'C' | concept: 'jump horse'
2481 | expected:'A' | got:'A' | concept: 'jump horse'
2482 | expected:'D' | got:'D' | concept: 'jump horse'
2483 | expected:'D' | got:'D' | concept: 'jump horse'
2484 | expected:'A' | got:'A' | concept: 'jump skateboard'
2485 | expected:'C' | got:'C' | concept: 'jump skateboard'
2486 | expected:'A' | got:'A' | concept: 'jump skateboard'
2487 | expected:'D' | got:'D' | concept: 'jump skateboard'
2488 | expected:'C' | got:'C' | concept: 'jump skis'
2489 | expected:'D' | got:'D' | concept: 'jump skis'
2490 | expected:'C' | got:'C' | concept: 'jump skis'
2491 | expected:'C' | got:'C' | concept: 'jump skis'
2492 | expected:'C' | got:'C' | concept: 'jump motorcycle'
2493 | expected:'D' | got:'D' | concept: 'jump motorcycle'
2494 | expected:'A' | got:'A' | concept: 'jump motorcycle'
2495 | expected:'A' | got:'A' | concept: 'jump motorcycle'
2496 | expected:'C' | got:'B' | concept: 'clean microwave'
2497 | expected:'B' | got:'B' | concept: 'clean microwave'
2498 | expected:'B' | got:'B' | concept: 'clean microwave'
2499 | expected:'D' | got:'C' | concept: 'clean microwave'
2500 | expected:'B' | got:'B' | concept: 'clean refrigerator'
2501 | expected:'B' | got:'B' | concept: 'clean refrigerator'
2502 | expected:'D' | got:'A' | concept: 'clean refrigerator'
2503 | expected:'D' | got:'D' | concept: 'clean refrigerator'
2504 | expected:'A' | got:'A' | concept: 'open refrigerator'
2505 | expected:'D' | got:'D' | concept: 'open refrigerator'
2506 | expected:'D' | got:'D' | concept: 'open refrigerator'
2507 | expected:'B' | got:'B' | concept: 'open refrigerator'
2508 | expected:'D' | got:'A' | concept: 'open microwave'
2509 | expected:'C' | got:'C' | concept: 'open microwave'
2510 | expected:'D' | got:'D' | concept: 'open microwave'
2511 | expected:'D' | got:'D' | concept: 'open microwave'
2512 | expected:'C' | got:'C' | concept: 'hug cat'
2513 | expected:'B' | got:'A' | concept: 'hug cat'
2514 | expected:'A' | got:'A' | concept: 'hug cat'
2515 | expected:'D' | got:'A' | concept: 'hug cat'
2516 | expected:'B' | got:'B' | concept: 'hug person'
2517 | expected:'B' | got:'B' | concept: 'hug person'
2518 | expected:'D' | got:'D' | concept: 'hug person'
2519 | expected:'B' | got:'B' | concept: 'hug person'
2520 | expected:'B' | got:'D' | concept: 'pet cat'
2521 | expected:'B' | got:'B' | concept: 'pet cat'
2522 | expected:'C' | got:'C' | concept: 'pet cat'
2523 | expected:'D' | got:'A' | concept: 'pet cat'
2524 | expected:'C' | got:'C' | concept: 'hug horse'
2525 | expected:'B' | got:'B' | concept: 'hug horse'
2526 | expected:'C' | got:'C' | concept: 'hug horse'
2527 | expected:'C' | got:'C' | concept: 'hug horse'
2528 | expected:'B' | got:'C' | concept: 'hold wine_glass'
2529 | expected:'D' | got:'D' | concept: 'hold wine_glass'
2530 | expected:'B' | got:'B' | concept: 'hold wine_glass'
2531 | expected:'D' | got:'C' | concept: 'hold wine_glass'
2532 | expected:'B' | got:'B' | concept: 'hold apple'
2533 | expected:'B' | got:'B' | concept: 'hold apple'
2534 | expected:'C' | got:'C' | concept: 'hold apple'
2535 | expected:'B' | got:'B' | concept: 'hold apple'
2536 | expected:'B' | got:'B' | concept: 'toast wine_glass'
2537 | expected:'D' | got:'D' | concept: 'toast wine_glass'
2538 | expected:'D' | got:'D' | concept: 'toast wine_glass'
2539 | expected:'A' | got:'A' | concept: 'toast wine_glass'
2540 | expected:'B' | got:'A' | concept: 'sip wine_glass'
2541 | expected:'D' | got:'D' | concept: 'sip wine_glass'
2542 | expected:'C' | got:'C' | concept: 'sip wine_glass'
2543 | expected:'D' | got:'D' | concept: 'sip wine_glass'
2544 | expected:'B' | got:'B' | concept: 'hold wine_glass'
2545 | expected:'A' | got:'A' | concept: 'hold wine_glass'
2546 | expected:'D' | got:'D' | concept: 'hold wine_glass'
2547 | expected:'A' | got:'A' | concept: 'hold wine_glass'
2548 | expected:'C' | got:'C' | concept: 'hold pizza'
2549 | expected:'B' | got:'B' | concept: 'hold pizza'
2550 | expected:'A' | got:'A' | concept: 'hold pizza'
2551 | expected:'B' | got:'B' | concept: 'hold pizza'
2552 | expected:'D' | got:'D' | concept: 'hold donut'
2553 | expected:'B' | got:'B' | concept: 'hold donut'
2554 | expected:'A' | got:'A' | concept: 'hold donut'
2555 | expected:'C' | got:'C' | concept: 'hold donut'
2556 | expected:'A' | got:'A' | concept: 'hold mouse'
2557 | expected:'A' | got:'A' | concept: 'hold mouse'
2558 | expected:'B' | got:'B' | concept: 'hold mouse'
2559 | expected:'C' | got:'C' | concept: 'hold mouse'
2560 | expected:'C' | got:'C' | concept: 'hold dog'
2561 | expected:'A' | got:'C' | concept: 'hold dog'
2562 | expected:'C' | got:'C' | concept: 'hold dog'
2563 | expected:'D' | got:'D' | concept: 'hold dog'
2564 | expected:'D' | got:'D' | concept: 'kick sports_ball'
2565 | expected:'B' | got:'B' | concept: 'kick sports_ball'
2566 | expected:'D' | got:'D' | concept: 'kick sports_ball'
2567 | expected:'A' | got:'A' | concept: 'kick sports_ball'
2568 | expected:'C' | got:'C' | concept: 'hold sports_ball'
2569 | expected:'A' | got:'C' | concept: 'hold sports_ball'
2570 | expected:'D' | got:'A' | concept: 'hold sports_ball'
2571 | expected:'B' | got:'B' | concept: 'hold sports_ball'
2572 | expected:'C' | got:'C' | concept: 'block sports_ball'
2573 | expected:'A' | got:'D' | concept: 'block sports_ball'
2574 | expected:'B' | got:'D' | concept: 'block sports_ball'
2575 | expected:'C' | got:'C' | concept: 'block sports_ball'
2576 | expected:'C' | got:'C' | concept: 'feed giraffe'
2577 | expected:'B' | got:'B' | concept: 'feed giraffe'
2578 | expected:'A' | got:'A' | concept: 'feed giraffe'
2579 | expected:'B' | got:'B' | concept: 'feed giraffe'
2580 | expected:'D' | got:'A' | concept: 'feed elephant'
2581 | expected:'C' | got:'C' | concept: 'feed elephant'
2582 | expected:'D' | got:'A' | concept: 'feed elephant'
2583 | expected:'B' | got:'B' | concept: 'feed elephant'
2584 | expected:'D' | got:'D' | concept: 'pet horse'
2585 | expected:'A' | got:'A' | concept: 'pet horse'
2586 | expected:'D' | got:'D' | concept: 'pet horse'
2587 | expected:'C' | got:'C' | concept: 'pet horse'
2588 | expected:'C' | got:'D' | concept: 'feed horse'
2589 | expected:'C' | got:'C' | concept: 'feed horse'
2590 | expected:'D' | got:'A' | concept: 'feed horse'
2591 | expected:'D' | got:'D' | concept: 'feed horse'
2592 | expected:'B' | got:'C' | concept: 'hold mouse'
2593 | expected:'D' | got:'D' | concept: 'hold mouse'
2594 | expected:'D' | got:'D' | concept: 'hold mouse'
2595 | expected:'B' | got:'C' | concept: 'hold mouse'
2596 | expected:'C' | got:'C' | concept: 'hold wine_glass'
2597 | expected:'D' | got:'D' | concept: 'hold wine_glass'
2598 | expected:'A' | got:'D' | concept: 'hold wine_glass'
2599 | expected:'C' | got:'C' | concept: 'hold wine_glass'
2600 | expected:'C' | got:'C' | concept: 'hold cell_phone'
2601 | expected:'A' | got:'A' | concept: 'hold cell_phone'
2602 | expected:'D' | got:'D' | concept: 'hold cell_phone'
2603 | expected:'C' | got:'D' | concept: 'hold cell_phone'
2604 | expected:'C' | got:'C' | concept: 'toast wine_glass'
2605 | expected:'C' | got:'C' | concept: 'toast wine_glass'
2606 | expected:'D' | got:'D' | concept: 'toast wine_glass'
2607 | expected:'D' | got:'D' | concept: 'toast wine_glass'
2608 | expected:'D' | got:'C' | concept: 'wield knife'
2609 | expected:'C' | got:'C' | concept: 'wield knife'
2610 | expected:'B' | got:'A' | concept: 'wield knife'
2611 | expected:'B' | got:'D' | concept: 'wield knife'
2612 | expected:'C' | got:'A' | concept: 'stick knife'
2613 | expected:'B' | got:'A' | concept: 'stick knife'
2614 | expected:'D' | got:'B' | concept: 'stick knife'
2615 | expected:'A' | got:'B' | concept: 'stick knife'
2616 | expected:'A' | got:'A' | concept: 'hold knife'
2617 | expected:'D' | got:'A' | concept: 'hold knife'
2618 | expected:'D' | got:'B' | concept: 'hold knife'
2619 | expected:'B' | got:'B' | concept: 'hold knife'
2620 | expected:'D' | got:'D' | concept: 'lick knife'
2621 | expected:'C' | got:'C' | concept: 'lick knife'
2622 | expected:'C' | got:'C' | concept: 'lick knife'
2623 | expected:'C' | got:'C' | concept: 'lick knife'
2624 | expected:'A' | got:'A' | concept: 'hold knife'
2625 | expected:'B' | got:'B' | concept: 'hold knife'
2626 | expected:'C' | got:'C' | concept: 'hold knife'
2627 | expected:'A' | got:'A' | concept: 'hold knife'
2628 | expected:'C' | got:'C' | concept: 'hold tennis_racket'
2629 | expected:'C' | got:'C' | concept: 'hold tennis_racket'
2630 | expected:'C' | got:'C' | concept: 'hold tennis_racket'
2631 | expected:'C' | got:'C' | concept: 'hold tennis_racket'
2632 | expected:'C' | got:'C' | concept: 'hold sandwich'
2633 | expected:'A' | got:'A' | concept: 'hold sandwich'
2634 | expected:'C' | got:'C' | concept: 'hold sandwich'
2635 | expected:'B' | got:'B' | concept: 'hold sandwich'
2636 | expected:'C' | got:'C' | concept: 'hold umbrella'
2637 | expected:'D' | got:'D' | concept: 'hold umbrella'
2638 | expected:'B' | got:'B' | concept: 'hold umbrella'
2639 | expected:'B' | got:'A' | concept: 'hold umbrella'
2640 | expected:'D' | got:'D' | concept: 'hold pizza'
2641 | expected:'A' | got:'A' | concept: 'hold pizza'
2642 | expected:'A' | got:'A' | concept: 'hold pizza'
2643 | expected:'C' | got:'C' | concept: 'hold pizza'
2644 | expected:'A' | got:'A' | concept: 'hold cake'
2645 | expected:'D' | got:'C' | concept: 'hold cake'
2646 | expected:'A' | got:'C' | concept: 'hold cake'
2647 | expected:'A' | got:'B' | concept: 'hold cake'
2648 | expected:'B' | got:'B' | concept: 'hold scissors'
2649 | expected:'B' | got:'B' | concept: 'hold scissors'
2650 | expected:'C' | got:'C' | concept: 'hold scissors'
2651 | expected:'B' | got:'B' | concept: 'hold scissors'
2652 | expected:'A' | got:'A' | concept: 'hold sandwich'
2653 | expected:'C' | got:'C' | concept: 'hold sandwich'
2654 | expected:'A' | got:'A' | concept: 'hold sandwich'
2655 | expected:'C' | got:'C' | concept: 'hold sandwich'
2656 | expected:'B' | got:'D' | concept: 'hold cell_phone'
2657 | expected:'C' | got:'C' | concept: 'hold cell_phone'
2658 | expected:'D' | got:'D' | concept: 'hold cell_phone'
2659 | expected:'B' | got:'B' | concept: 'hold cell_phone'
2660 | expected:'C' | got:'C' | concept: 'talk_on_or_listen_to cell_phone'
2661 | expected:'B' | got:'B' | concept: 'talk_on_or_listen_to cell_phone'
2662 | expected:'D' | got:'A' | concept: 'talk_on_or_listen_to cell_phone'
2663 | expected:'C' | got:'C' | concept: 'talk_on_or_listen_to cell_phone'
2664 | expected:'B' | got:'A' | concept: 'read_like cell_phone'
2665 | expected:'B' | got:'D' | concept: 'read_like cell_phone'
2666 | expected:'D' | got:'A' | concept: 'read_like cell_phone'
2667 | expected:'C' | got:'A' | concept: 'read_like cell_phone'
2668 | expected:'D' | got:'A' | concept: 'hold sandwich'
2669 | expected:'B' | got:'B' | concept: 'hold sandwich'
2670 | expected:'C' | got:'C' | concept: 'hold sandwich'
2671 | expected:'D' | got:'A' | concept: 'hold sandwich'
2672 | expected:'D' | got:'D' | concept: 'greet person'
2673 | expected:'B' | got:'C' | concept: 'greet person'
2674 | expected:'D' | got:'D' | concept: 'greet person'
2675 | expected:'B' | got:'B' | concept: 'greet person'
2676 | expected:'B' | got:'B' | concept: 'kiss person'
2677 | expected:'D' | got:'C' | concept: 'kiss person'
2678 | expected:'D' | got:'D' | concept: 'kiss person'
2679 | expected:'D' | got:'D' | concept: 'kiss person'
2680 | expected:'C' | got:'C' | concept: 'hug cat'
2681 | expected:'C' | got:'C' | concept: 'hug cat'
2682 | expected:'A' | got:'A' | concept: 'hug cat'
2683 | expected:'B' | got:'B' | concept: 'hug cat'
2684 | expected:'D' | got:'D' | concept: 'hug person'
2685 | expected:'D' | got:'D' | concept: 'hug person'
2686 | expected:'C' | got:'C' | concept: 'hug person'
2687 | expected:'D' | got:'D' | concept: 'hug person'
2688 | expected:'C' | got:'C' | concept: 'hold toothbrush'
2689 | expected:'B' | got:'B' | concept: 'hold toothbrush'
2690 | expected:'A' | got:'A' | concept: 'hold toothbrush'
2691 | expected:'D' | got:'D' | concept: 'hold toothbrush'
2692 | expected:'A' | got:'C' | concept: 'carry handbag'
2693 | expected:'C' | got:'C' | concept: 'carry handbag'
2694 | expected:'C' | got:'C' | concept: 'carry handbag'
2695 | expected:'B' | got:'A' | concept: 'carry handbag'
2696 | expected:'A' | got:'B' | concept: 'hold handbag'
2697 | expected:'D' | got:'D' | concept: 'hold handbag'
2698 | expected:'C' | got:'B' | concept: 'hold handbag'
2699 | expected:'C' | got:'A' | concept: 'hold handbag'
2700 | expected:'A' | got:'B' | concept: 'hold sports_ball'
2701 | expected:'B' | got:'B' | concept: 'hold sports_ball'
2702 | expected:'B' | got:'B' | concept: 'hold sports_ball'
2703 | expected:'A' | got:'A' | concept: 'hold sports_ball'
2704 | expected:'B' | got:'B' | concept: 'push motorcycle'
2705 | expected:'A' | got:'C' | concept: 'push motorcycle'
2706 | expected:'A' | got:'D' | concept: 'push motorcycle'
2707 | expected:'B' | got:'B' | concept: 'push motorcycle'
2708 | expected:'B' | got:'B' | concept: 'ride motorcycle'
2709 | expected:'C' | got:'B' | concept: 'ride motorcycle'
2710 | expected:'B' | got:'B' | concept: 'ride motorcycle'
2711 | expected:'B' | got:'B' | concept: 'ride motorcycle'
2712 | expected:'A' | got:'C' | concept: 'straddle motorcycle'
2713 | expected:'A' | got:'B' | concept: 'straddle motorcycle'
2714 | expected:'A' | got:'D' | concept: 'straddle motorcycle'
2715 | expected:'B' | got:'C' | concept: 'straddle motorcycle'
2716 | expected:'D' | got:'B' | concept: 'sit_on motorcycle'
2717 | expected:'A' | got:'A' | concept: 'sit_on motorcycle'
2718 | expected:'B' | got:'C' | concept: 'sit_on motorcycle'
2719 | expected:'B' | got:'A' | concept: 'sit_on motorcycle'
2720 | expected:'B' | got:'B' | concept: 'eat donut'
2721 | expected:'B' | got:'B' | concept: 'eat donut'
2722 | expected:'D' | got:'D' | concept: 'eat donut'
2723 | expected:'A' | got:'A' | concept: 'eat donut'
2724 | expected:'C' | got:'C' | concept: 'cut pizza'
2725 | expected:'C' | got:'C' | concept: 'cut pizza'
2726 | expected:'A' | got:'A' | concept: 'cut pizza'
2727 | expected:'D' | got:'D' | concept: 'cut pizza'
2728 | expected:'D' | got:'D' | concept: 'eat pizza'
2729 | expected:'A' | got:'C' | concept: 'eat pizza'
2730 | expected:'A' | got:'A' | concept: 'eat pizza'
2731 | expected:'C' | got:'C' | concept: 'eat pizza'
2732 | expected:'B' | got:'B' | concept: 'eat apple'
2733 | expected:'A' | got:'A' | concept: 'eat apple'
2734 | expected:'B' | got:'B' | concept: 'eat apple'
2735 | expected:'B' | got:'B' | concept: 'eat apple'
2736 | expected:'D' | got:'D' | concept: 'eat apple'
2737 | expected:'B' | got:'B' | concept: 'eat apple'
2738 | expected:'C' | got:'A' | concept: 'eat apple'
2739 | expected:'D' | got:'D' | concept: 'eat apple'
2740 | expected:'C' | got:'C' | concept: 'eat banana'
2741 | expected:'D' | got:'D' | concept: 'eat banana'
2742 | expected:'D' | got:'D' | concept: 'eat banana'
2743 | expected:'B' | got:'B' | concept: 'eat banana'
2744 | expected:'C' | got:'C' | concept: 'eat hot_dog'
2745 | expected:'C' | got:'C' | concept: 'eat hot_dog'
2746 | expected:'B' | got:'B' | concept: 'eat hot_dog'
2747 | expected:'A' | got:'D' | concept: 'eat hot_dog'
2748 | expected:'A' | got:'A' | concept: 'eat orange'
2749 | expected:'D' | got:'B' | concept: 'eat orange'
2750 | expected:'A' | got:'A' | concept: 'eat orange'
2751 | expected:'C' | got:'C' | concept: 'eat orange'
2752 | expected:'B' | got:'B' | concept: 'sit_on motorcycle'
2753 | expected:'D' | got:'D' | concept: 'sit_on motorcycle'
2754 | expected:'A' | got:'D' | concept: 'sit_on motorcycle'
2755 | expected:'A' | got:'C' | concept: 'sit_on motorcycle'
2756 | expected:'D' | got:'D' | concept: 'push motorcycle'
2757 | expected:'C' | got:'C' | concept: 'push motorcycle'
2758 | expected:'D' | got:'D' | concept: 'push motorcycle'
2759 | expected:'A' | got:'A' | concept: 'push motorcycle'
2760 | expected:'B' | got:'C' | concept: 'ride motorcycle'
2761 | expected:'A' | got:'A' | concept: 'ride motorcycle'
2762 | expected:'D' | got:'D' | concept: 'ride motorcycle'
2763 | expected:'D' | got:'D' | concept: 'ride motorcycle'
2764 | expected:'C' | got:'C' | concept: 'ride horse'
2765 | expected:'D' | got:'D' | concept: 'ride horse'
2766 | expected:'C' | got:'C' | concept: 'ride horse'
2767 | expected:'A' | got:'A' | concept: 'ride horse'
2768 | expected:'A' | got:'A' | concept: 'wash bicycle'
2769 | expected:'C' | got:'C' | concept: 'wash bicycle'
2770 | expected:'A' | got:'A' | concept: 'wash bicycle'
2771 | expected:'B' | got:'B' | concept: 'wash bicycle'
2772 | expected:'C' | got:'A' | concept: 'wash car'
2773 | expected:'A' | got:'A' | concept: 'wash car'
2774 | expected:'A' | got:'A' | concept: 'wash car'
2775 | expected:'A' | got:'A' | concept: 'wash car'
2776 | expected:'A' | got:'A' | concept: 'drive car'
2777 | expected:'C' | got:'C' | concept: 'drive car'
2778 | expected:'C' | got:'C' | concept: 'drive car'
2779 | expected:'C' | got:'C' | concept: 'drive car'
2780 | expected:'C' | got:'D' | concept: 'drive train'
2781 | expected:'B' | got:'C' | concept: 'drive train'
2782 | expected:'B' | got:'B' | concept: 'drive train'
2783 | expected:'B' | got:'B' | concept: 'drive train'
2784 | expected:'B' | got:'B' | concept: 'wear tie'
2785 | expected:'D' | got:'D' | concept: 'wear tie'
2786 | expected:'A' | got:'A' | concept: 'wear tie'
2787 | expected:'D' | got:'D' | concept: 'wear tie'
2788 | expected:'A' | got:'A' | concept: 'control tv'
2789 | expected:'A' | got:'A' | concept: 'control tv'
2790 | expected:'C' | got:'C' | concept: 'control tv'
2791 | expected:'B' | got:'A' | concept: 'control tv'
2792 | expected:'A' | got:'A' | concept: 'watch tv'
2793 | expected:'C' | got:'A' | concept: 'watch tv'
2794 | expected:'A' | got:'A' | concept: 'watch tv'
2795 | expected:'B' | got:'C' | concept: 'watch tv'
2796 | expected:'B' | got:'B' | concept: 'grind skateboard'
2797 | expected:'D' | got:'D' | concept: 'grind skateboard'
2798 | expected:'B' | got:'B' | concept: 'grind skateboard'
2799 | expected:'A' | got:'A' | concept: 'grind skateboard'
2800 | expected:'D' | got:'C' | concept: 'hold scissors'
2801 | expected:'A' | got:'A' | concept: 'hold scissors'
2802 | expected:'A' | got:'D' | concept: 'hold scissors'
2803 | expected:'D' | got:'C' | concept: 'hold scissors'
2804 | expected:'D' | got:'D' | concept: 'wield knife'
2805 | expected:'D' | got:'C' | concept: 'wield knife'
2806 | expected:'C' | got:'C' | concept: 'wield knife'
2807 | expected:'C' | got:'B' | concept: 'wield knife'
2808 | expected:'D' | got:'D' | concept: 'cut_with scissors'
2809 | expected:'D' | got:'D' | concept: 'cut_with scissors'
2810 | expected:'B' | got:'C' | concept: 'cut_with scissors'
2811 | expected:'D' | got:'D' | concept: 'cut_with scissors'
2812 | expected:'A' | got:'A' | concept: 'cut_with knife'
2813 | expected:'C' | got:'C' | concept: 'cut_with knife'
2814 | expected:'C' | got:'C' | concept: 'cut_with knife'
2815 | expected:'A' | got:'A' | concept: 'cut_with knife'
2816 | expected:'D' | got:'D' | concept: 'sit_on chair'
2817 | expected:'D' | got:'D' | concept: 'sit_on chair'
2818 | expected:'A' | got:'A' | concept: 'sit_on chair'
2819 | expected:'A' | got:'A' | concept: 'sit_on chair'
2820 | expected:'C' | got:'C' | concept: 'repair truck'
2821 | expected:'B' | got:'A' | concept: 'repair truck'
2822 | expected:'B' | got:'B' | concept: 'repair truck'
2823 | expected:'B' | got:'B' | concept: 'repair truck'
2824 | expected:'C' | got:'C' | concept: 'sit_on truck'
2825 | expected:'D' | got:'D' | concept: 'sit_on truck'
2826 | expected:'C' | got:'A' | concept: 'sit_on truck'
2827 | expected:'C' | got:'C' | concept: 'sit_on truck'
2828 | expected:'B' | got:'B' | concept: 'sit_on bed'
2829 | expected:'B' | got:'B' | concept: 'sit_on bed'
2830 | expected:'C' | got:'C' | concept: 'sit_on bed'
2831 | expected:'B' | got:'B' | concept: 'sit_on bed'
2832 | expected:'D' | got:'D' | concept: 'pet horse'
2833 | expected:'D' | got:'D' | concept: 'pet horse'
2834 | expected:'A' | got:'A' | concept: 'pet horse'
2835 | expected:'B' | got:'C' | concept: 'pet horse'
2836 | expected:'B' | got:'B' | concept: 'kiss horse'
2837 | expected:'C' | got:'C' | concept: 'kiss horse'
2838 | expected:'B' | got:'B' | concept: 'kiss horse'
2839 | expected:'C' | got:'C' | concept: 'kiss horse'
2840 | expected:'C' | got:'C' | concept: 'ride horse'
2841 | expected:'B' | got:'B' | concept: 'ride horse'
2842 | expected:'C' | got:'C' | concept: 'ride horse'
2843 | expected:'B' | got:'B' | concept: 'ride horse'
2844 | expected:'C' | got:'C' | concept: 'hug horse'
2845 | expected:'A' | got:'B' | concept: 'hug horse'
2846 | expected:'D' | got:'D' | concept: 'hug horse'
2847 | expected:'C' | got:'D' | concept: 'hug horse'
2848 | expected:'B' | got:'B' | concept: 'clean toilet'
2849 | expected:'B' | got:'B' | concept: 'clean toilet'
2850 | expected:'B' | got:'B' | concept: 'clean toilet'
2851 | expected:'D' | got:'D' | concept: 'clean toilet'
2852 | expected:'C' | got:'C' | concept: 'inspect oven'
2853 | expected:'D' | got:'C' | concept: 'inspect oven'
2854 | expected:'B' | got:'A' | concept: 'inspect oven'
2855 | expected:'D' | got:'C' | concept: 'inspect oven'
2856 | expected:'A' | got:'A' | concept: 'clean oven'
2857 | expected:'A' | got:'A' | concept: 'clean oven'
2858 | expected:'C' | got:'C' | concept: 'clean oven'
2859 | expected:'C' | got:'C' | concept: 'clean oven'
2860 | expected:'D' | got:'A' | concept: 'clean keyboard'
2861 | expected:'C' | got:'C' | concept: 'clean keyboard'
2862 | expected:'C' | got:'C' | concept: 'clean keyboard'
2863 | expected:'D' | got:'A' | concept: 'clean keyboard'
2864 | expected:'C' | got:'A' | concept: 'wield knife'
2865 | expected:'A' | got:'A' | concept: 'wield knife'
2866 | expected:'B' | got:'B' | concept: 'wield knife'
2867 | expected:'C' | got:'C' | concept: 'wield knife'
2868 | expected:'C' | got:'C' | concept: 'cut_with knife'
2869 | expected:'C' | got:'C' | concept: 'cut_with knife'
2870 | expected:'D' | got:'D' | concept: 'cut_with knife'
2871 | expected:'A' | got:'A' | concept: 'cut_with knife'
2872 | expected:'C' | got:'A' | concept: 'lick knife'
2873 | expected:'D' | got:'C' | concept: 'lick knife'
2874 | expected:'D' | got:'C' | concept: 'lick knife'
2875 | expected:'A' | got:'A' | concept: 'lick knife'
2876 | expected:'D' | got:'A' | concept: 'stick knife'
2877 | expected:'A' | got:'D' | concept: 'stick knife'
2878 | expected:'B' | got:'D' | concept: 'stick knife'
2879 | expected:'B' | got:'A' | concept: 'stick knife'
2880 | expected:'B' | got:'B' | concept: 'ride skateboard'
2881 | expected:'C' | got:'C' | concept: 'ride skateboard'
2882 | expected:'B' | got:'B' | concept: 'ride skateboard'
2883 | expected:'C' | got:'C' | concept: 'ride skateboard'
2884 | expected:'B' | got:'B' | concept: 'ride snowboard'
2885 | expected:'D' | got:'D' | concept: 'ride snowboard'
2886 | expected:'B' | got:'B' | concept: 'ride snowboard'
2887 | expected:'A' | got:'A' | concept: 'ride snowboard'
2888 | expected:'B' | got:'B' | concept: 'ride surfboard'
2889 | expected:'A' | got:'A' | concept: 'ride surfboard'
2890 | expected:'D' | got:'D' | concept: 'ride surfboard'
2891 | expected:'A' | got:'A' | concept: 'ride surfboard'
2892 | expected:'C' | got:'C' | concept: 'ride elephant'
2893 | expected:'A' | got:'A' | concept: 'ride elephant'
2894 | expected:'B' | got:'B' | concept: 'ride elephant'
2895 | expected:'B' | got:'B' | concept: 'ride elephant'
2896 | expected:'A' | got:'A' | concept: 'lie_on bed'
2897 | expected:'A' | got:'A' | concept: 'lie_on bed'
2898 | expected:'A' | got:'A' | concept: 'lie_on bed'
2899 | expected:'D' | got:'B' | concept: 'lie_on bed'
2900 | expected:'B' | got:'B' | concept: 'sit_on couch'
2901 | expected:'A' | got:'A' | concept: 'sit_on couch'
2902 | expected:'C' | got:'C' | concept: 'sit_on couch'
2903 | expected:'C' | got:'C' | concept: 'sit_on couch'
2904 | expected:'B' | got:'C' | concept: 'sit_on bed'
2905 | expected:'C' | got:'B' | concept: 'sit_on bed'
2906 | expected:'B' | got:'B' | concept: 'sit_on bed'
2907 | expected:'A' | got:'A' | concept: 'sit_on bed'
2908 | expected:'C' | got:'C' | concept: 'sit_on motorcycle'
2909 | expected:'A' | got:'A' | concept: 'sit_on motorcycle'
2910 | expected:'B' | got:'B' | concept: 'sit_on motorcycle'
2911 | expected:'A' | got:'A' | concept: 'sit_on motorcycle'
2912 | expected:'C' | got:'C' | concept: 'hold skateboard'
2913 | expected:'C' | got:'C' | concept: 'hold skateboard'
2914 | expected:'D' | got:'D' | concept: 'hold skateboard'
2915 | expected:'C' | got:'C' | concept: 'hold skateboard'
2916 | expected:'D' | got:'D' | concept: 'hold dog'
2917 | expected:'A' | got:'A' | concept: 'hold dog'
2918 | expected:'A' | got:'A' | concept: 'hold dog'
2919 | expected:'D' | got:'D' | concept: 'hold dog'
2920 | expected:'B' | got:'B' | concept: 'hold bottle'
2921 | expected:'B' | got:'B' | concept: 'hold bottle'
2922 | expected:'C' | got:'C' | concept: 'hold bottle'
2923 | expected:'C' | got:'C' | concept: 'hold bottle'
2924 | expected:'C' | got:'B' | concept: 'hold kite'
2925 | expected:'D' | got:'D' | concept: 'hold kite'
2926 | expected:'A' | got:'A' | concept: 'hold kite'
2927 | expected:'C' | got:'C' | concept: 'hold kite'
2928 | expected:'A' | got:'B' | concept: 'cut pizza'
2929 | expected:'B' | got:'D' | concept: 'cut pizza'
2930 | expected:'C' | got:'C' | concept: 'cut pizza'
2931 | expected:'D' | got:'D' | concept: 'cut pizza'
2932 | expected:'C' | got:'D' | concept: 'hold pizza'
2933 | expected:'B' | got:'B' | concept: 'hold pizza'
2934 | expected:'A' | got:'A' | concept: 'hold pizza'
2935 | expected:'C' | got:'D' | concept: 'hold pizza'
2936 | expected:'C' | got:'C' | concept: 'eat pizza'
2937 | expected:'C' | got:'C' | concept: 'eat pizza'
2938 | expected:'C' | got:'C' | concept: 'eat pizza'
2939 | expected:'D' | got:'D' | concept: 'eat pizza'
2940 | expected:'A' | got:'A' | concept: 'make pizza'
2941 | expected:'D' | got:'D' | concept: 'make pizza'
2942 | expected:'B' | got:'B' | concept: 'make pizza'
2943 | expected:'A' | got:'A' | concept: 'make pizza'
2944 | expected:'A' | got:'A' | concept: 'hold_and_about_to_eat apple'
2945 | expected:'C' | got:'C' | concept: 'hold_and_about_to_eat apple'
2946 | expected:'C' | got:'C' | concept: 'hold_and_about_to_eat apple'
2947 | expected:'A' | got:'A' | concept: 'hold_and_about_to_eat apple'
2948 | expected:'B' | got:'D' | concept: 'smell apple'
2949 | expected:'B' | got:'C' | concept: 'smell apple'
2950 | expected:'A' | got:'C' | concept: 'smell apple'
2951 | expected:'B' | got:'D' | concept: 'smell apple'
2952 | expected:'B' | got:'B' | concept: 'pick apple'
2953 | expected:'B' | got:'B' | concept: 'pick apple'
2954 | expected:'D' | got:'D' | concept: 'pick apple'
2955 | expected:'A' | got:'A' | concept: 'pick apple'
2956 | expected:'C' | got:'C' | concept: 'peel_or_cut apple'
2957 | expected:'D' | got:'D' | concept: 'peel_or_cut apple'
2958 | expected:'B' | got:'B' | concept: 'peel_or_cut apple'
2959 | expected:'C' | got:'C' | concept: 'peel_or_cut apple'
2960 | expected:'C' | got:'C' | concept: 'inspect motorcycle'
2961 | expected:'A' | got:'A' | concept: 'inspect motorcycle'
2962 | expected:'A' | got:'A' | concept: 'inspect motorcycle'
2963 | expected:'D' | got:'D' | concept: 'inspect motorcycle'
2964 | expected:'D' | got:'D' | concept: 'ride motorcycle'
2965 | expected:'C' | got:'C' | concept: 'ride motorcycle'
2966 | expected:'C' | got:'A' | concept: 'ride motorcycle'
2967 | expected:'C' | got:'C' | concept: 'ride motorcycle'
2968 | expected:'C' | got:'A' | concept: 'turn motorcycle'
2969 | expected:'D' | got:'C' | concept: 'turn motorcycle'
2970 | expected:'B' | got:'C' | concept: 'turn motorcycle'
2971 | expected:'B' | got:'C' | concept: 'turn motorcycle'
2972 | expected:'A' | got:'B' | concept: 'straddle motorcycle'
2973 | expected:'B' | got:'D' | concept: 'straddle motorcycle'
2974 | expected:'C' | got:'C' | concept: 'straddle motorcycle'
2975 | expected:'D' | got:'C' | concept: 'straddle motorcycle'
2976 | expected:'C' | got:'C' | concept: 'lick knife'
2977 | expected:'A' | got:'A' | concept: 'lick knife'
2978 | expected:'B' | got:'B' | concept: 'lick knife'
2979 | expected:'C' | got:'C' | concept: 'lick knife'
2980 | expected:'B' | got:'B' | concept: 'hold knife'
2981 | expected:'C' | got:'C' | concept: 'hold knife'
2982 | expected:'C' | got:'C' | concept: 'hold knife'
2983 | expected:'C' | got:'C' | concept: 'hold knife'
2984 | expected:'D' | got:'D' | concept: 'cut_with knife'
2985 | expected:'A' | got:'B' | concept: 'cut_with knife'
2986 | expected:'A' | got:'A' | concept: 'cut_with knife'
2987 | expected:'C' | got:'C' | concept: 'cut_with knife'
2988 | expected:'B' | got:'A' | concept: 'wield knife'
2989 | expected:'A' | got:'D' | concept: 'wield knife'
2990 | expected:'D' | got:'C' | concept: 'wield knife'
2991 | expected:'D' | got:'C' | concept: 'wield knife'
2992 | expected:'C' | got:'C' | concept: 'open refrigerator'
2993 | expected:'C' | got:'C' | concept: 'open refrigerator'
2994 | expected:'A' | got:'A' | concept: 'open refrigerator'
2995 | expected:'C' | got:'C' | concept: 'open refrigerator'
2996 | expected:'D' | got:'A' | concept: 'open microwave'
2997 | expected:'B' | got:'A' | concept: 'open microwave'
2998 | expected:'D' | got:'A' | concept: 'open microwave'
2999 | expected:'C' | got:'A' | concept: 'open microwave'
3000 | expected:'C' | got:'C' | concept: 'operate microwave'
3001 | expected:'C' | got:'A' | concept: 'operate microwave'
3002 | expected:'D' | got:'D' | concept: 'operate microwave'
3003 | expected:'D' | got:'D' | concept: 'operate microwave'
3004 | expected:'C' | got:'C' | concept: 'clean microwave'
3005 | expected:'C' | got:'C' | concept: 'clean microwave'
3006 | expected:'D' | got:'D' | concept: 'clean microwave'
3007 | expected:'B' | got:'A' | concept: 'clean microwave'
3008 | expected:'B' | got:'C' | concept: 'hug dog'
3009 | expected:'B' | got:'D' | concept: 'hug dog'
3010 | expected:'B' | got:'A' | concept: 'hug dog'
3011 | expected:'B' | got:'C' | concept: 'hug dog'
3012 | expected:'B' | got:'B' | concept: 'kiss dog'
3013 | expected:'D' | got:'D' | concept: 'kiss dog'
3014 | expected:'C' | got:'C' | concept: 'kiss dog'
3015 | expected:'C' | got:'C' | concept: 'kiss dog'
3016 | expected:'C' | got:'C' | concept: 'hold dog'
3017 | expected:'A' | got:'A' | concept: 'hold dog'
3018 | expected:'D' | got:'D' | concept: 'hold dog'
3019 | expected:'D' | got:'C' | concept: 'hold dog'
3020 | expected:'A' | got:'A' | concept: 'walk dog'
3021 | expected:'D' | got:'D' | concept: 'walk dog'
3022 | expected:'B' | got:'B' | concept: 'walk dog'
3023 | expected:'B' | got:'B' | concept: 'walk dog'
3024 | expected:'B' | got:'B' | concept: 'talk_on_or_listen_to cell_phone'
3025 | expected:'D' | got:'D' | concept: 'talk_on_or_listen_to cell_phone'
3026 | expected:'B' | got:'B' | concept: 'talk_on_or_listen_to cell_phone'
3027 | expected:'C' | got:'C' | concept: 'talk_on_or_listen_to cell_phone'
3028 | expected:'D' | got:'B' | concept: 'hold cake'
3029 | expected:'C' | got:'A' | concept: 'hold cake'
3030 | expected:'A' | got:'A' | concept: 'hold cake'
3031 | expected:'D' | got:'A' | concept: 'hold cake'
3032 | expected:'C' | got:'C' | concept: 'hold cell_phone'
3033 | expected:'C' | got:'C' | concept: 'hold cell_phone'
3034 | expected:'C' | got:'C' | concept: 'hold cell_phone'
3035 | expected:'A' | got:'A' | concept: 'hold cell_phone'
3036 | expected:'D' | got:'B' | concept: 'read_like cell_phone'
3037 | expected:'C' | got:'D' | concept: 'read_like cell_phone'
3038 | expected:'B' | got:'C' | concept: 'read_like cell_phone'
3039 | expected:'A' | got:'D' | concept: 'read_like cell_phone'
3040 | expected:'D' | got:'D' | concept: 'hold dog'
3041 | expected:'D' | got:'D' | concept: 'hold dog'
3042 | expected:'C' | got:'C' | concept: 'hold dog'
3043 | expected:'B' | got:'B' | concept: 'hold dog'
3044 | expected:'D' | got:'D' | concept: 'hold laptop'
3045 | expected:'D' | got:'A' | concept: 'hold laptop'
3046 | expected:'D' | got:'D' | concept: 'hold laptop'
3047 | expected:'C' | got:'C' | concept: 'hold laptop'
3048 | expected:'D' | got:'D' | concept: 'hold scissors'
3049 | expected:'D' | got:'C' | concept: 'hold scissors'
3050 | expected:'C' | got:'C' | concept: 'hold scissors'
3051 | expected:'D' | got:'C' | concept: 'hold scissors'
3052 | expected:'C' | got:'C' | concept: 'hold apple'
3053 | expected:'B' | got:'B' | concept: 'hold apple'
3054 | expected:'B' | got:'B' | concept: 'hold apple'
3055 | expected:'D' | got:'D' | concept: 'hold apple'
3056 | expected:'C' | got:'C' | concept: 'ride surfboard'
3057 | expected:'C' | got:'C' | concept: 'ride surfboard'
3058 | expected:'B' | got:'B' | concept: 'ride surfboard'
3059 | expected:'D' | got:'D' | concept: 'ride surfboard'
3060 | expected:'A' | got:'A' | concept: 'ride bicycle'
3061 | expected:'B' | got:'B' | concept: 'ride bicycle'
3062 | expected:'C' | got:'C' | concept: 'ride bicycle'
3063 | expected:'A' | got:'A' | concept: 'ride bicycle'
3064 | expected:'B' | got:'B' | concept: 'ride skateboard'
3065 | expected:'B' | got:'B' | concept: 'ride skateboard'
3066 | expected:'B' | got:'B' | concept: 'ride skateboard'
3067 | expected:'B' | got:'B' | concept: 'ride skateboard'
3068 | expected:'C' | got:'C' | concept: 'ride elephant'
3069 | expected:'A' | got:'A' | concept: 'ride elephant'
3070 | expected:'D' | got:'D' | concept: 'ride elephant'
3071 | expected:'C' | got:'C' | concept: 'ride elephant'
3072 | expected:'C' | got:'D' | concept: 'straddle motorcycle'
3073 | expected:'A' | got:'D' | concept: 'straddle motorcycle'
3074 | expected:'B' | got:'D' | concept: 'straddle motorcycle'
3075 | expected:'D' | got:'D' | concept: 'straddle motorcycle'
3076 | expected:'A' | got:'A' | concept: 'jump skis'
3077 | expected:'B' | got:'B' | concept: 'jump skis'
3078 | expected:'C' | got:'C' | concept: 'jump skis'
3079 | expected:'C' | got:'C' | concept: 'jump skis'
3080 | expected:'D' | got:'D' | concept: 'ride motorcycle'
3081 | expected:'D' | got:'D' | concept: 'ride motorcycle'
3082 | expected:'B' | got:'B' | concept: 'ride motorcycle'
3083 | expected:'A' | got:'A' | concept: 'ride motorcycle'
3084 | expected:'B' | got:'B' | concept: 'jump motorcycle'
3085 | expected:'C' | got:'C' | concept: 'jump motorcycle'
3086 | expected:'C' | got:'C' | concept: 'jump motorcycle'
3087 | expected:'B' | got:'B' | concept: 'jump motorcycle'
3088 | expected:'C' | got:'C' | concept: 'read book'
3089 | expected:'A' | got:'C' | concept: 'read book'
3090 | expected:'B' | got:'B' | concept: 'read book'
3091 | expected:'B' | got:'B' | concept: 'read book'
3092 | expected:'C' | got:'C' | concept: 'hold book'
3093 | expected:'C' | got:'C' | concept: 'hold book'
3094 | expected:'C' | got:'C' | concept: 'hold book'
3095 | expected:'A' | got:'A' | concept: 'hold book'
3096 | expected:'D' | got:'A' | concept: 'hold laptop'
3097 | expected:'B' | got:'B' | concept: 'hold laptop'
3098 | expected:'B' | got:'B' | concept: 'hold laptop'
3099 | expected:'C' | got:'C' | concept: 'hold laptop'
3100 | expected:'A' | got:'C' | concept: 'read laptop'
3101 | expected:'A' | got:'A' | concept: 'read laptop'
3102 | expected:'D' | got:'B' | concept: 'read laptop'
3103 | expected:'D' | got:'A' | concept: 'read laptop'
3104 | expected:'B' | got:'B' | concept: 'ride motorcycle'
3105 | expected:'B' | got:'B' | concept: 'ride motorcycle'
3106 | expected:'D' | got:'D' | concept: 'ride motorcycle'
3107 | expected:'A' | got:'A' | concept: 'ride motorcycle'
3108 | expected:'B' | got:'D' | concept: 'push motorcycle'
3109 | expected:'A' | got:'A' | concept: 'push motorcycle'
3110 | expected:'A' | got:'A' | concept: 'push motorcycle'
3111 | expected:'C' | got:'C' | concept: 'push motorcycle'
3112 | expected:'D' | got:'D' | concept: 'inspect motorcycle'
3113 | expected:'C' | got:'C' | concept: 'inspect motorcycle'
3114 | expected:'D' | got:'D' | concept: 'inspect motorcycle'
3115 | expected:'A' | got:'A' | concept: 'inspect motorcycle'
3116 | expected:'D' | got:'D' | concept: 'ride elephant'
3117 | expected:'D' | got:'D' | concept: 'ride elephant'
3118 | expected:'B' | got:'B' | concept: 'ride elephant'
3119 | expected:'A' | got:'A' | concept: 'ride elephant'
3120 | expected:'B' | got:'C' | concept: 'kiss horse'
3121 | expected:'B' | got:'A' | concept: 'kiss horse'
3122 | expected:'B' | got:'A' | concept: 'kiss horse'
3123 | expected:'A' | got:'C' | concept: 'kiss horse'
3124 | expected:'D' | got:'D' | concept: 'pet horse'
3125 | expected:'A' | got:'A' | concept: 'pet horse'
3126 | expected:'C' | got:'C' | concept: 'pet horse'
3127 | expected:'C' | got:'C' | concept: 'pet horse'
3128 | expected:'B' | got:'B' | concept: 'jump skis'
3129 | expected:'C' | got:'C' | concept: 'jump skis'
3130 | expected:'B' | got:'B' | concept: 'jump skis'
3131 | expected:'C' | got:'C' | concept: 'jump skis'
3132 | expected:'D' | got:'D' | concept: 'jump horse'
3133 | expected:'C' | got:'C' | concept: 'jump horse'
3134 | expected:'B' | got:'B' | concept: 'jump horse'
3135 | expected:'D' | got:'D' | concept: 'jump horse'
3136 | expected:'B' | got:'B' | concept: 'hold dog'
3137 | expected:'D' | got:'D' | concept: 'hold dog'
3138 | expected:'A' | got:'A' | concept: 'hold dog'
3139 | expected:'D' | got:'A' | concept: 'hold dog'
3140 | expected:'D' | got:'D' | concept: 'walk dog'
3141 | expected:'C' | got:'C' | concept: 'walk dog'
3142 | expected:'D' | got:'D' | concept: 'walk dog'
3143 | expected:'B' | got:'B' | concept: 'walk dog'
3144 | expected:'A' | got:'A' | concept: 'hold kite'
3145 | expected:'B' | got:'B' | concept: 'hold kite'
3146 | expected:'D' | got:'D' | concept: 'hold kite'
3147 | expected:'D' | got:'D' | concept: 'hold kite'
3148 | expected:'A' | got:'A' | concept: 'hold cake'
3149 | expected:'C' | got:'C' | concept: 'hold cake'
3150 | expected:'A' | got:'C' | concept: 'hold cake'
3151 | expected:'C' | got:'C' | concept: 'hold cake'
3152 | expected:'A' | got:'A' | concept: 'hold horse'
3153 | expected:'A' | got:'A' | concept: 'hold horse'
3154 | expected:'B' | got:'B' | concept: 'hold horse'
3155 | expected:'C' | got:'C' | concept: 'hold horse'
3156 | expected:'A' | got:'A' | concept: 'hold wine_glass'
3157 | expected:'B' | got:'B' | concept: 'hold wine_glass'
3158 | expected:'A' | got:'A' | concept: 'hold wine_glass'
3159 | expected:'D' | got:'D' | concept: 'hold wine_glass'
3160 | expected:'C' | got:'B' | concept: 'hold bottle'
3161 | expected:'B' | got:'B' | concept: 'hold bottle'
3162 | expected:'D' | got:'D' | concept: 'hold bottle'
3163 | expected:'C' | got:'A' | concept: 'hold bottle'
3164 | expected:'B' | got:'B' | concept: 'hold hot_dog'
3165 | expected:'C' | got:'C' | concept: 'hold hot_dog'
3166 | expected:'A' | got:'A' | concept: 'hold hot_dog'
3167 | expected:'B' | got:'B' | concept: 'hold hot_dog'
3168 | expected:'D' | got:'D' | concept: 'jump skateboard'
3169 | expected:'B' | got:'B' | concept: 'jump skateboard'
3170 | expected:'B' | got:'B' | concept: 'jump skateboard'
3171 | expected:'B' | got:'B' | concept: 'jump skateboard'
3172 | expected:'A' | got:'A' | concept: 'hold pizza'
3173 | expected:'B' | got:'B' | concept: 'hold pizza'
3174 | expected:'C' | got:'C' | concept: 'hold pizza'
3175 | expected:'D' | got:'D' | concept: 'hold pizza'
3176 | expected:'C' | got:'C' | concept: 'hold skateboard'
3177 | expected:'A' | got:'A' | concept: 'hold skateboard'
3178 | expected:'A' | got:'A' | concept: 'hold skateboard'
3179 | expected:'D' | got:'D' | concept: 'hold skateboard'
3180 | expected:'A' | got:'A' | concept: 'hold apple'
3181 | expected:'A' | got:'A' | concept: 'hold apple'
3182 | expected:'C' | got:'C' | concept: 'hold apple'
3183 | expected:'B' | got:'B' | concept: 'hold apple'
3184 | expected:'A' | got:'A' | concept: 'jump bicycle'
3185 | expected:'C' | got:'C' | concept: 'jump bicycle'
3186 | expected:'D' | got:'D' | concept: 'jump bicycle'
3187 | expected:'C' | got:'C' | concept: 'jump bicycle'
3188 | expected:'D' | got:'D' | concept: 'jump motorcycle'
3189 | expected:'A' | got:'A' | concept: 'jump motorcycle'
3190 | expected:'D' | got:'D' | concept: 'jump motorcycle'
3191 | expected:'B' | got:'B' | concept: 'jump motorcycle'
3192 | expected:'C' | got:'C' | concept: 'jump skateboard'
3193 | expected:'A' | got:'A' | concept: 'jump skateboard'
3194 | expected:'C' | got:'C' | concept: 'jump skateboard'
3195 | expected:'A' | got:'A' | concept: 'jump skateboard'
3196 | expected:'D' | got:'D' | concept: 'jump skis'
3197 | expected:'C' | got:'C' | concept: 'jump skis'
3198 | expected:'B' | got:'B' | concept: 'jump skis'
3199 | expected:'C' | got:'C' | concept: 'jump skis'
3200 | expected:'C' | got:'C' | concept: 'clean refrigerator'
3201 | expected:'C' | got:'C' | concept: 'clean refrigerator'
3202 | expected:'B' | got:'B' | concept: 'clean refrigerator'
3203 | expected:'B' | got:'B' | concept: 'clean refrigerator'
3204 | expected:'A' | got:'A' | concept: 'clean keyboard'
3205 | expected:'A' | got:'A' | concept: 'clean keyboard'
3206 | expected:'D' | got:'A' | concept: 'clean keyboard'
3207 | expected:'B' | got:'B' | concept: 'clean keyboard'
3208 | expected:'A' | got:'A' | concept: 'open refrigerator'
3209 | expected:'B' | got:'B' | concept: 'open refrigerator'
3210 | expected:'B' | got:'B' | concept: 'open refrigerator'
3211 | expected:'A' | got:'A' | concept: 'open refrigerator'
3212 | expected:'C' | got:'C' | concept: 'clean microwave'
3213 | expected:'D' | got:'D' | concept: 'clean microwave'
3214 | expected:'D' | got:'A' | concept: 'clean microwave'
3215 | expected:'A' | got:'A' | concept: 'clean microwave'
3216 | expected:'A' | got:'A' | concept: 'hold book'
3217 | expected:'C' | got:'C' | concept: 'hold book'
3218 | expected:'A' | got:'A' | concept: 'hold book'
3219 | expected:'B' | got:'B' | concept: 'hold book'
3220 | expected:'B' | got:'D' | concept: 'read laptop'
3221 | expected:'A' | got:'C' | concept: 'read laptop'
3222 | expected:'D' | got:'C' | concept: 'read laptop'
3223 | expected:'B' | got:'D' | concept: 'read laptop'
3224 | expected:'C' | got:'C' | concept: 'read book'
3225 | expected:'D' | got:'A' | concept: 'read book'
3226 | expected:'B' | got:'D' | concept: 'read book'
3227 | expected:'C' | got:'C' | concept: 'read book'
3228 | expected:'C' | got:'C' | concept: 'type_on laptop'
3229 | expected:'B' | got:'B' | concept: 'type_on laptop'
3230 | expected:'B' | got:'B' | concept: 'type_on laptop'
3231 | expected:'B' | got:'B' | concept: 'type_on laptop'
3232 | expected:'A' | got:'A' | concept: 'kiss person'
3233 | expected:'D' | got:'D' | concept: 'kiss person'
3234 | expected:'A' | got:'D' | concept: 'kiss person'
3235 | expected:'A' | got:'A' | concept: 'kiss person'
3236 | expected:'B' | got:'B' | concept: 'greet person'
3237 | expected:'B' | got:'B' | concept: 'greet person'
3238 | expected:'D' | got:'D' | concept: 'greet person'
3239 | expected:'C' | got:'C' | concept: 'greet person'
3240 | expected:'D' | got:'D' | concept: 'hug horse'
3241 | expected:'D' | got:'D' | concept: 'hug horse'
3242 | expected:'B' | got:'B' | concept: 'hug horse'
3243 | expected:'B' | got:'D' | concept: 'hug horse'
3244 | expected:'A' | got:'A' | concept: 'hug person'
3245 | expected:'D' | got:'D' | concept: 'hug person'
3246 | expected:'B' | got:'B' | concept: 'hug person'
3247 | expected:'B' | got:'B' | concept: 'hug person'
3248 | expected:'C' | got:'B' | concept: 'cut cake'
3249 | expected:'A' | got:'A' | concept: 'cut cake'
3250 | expected:'A' | got:'A' | concept: 'cut cake'
3251 | expected:'B' | got:'B' | concept: 'cut cake'
3252 | expected:'A' | got:'A' | concept: 'hold pizza'
3253 | expected:'B' | got:'C' | concept: 'hold pizza'
3254 | expected:'D' | got:'C' | concept: 'hold pizza'
3255 | expected:'C' | got:'C' | concept: 'hold pizza'
3256 | expected:'C' | got:'C' | concept: 'cut pizza'
3257 | expected:'D' | got:'D' | concept: 'cut pizza'
3258 | expected:'B' | got:'B' | concept: 'cut pizza'
3259 | expected:'B' | got:'B' | concept: 'cut pizza'
3260 | expected:'D' | got:'A' | concept: 'make pizza'
3261 | expected:'D' | got:'C' | concept: 'make pizza'
3262 | expected:'B' | got:'B' | concept: 'make pizza'
3263 | expected:'A' | got:'A' | concept: 'make pizza'
3264 | expected:'A' | got:'INVALID' | concept: 'hold sports_ball'
3265 | expected:'B' | got:'B' | concept: 'hold sports_ball'
3266 | expected:'A' | got:'A' | concept: 'hold sports_ball'
3267 | expected:'B' | got:'B' | concept: 'hold sports_ball'
3268 | expected:'D' | got:'D' | concept: 'hold horse'
3269 | expected:'D' | got:'D' | concept: 'hold horse'
3270 | expected:'C' | got:'C' | concept: 'hold horse'
3271 | expected:'B' | got:'B' | concept: 'hold horse'
3272 | expected:'A' | got:'A' | concept: 'hold cake'
3273 | expected:'C' | got:'C' | concept: 'hold cake'
3274 | expected:'A' | got:'A' | concept: 'hold cake'
3275 | expected:'A' | got:'C' | concept: 'hold cake'
3276 | expected:'D' | got:'A' | concept: 'hold apple'
3277 | expected:'A' | got:'A' | concept: 'hold apple'
3278 | expected:'D' | got:'D' | concept: 'hold apple'
3279 | expected:'A' | got:'A' | concept: 'hold apple'
3280 | expected:'B' | got:'C' | concept: 'hold spoon'
3281 | expected:'D' | got:'B' | concept: 'hold spoon'
3282 | expected:'B' | got:'C' | concept: 'hold spoon'
3283 | expected:'C' | got:'C' | concept: 'hold spoon'
3284 | expected:'D' | got:'D' | concept: 'hold donut'
3285 | expected:'D' | got:'D' | concept: 'hold donut'
3286 | expected:'A' | got:'C' | concept: 'hold donut'
3287 | expected:'C' | got:'C' | concept: 'hold donut'
3288 | expected:'C' | got:'C' | concept: 'lick_or_sip spoon'
3289 | expected:'D' | got:'B' | concept: 'lick_or_sip spoon'
3290 | expected:'D' | got:'C' | concept: 'lick_or_sip spoon'
3291 | expected:'A' | got:'A' | concept: 'lick_or_sip spoon'
3292 | expected:'C' | got:'C' | concept: 'hold remote'
3293 | expected:'C' | got:'C' | concept: 'hold remote'
3294 | expected:'C' | got:'C' | concept: 'hold remote'
3295 | expected:'C' | got:'C' | concept: 'hold remote'
3296 | expected:'B' | got:'B' | concept: 'wash bicycle'
3297 | expected:'D' | got:'D' | concept: 'wash bicycle'
3298 | expected:'D' | got:'D' | concept: 'wash bicycle'
3299 | expected:'A' | got:'D' | concept: 'wash bicycle'
3300 | expected:'B' | got:'B' | concept: 'drive car'
3301 | expected:'C' | got:'C' | concept: 'drive car'
3302 | expected:'C' | got:'C' | concept: 'drive car'
3303 | expected:'A' | got:'A' | concept: 'drive car'
3304 | expected:'D' | got:'D' | concept: 'wash car'
3305 | expected:'D' | got:'D' | concept: 'wash car'
3306 | expected:'C' | got:'C' | concept: 'wash car'
3307 | expected:'A' | got:'A' | concept: 'wash car'
3308 | expected:'B' | got:'A' | concept: 'wash motorcycle'
3309 | expected:'C' | got:'C' | concept: 'wash motorcycle'
3310 | expected:'D' | got:'A' | concept: 'wash motorcycle'
3311 | expected:'A' | got:'A' | concept: 'wash motorcycle'
3312 | expected:'C' | got:'C' | concept: 'lie_on couch'
3313 | expected:'A' | got:'A' | concept: 'lie_on couch'
3314 | expected:'A' | got:'B' | concept: 'lie_on couch'
3315 | expected:'C' | got:'C' | concept: 'lie_on couch'
3316 | expected:'D' | got:'D' | concept: 'sit_on couch'
3317 | expected:'A' | got:'A' | concept: 'sit_on couch'
3318 | expected:'B' | got:'B' | concept: 'sit_on couch'
3319 | expected:'D' | got:'D' | concept: 'sit_on couch'
3320 | expected:'C' | got:'B' | concept: 'lie_on bed'
3321 | expected:'B' | got:'B' | concept: 'lie_on bed'
3322 | expected:'D' | got:'D' | concept: 'lie_on bed'
3323 | expected:'C' | got:'C' | concept: 'lie_on bed'
3324 | expected:'C' | got:'C' | concept: 'lie_on bench'
3325 | expected:'D' | got:'B' | concept: 'lie_on bench'
3326 | expected:'D' | got:'B' | concept: 'lie_on bench'
3327 | expected:'B' | got:'B' | concept: 'lie_on bench'
3328 | expected:'D' | got:'D' | concept: 'ride bicycle'
3329 | expected:'D' | got:'D' | concept: 'ride bicycle'
3330 | expected:'A' | got:'A' | concept: 'ride bicycle'
3331 | expected:'D' | got:'D' | concept: 'ride bicycle'
3332 | expected:'B' | got:'B' | concept: 'ride skateboard'
3333 | expected:'C' | got:'C' | concept: 'ride skateboard'
3334 | expected:'C' | got:'C' | concept: 'ride skateboard'
3335 | expected:'D' | got:'D' | concept: 'ride skateboard'
3336 | expected:'A' | got:'A' | concept: 'ride skis'
3337 | expected:'C' | got:'C' | concept: 'ride skis'
3338 | expected:'A' | got:'A' | concept: 'ride skis'
3339 | expected:'A' | got:'A' | concept: 'ride skis'
3340 | expected:'C' | got:'D' | concept: 'straddle bicycle'
3341 | expected:'B' | got:'C' | concept: 'straddle bicycle'
3342 | expected:'D' | got:'A' | concept: 'straddle bicycle'
3343 | expected:'C' | got:'A' | concept: 'straddle bicycle'
3344 | expected:'C' | got:'B' | concept: 'hug dog'
3345 | expected:'B' | got:'B' | concept: 'hug dog'
3346 | expected:'D' | got:'C' | concept: 'hug dog'
3347 | expected:'B' | got:'B' | concept: 'hug dog'
3348 | expected:'B' | got:'B' | concept: 'hug horse'
3349 | expected:'C' | got:'C' | concept: 'hug horse'
3350 | expected:'C' | got:'C' | concept: 'hug horse'
3351 | expected:'D' | got:'D' | concept: 'hug horse'
3352 | expected:'B' | got:'B' | concept: 'train dog'
3353 | expected:'B' | got:'B' | concept: 'train dog'
3354 | expected:'C' | got:'D' | concept: 'train dog'
3355 | expected:'D' | got:'D' | concept: 'train dog'
3356 | expected:'C' | got:'C' | concept: 'hold dog'
3357 | expected:'D' | got:'B' | concept: 'hold dog'
3358 | expected:'C' | got:'B' | concept: 'hold dog'
3359 | expected:'A' | got:'C' | concept: 'hold dog'
3360 | expected:'B' | got:'B' | concept: 'control tv'
3361 | expected:'B' | got:'A' | concept: 'control tv'
3362 | expected:'A' | got:'A' | concept: 'control tv'
3363 | expected:'C' | got:'C' | concept: 'control tv'
3364 | expected:'C' | got:'C' | concept: 'grind skateboard'
3365 | expected:'D' | got:'D' | concept: 'grind skateboard'
3366 | expected:'D' | got:'D' | concept: 'grind skateboard'
3367 | expected:'D' | got:'D' | concept: 'grind skateboard'
3368 | expected:'D' | got:'D' | concept: 'watch tv'
3369 | expected:'C' | got:'C' | concept: 'watch tv'
3370 | expected:'C' | got:'A' | concept: 'watch tv'
3371 | expected:'A' | got:'A' | concept: 'watch tv'
3372 | expected:'A' | got:'A' | concept: 'push motorcycle'
3373 | expected:'C' | got:'C' | concept: 'push motorcycle'
3374 | expected:'B' | got:'B' | concept: 'push motorcycle'
3375 | expected:'B' | got:'B' | concept: 'push motorcycle'
3376 | expected:'B' | got:'C' | concept: 'sit_at dining_table'
3377 | expected:'D' | got:'D' | concept: 'sit_at dining_table'
3378 | expected:'A' | got:'A' | concept: 'sit_at dining_table'
3379 | expected:'C' | got:'C' | concept: 'sit_at dining_table'
3380 | expected:'C' | got:'C' | concept: 'eat hot_dog'
3381 | expected:'D' | got:'D' | concept: 'eat hot_dog'
3382 | expected:'D' | got:'C' | concept: 'eat hot_dog'
3383 | expected:'B' | got:'B' | concept: 'eat hot_dog'
3384 | expected:'D' | got:'D' | concept: 'eat_at dining_table'
3385 | expected:'C' | got:'C' | concept: 'eat_at dining_table'
3386 | expected:'A' | got:'A' | concept: 'eat_at dining_table'
3387 | expected:'D' | got:'D' | concept: 'eat_at dining_table'
3388 | expected:'C' | got:'C' | concept: 'make pizza'
3389 | expected:'B' | got:'B' | concept: 'make pizza'
3390 | expected:'B' | got:'A' | concept: 'make pizza'
3391 | expected:'D' | got:'D' | concept: 'make pizza'
3392 | expected:'A' | got:'A' | concept: 'ride horse'
3393 | expected:'C' | got:'C' | concept: 'ride horse'
3394 | expected:'C' | got:'C' | concept: 'ride horse'
3395 | expected:'B' | got:'B' | concept: 'ride horse'
3396 | expected:'D' | got:'D' | concept: 'ride surfboard'
3397 | expected:'B' | got:'B' | concept: 'ride surfboard'
3398 | expected:'B' | got:'B' | concept: 'ride surfboard'
3399 | expected:'D' | got:'D' | concept: 'ride surfboard'
3400 | expected:'C' | got:'C' | concept: 'ride skateboard'
3401 | expected:'C' | got:'C' | concept: 'ride skateboard'
3402 | expected:'B' | got:'B' | concept: 'ride skateboard'
3403 | expected:'B' | got:'B' | concept: 'ride skateboard'
3404 | expected:'A' | got:'A' | concept: 'ride motorcycle'
3405 | expected:'C' | got:'C' | concept: 'ride motorcycle'
3406 | expected:'A' | got:'A' | concept: 'ride motorcycle'
3407 | expected:'D' | got:'D' | concept: 'ride motorcycle'
3408 | expected:'A' | got:'A' | concept: 'carry surfboard'
3409 | expected:'A' | got:'A' | concept: 'carry surfboard'
3410 | expected:'C' | got:'C' | concept: 'carry surfboard'
3411 | expected:'C' | got:'C' | concept: 'carry surfboard'
3412 | expected:'B' | got:'B' | concept: 'carry handbag'
3413 | expected:'C' | got:'C' | concept: 'carry handbag'
3414 | expected:'C' | got:'C' | concept: 'carry handbag'
3415 | expected:'C' | got:'C' | concept: 'carry handbag'
3416 | expected:'D' | got:'A' | concept: 'carry suitcase'
3417 | expected:'D' | got:'D' | concept: 'carry suitcase'
3418 | expected:'D' | got:'D' | concept: 'carry suitcase'
3419 | expected:'B' | got:'B' | concept: 'carry suitcase'
3420 | expected:'A' | got:'B' | concept: 'drag suitcase'
3421 | expected:'C' | got:'C' | concept: 'drag suitcase'
3422 | expected:'D' | got:'D' | concept: 'drag suitcase'
3423 | expected:'B' | got:'D' | concept: 'drag suitcase'
3424 | expected:'B' | got:'C' | concept: 'grind skateboard'
3425 | expected:'C' | got:'B' | concept: 'grind skateboard'
3426 | expected:'B' | got:'D' | concept: 'grind skateboard'
3427 | expected:'D' | got:'C' | concept: 'grind skateboard'
3428 | expected:'D' | got:'D' | concept: 'jump motorcycle'
3429 | expected:'B' | got:'B' | concept: 'jump motorcycle'
3430 | expected:'D' | got:'D' | concept: 'jump motorcycle'
3431 | expected:'B' | got:'B' | concept: 'jump motorcycle'
3432 | expected:'A' | got:'A' | concept: 'jump horse'
3433 | expected:'A' | got:'A' | concept: 'jump horse'
3434 | expected:'C' | got:'C' | concept: 'jump horse'
3435 | expected:'B' | got:'B' | concept: 'jump horse'
3436 | expected:'B' | got:'B' | concept: 'jump skateboard'
3437 | expected:'A' | got:'A' | concept: 'jump skateboard'
3438 | expected:'C' | got:'C' | concept: 'jump skateboard'
3439 | expected:'C' | got:'C' | concept: 'jump skateboard'
3440 | expected:'A' | got:'A' | concept: 'hold cell_phone'
3441 | expected:'A' | got:'A' | concept: 'hold cell_phone'
3442 | expected:'D' | got:'D' | concept: 'hold cell_phone'
3443 | expected:'B' | got:'B' | concept: 'hold cell_phone'
3444 | expected:'A' | got:'A' | concept: 'talk_on_or_listen_to cell_phone'
3445 | expected:'D' | got:'D' | concept: 'talk_on_or_listen_to cell_phone'
3446 | expected:'D' | got:'D' | concept: 'talk_on_or_listen_to cell_phone'
3447 | expected:'D' | got:'D' | concept: 'talk_on_or_listen_to cell_phone'
3448 | expected:'B' | got:'A' | concept: 'read_like cell_phone'
3449 | expected:'A' | got:'B' | concept: 'read_like cell_phone'
3450 | expected:'C' | got:'A' | concept: 'read_like cell_phone'
3451 | expected:'C' | got:'A' | concept: 'read_like cell_phone'
3452 | expected:'C' | got:'C' | concept: 'hold scissors'
3453 | expected:'D' | got:'C' | concept: 'hold scissors'
3454 | expected:'C' | got:'C' | concept: 'hold scissors'
3455 | expected:'C' | got:'C' | concept: 'hold scissors'
3456 | expected:'C' | got:'C' | concept: 'catch frisbee'
3457 | expected:'A' | got:'A' | concept: 'catch frisbee'
3458 | expected:'A' | got:'A' | concept: 'catch frisbee'
3459 | expected:'C' | got:'C' | concept: 'catch frisbee'
3460 | expected:'B' | got:'B' | concept: 'adjust_or_tie tie'
3461 | expected:'A' | got:'B' | concept: 'adjust_or_tie tie'
3462 | expected:'A' | got:'A' | concept: 'adjust_or_tie tie'
3463 | expected:'A' | got:'A' | concept: 'adjust_or_tie tie'
3464 | expected:'C' | got:'C' | concept: 'wear backpack'
3465 | expected:'A' | got:'A' | concept: 'wear backpack'
3466 | expected:'A' | got:'A' | concept: 'wear backpack'
3467 | expected:'B' | got:'B' | concept: 'wear backpack'
3468 | expected:'A' | got:'A' | concept: 'wear tie'
3469 | expected:'A' | got:'B' | concept: 'wear tie'
3470 | expected:'D' | got:'C' | concept: 'wear tie'
3471 | expected:'A' | got:'B' | concept: 'wear tie'
3472 | expected:'C' | got:'C' | concept: 'hug cat'
3473 | expected:'D' | got:'C' | concept: 'hug cat'
3474 | expected:'A' | got:'A' | concept: 'hug cat'
3475 | expected:'C' | got:'C' | concept: 'hug cat'
3476 | expected:'D' | got:'D' | concept: 'hug person'
3477 | expected:'C' | got:'C' | concept: 'hug person'
3478 | expected:'A' | got:'B' | concept: 'hug person'
3479 | expected:'C' | got:'D' | concept: 'hug person'
3480 | expected:'A' | got:'A' | concept: 'kiss person'
3481 | expected:'C' | got:'C' | concept: 'kiss person'
3482 | expected:'A' | got:'A' | concept: 'kiss person'
3483 | expected:'A' | got:'A' | concept: 'kiss person'
3484 | expected:'C' | got:'C' | concept: 'hug dog'
3485 | expected:'D' | got:'D' | concept: 'hug dog'
3486 | expected:'D' | got:'D' | concept: 'hug dog'
3487 | expected:'B' | got:'B' | concept: 'hug dog'
3488 | expected:'A' | got:'A' | concept: 'hold cell_phone'
3489 | expected:'B' | got:'B' | concept: 'hold cell_phone'
3490 | expected:'C' | got:'C' | concept: 'hold cell_phone'
3491 | expected:'A' | got:'A' | concept: 'hold cell_phone'
3492 | expected:'C' | got:'C' | concept: 'hold handbag'
3493 | expected:'C' | got:'D' | concept: 'hold handbag'
3494 | expected:'B' | got:'B' | concept: 'hold handbag'
3495 | expected:'A' | got:'A' | concept: 'hold handbag'
3496 | expected:'D' | got:'A' | concept: 'hold banana'
3497 | expected:'D' | got:'A' | concept: 'hold banana'
3498 | expected:'A' | got:'A' | concept: 'hold banana'
3499 | expected:'D' | got:'A' | concept: 'hold banana'
3500 | expected:'D' | got:'D' | concept: 'hold dog'
3501 | expected:'C' | got:'C' | concept: 'hold dog'
3502 | expected:'C' | got:'C' | concept: 'hold dog'
3503 | expected:'C' | got:'C' | concept: 'hold dog'
3504 | expected:'B' | got:'D' | concept: 'train dog'
3505 | expected:'D' | got:'A' | concept: 'train dog'
3506 | expected:'D' | got:'D' | concept: 'train dog'
3507 | expected:'D' | got:'D' | concept: 'train dog'
3508 | expected:'C' | got:'C' | concept: 'kiss dog'
3509 | expected:'B' | got:'B' | concept: 'kiss dog'
3510 | expected:'B' | got:'B' | concept: 'kiss dog'
3511 | expected:'C' | got:'C' | concept: 'kiss dog'
3512 | expected:'A' | got:'A' | concept: 'walk dog'
3513 | expected:'A' | got:'A' | concept: 'walk dog'
3514 | expected:'C' | got:'C' | concept: 'walk dog'
3515 | expected:'C' | got:'C' | concept: 'walk dog'
3516 | expected:'A' | got:'A' | concept: 'kiss horse'
3517 | expected:'D' | got:'D' | concept: 'kiss horse'
3518 | expected:'C' | got:'C' | concept: 'kiss horse'
3519 | expected:'A' | got:'A' | concept: 'kiss horse'
3520 | expected:'C' | got:'C' | concept: 'wash bicycle'
3521 | expected:'D' | got:'A' | concept: 'wash bicycle'
3522 | expected:'C' | got:'C' | concept: 'wash bicycle'
3523 | expected:'A' | got:'A' | concept: 'wash bicycle'
3524 | expected:'B' | got:'B' | concept: 'jump bicycle'
3525 | expected:'A' | got:'A' | concept: 'jump bicycle'
3526 | expected:'A' | got:'A' | concept: 'jump bicycle'
3527 | expected:'C' | got:'C' | concept: 'jump bicycle'
3528 | expected:'A' | got:'A' | concept: 'straddle bicycle'
3529 | expected:'A' | got:'A' | concept: 'straddle bicycle'
3530 | expected:'C' | got:'C' | concept: 'straddle bicycle'
3531 | expected:'A' | got:'A' | concept: 'straddle bicycle'
3532 | expected:'D' | got:'D' | concept: 'repair bicycle'
3533 | expected:'C' | got:'C' | concept: 'repair bicycle'
3534 | expected:'B' | got:'B' | concept: 'repair bicycle'
3535 | expected:'B' | got:'B' | concept: 'repair bicycle'
3536 | expected:'B' | got:'B' | concept: 'kiss horse'
3537 | expected:'D' | got:'D' | concept: 'kiss horse'
3538 | expected:'A' | got:'A' | concept: 'kiss horse'
3539 | expected:'B' | got:'B' | concept: 'kiss horse'
3540 | expected:'C' | got:'C' | concept: 'jump horse'
3541 | expected:'D' | got:'D' | concept: 'jump horse'
3542 | expected:'C' | got:'C' | concept: 'jump horse'
3543 | expected:'D' | got:'D' | concept: 'jump horse'
3544 | expected:'C' | got:'C' | concept: 'ride horse'
3545 | expected:'A' | got:'A' | concept: 'ride horse'
3546 | expected:'B' | got:'B' | concept: 'ride horse'
3547 | expected:'C' | got:'C' | concept: 'ride horse'
3548 | expected:'C' | got:'C' | concept: 'ride skis'
3549 | expected:'A' | got:'A' | concept: 'ride skis'
3550 | expected:'A' | got:'A' | concept: 'ride skis'
3551 | expected:'B' | got:'B' | concept: 'ride skis'
3552 | expected:'C' | got:'C' | concept: 'lick knife'
3553 | expected:'A' | got:'A' | concept: 'lick knife'
3554 | expected:'D' | got:'D' | concept: 'lick knife'
3555 | expected:'D' | got:'C' | concept: 'lick knife'
3556 | expected:'D' | got:'D' | concept: 'cut_with knife'
3557 | expected:'C' | got:'C' | concept: 'cut_with knife'
3558 | expected:'B' | got:'A' | concept: 'cut_with knife'
3559 | expected:'A' | got:'A' | concept: 'cut_with knife'
3560 | expected:'D' | got:'B' | concept: 'wield knife'
3561 | expected:'C' | got:'D' | concept: 'wield knife'
3562 | expected:'D' | got:'A' | concept: 'wield knife'
3563 | expected:'C' | got:'C' | concept: 'wield knife'
3564 | expected:'C' | got:'C' | concept: 'hold knife'
3565 | expected:'B' | got:'B' | concept: 'hold knife'
3566 | expected:'A' | got:'C' | concept: 'hold knife'
3567 | expected:'B' | got:'B' | concept: 'hold knife'
3568 | expected:'B' | got:'B' | concept: 'ride motorcycle'
3569 | expected:'A' | got:'A' | concept: 'ride motorcycle'
3570 | expected:'D' | got:'D' | concept: 'ride motorcycle'
3571 | expected:'A' | got:'A' | concept: 'ride motorcycle'
3572 | expected:'B' | got:'B' | concept: 'ride surfboard'
3573 | expected:'C' | got:'C' | concept: 'ride surfboard'
3574 | expected:'D' | got:'D' | concept: 'ride surfboard'
3575 | expected:'C' | got:'C' | concept: 'ride surfboard'
3576 | expected:'D' | got:'D' | concept: 'ride elephant'
3577 | expected:'C' | got:'C' | concept: 'ride elephant'
3578 | expected:'B' | got:'B' | concept: 'ride elephant'
3579 | expected:'C' | got:'C' | concept: 'ride elephant'
3580 | expected:'C' | got:'B' | concept: 'turn motorcycle'
3581 | expected:'C' | got:'A' | concept: 'turn motorcycle'
3582 | expected:'D' | got:'B' | concept: 'turn motorcycle'
3583 | expected:'B' | got:'A' | concept: 'turn motorcycle'
3584 | expected:'D' | got:'D' | concept: 'ride bicycle'
3585 | expected:'B' | got:'B' | concept: 'ride bicycle'
3586 | expected:'A' | got:'A' | concept: 'ride bicycle'
3587 | expected:'D' | got:'D' | concept: 'ride bicycle'
3588 | expected:'C' | got:'C' | concept: 'jump bicycle'
3589 | expected:'D' | got:'D' | concept: 'jump bicycle'
3590 | expected:'C' | got:'C' | concept: 'jump bicycle'
3591 | expected:'D' | got:'D' | concept: 'jump bicycle'
3592 | expected:'C' | got:'D' | concept: 'straddle bicycle'
3593 | expected:'D' | got:'A' | concept: 'straddle bicycle'
3594 | expected:'B' | got:'D' | concept: 'straddle bicycle'
3595 | expected:'D' | got:'C' | concept: 'straddle bicycle'
3596 | expected:'B' | got:'B' | concept: 'walk bicycle'
3597 | expected:'B' | got:'B' | concept: 'walk bicycle'
3598 | expected:'A' | got:'C' | concept: 'walk bicycle'
3599 | expected:'B' | got:'B' | concept: 'walk bicycle'
3600 | expected:'B' | got:'B' | concept: 'use mouse'
3601 | expected:'B' | got:'B' | concept: 'use mouse'
3602 | expected:'C' | got:'C' | concept: 'use mouse'
3603 | expected:'B' | got:'B' | concept: 'use mouse'
3604 | expected:'A' | got:'A' | concept: 'hold toothbrush'
3605 | expected:'D' | got:'B' | concept: 'hold toothbrush'
3606 | expected:'A' | got:'A' | concept: 'hold toothbrush'
3607 | expected:'C' | got:'B' | concept: 'hold toothbrush'
3608 | expected:'C' | got:'C' | concept: 'hold tennis_racket'
3609 | expected:'B' | got:'B' | concept: 'hold tennis_racket'
3610 | expected:'C' | got:'C' | concept: 'hold tennis_racket'
3611 | expected:'A' | got:'A' | concept: 'hold tennis_racket'
3612 | expected:'D' | got:'C' | concept: 'hold mouse'
3613 | expected:'C' | got:'A' | concept: 'hold mouse'
3614 | expected:'A' | got:'C' | concept: 'hold mouse'
3615 | expected:'D' | got:'A' | concept: 'hold mouse'
3616 | expected:'C' | got:'C' | concept: 'hold tennis_racket'
3617 | expected:'D' | got:'D' | concept: 'hold tennis_racket'
3618 | expected:'C' | got:'C' | concept: 'hold tennis_racket'
3619 | expected:'D' | got:'D' | concept: 'hold tennis_racket'
3620 | expected:'D' | got:'C' | concept: 'hold sports_ball'
3621 | expected:'A' | got:'A' | concept: 'hold sports_ball'
3622 | expected:'B' | got:'C' | concept: 'hold sports_ball'
3623 | expected:'B' | got:'D' | concept: 'hold sports_ball'
3624 | expected:'D' | got:'D' | concept: 'hold book'
3625 | expected:'C' | got:'C' | concept: 'hold book'
3626 | expected:'C' | got:'C' | concept: 'hold book'
3627 | expected:'B' | got:'B' | concept: 'hold book'
3628 | expected:'A' | got:'A' | concept: 'hold remote'
3629 | expected:'A' | got:'A' | concept: 'hold remote'
3630 | expected:'A' | got:'A' | concept: 'hold remote'
3631 | expected:'C' | got:'C' | concept: 'hold remote'
3632 | expected:'C' | got:'B' | concept: 'hold wine_glass'
3633 | expected:'B' | got:'B' | concept: 'hold wine_glass'
3634 | expected:'B' | got:'B' | concept: 'hold wine_glass'
3635 | expected:'D' | got:'D' | concept: 'hold wine_glass'
3636 | expected:'D' | got:'A' | concept: 'hold handbag'
3637 | expected:'C' | got:'C' | concept: 'hold handbag'
3638 | expected:'D' | got:'D' | concept: 'hold handbag'
3639 | expected:'A' | got:'A' | concept: 'hold handbag'
3640 | expected:'D' | got:'D' | concept: 'toast wine_glass'
3641 | expected:'A' | got:'A' | concept: 'toast wine_glass'
3642 | expected:'B' | got:'B' | concept: 'toast wine_glass'
3643 | expected:'C' | got:'A' | concept: 'toast wine_glass'
3644 | expected:'A' | got:'A' | concept: 'hold sandwich'
3645 | expected:'A' | got:'A' | concept: 'hold sandwich'
3646 | expected:'C' | got:'C' | concept: 'hold sandwich'
3647 | expected:'C' | got:'C' | concept: 'hold sandwich'
3648 | expected:'A' | got:'C' | concept: 'lie_on_like chair'
3649 | expected:'A' | got:'C' | concept: 'lie_on_like chair'
3650 | expected:'B' | got:'D' | concept: 'lie_on_like chair'
3651 | expected:'A' | got:'B' | concept: 'lie_on_like chair'
3652 | expected:'B' | got:'B' | concept: 'stand_on chair'
3653 | expected:'A' | got:'A' | concept: 'stand_on chair'
3654 | expected:'C' | got:'C' | concept: 'stand_on chair'
3655 | expected:'C' | got:'C' | concept: 'stand_on chair'
3656 | expected:'C' | got:'C' | concept: 'stand_on boat'
3657 | expected:'B' | got:'B' | concept: 'stand_on boat'
3658 | expected:'D' | got:'C' | concept: 'stand_on boat'
3659 | expected:'D' | got:'D' | concept: 'stand_on boat'
3660 | expected:'C' | got:'C' | concept: 'sit_on chair'
3661 | expected:'A' | got:'A' | concept: 'sit_on chair'
3662 | expected:'C' | got:'C' | concept: 'sit_on chair'
3663 | expected:'C' | got:'C' | concept: 'sit_on chair'
3664 | expected:'D' | got:'D' | concept: 'eat apple'
3665 | expected:'B' | got:'B' | concept: 'eat apple'
3666 | expected:'B' | got:'B' | concept: 'eat apple'
3667 | expected:'D' | got:'D' | concept: 'eat apple'
3668 | expected:'A' | got:'A' | concept: 'eat donut'
3669 | expected:'D' | got:'D' | concept: 'eat donut'
3670 | expected:'A' | got:'A' | concept: 'eat donut'
3671 | expected:'A' | got:'A' | concept: 'eat donut'
3672 | expected:'A' | got:'A' | concept: 'eat banana'
3673 | expected:'B' | got:'B' | concept: 'eat banana'
3674 | expected:'A' | got:'A' | concept: 'eat banana'
3675 | expected:'A' | got:'A' | concept: 'eat banana'
3676 | expected:'C' | got:'C' | concept: 'eat orange'
3677 | expected:'D' | got:'D' | concept: 'eat orange'
3678 | expected:'B' | got:'B' | concept: 'eat orange'
3679 | expected:'A' | got:'A' | concept: 'eat orange'
3680 | expected:'D' | got:'C' | concept: 'drag suitcase'
3681 | expected:'B' | got:'B' | concept: 'drag suitcase'
3682 | expected:'B' | got:'D' | concept: 'drag suitcase'
3683 | expected:'A' | got:'A' | concept: 'drag suitcase'
3684 | expected:'A' | got:'A' | concept: 'carry handbag'
3685 | expected:'C' | got:'C' | concept: 'carry handbag'
3686 | expected:'D' | got:'D' | concept: 'carry handbag'
3687 | expected:'D' | got:'A' | concept: 'carry handbag'
3688 | expected:'C' | got:'C' | concept: 'carry surfboard'
3689 | expected:'C' | got:'C' | concept: 'carry surfboard'
3690 | expected:'A' | got:'A' | concept: 'carry surfboard'
3691 | expected:'B' | got:'B' | concept: 'carry surfboard'
3692 | expected:'D' | got:'A' | concept: 'carry suitcase'
3693 | expected:'A' | got:'A' | concept: 'carry suitcase'
3694 | expected:'D' | got:'C' | concept: 'carry suitcase'
3695 | expected:'D' | got:'D' | concept: 'carry suitcase'
3696 | expected:'A' | got:'A' | concept: 'hold apple'
3697 | expected:'D' | got:'D' | concept: 'hold apple'
3698 | expected:'C' | got:'C' | concept: 'hold apple'
3699 | expected:'C' | got:'C' | concept: 'hold apple'
3700 | expected:'D' | got:'D' | concept: 'hold tennis_racket'
3701 | expected:'A' | got:'C' | concept: 'hold tennis_racket'
3702 | expected:'B' | got:'C' | concept: 'hold tennis_racket'
3703 | expected:'C' | got:'C' | concept: 'hold tennis_racket'
3704 | expected:'A' | got:'A' | concept: 'hold knife'
3705 | expected:'A' | got:'D' | concept: 'hold knife'
3706 | expected:'C' | got:'C' | concept: 'hold knife'
3707 | expected:'D' | got:'D' | concept: 'hold knife'
3708 | expected:'C' | got:'C' | concept: 'swing tennis_racket'
3709 | expected:'B' | got:'B' | concept: 'swing tennis_racket'
3710 | expected:'D' | got:'A' | concept: 'swing tennis_racket'
3711 | expected:'B' | got:'B' | concept: 'swing tennis_racket'
3712 | expected:'A' | got:'A' | concept: 'brush_with toothbrush'
3713 | expected:'A' | got:'A' | concept: 'brush_with toothbrush'
3714 | expected:'C' | got:'C' | concept: 'brush_with toothbrush'
3715 | expected:'A' | got:'A' | concept: 'brush_with toothbrush'
3716 | expected:'D' | got:'D' | concept: 'sit_on bed'
3717 | expected:'B' | got:'B' | concept: 'sit_on bed'
3718 | expected:'C' | got:'C' | concept: 'sit_on bed'
3719 | expected:'B' | got:'B' | concept: 'sit_on bed'
3720 | expected:'C' | got:'C' | concept: 'adjust_or_tie tie'
3721 | expected:'D' | got:'D' | concept: 'adjust_or_tie tie'
3722 | expected:'A' | got:'A' | concept: 'adjust_or_tie tie'
3723 | expected:'D' | got:'D' | concept: 'adjust_or_tie tie'
3724 | expected:'D' | got:'D' | concept: 'stand_under umbrella'
3725 | expected:'B' | got:'B' | concept: 'stand_under umbrella'
3726 | expected:'D' | got:'A' | concept: 'stand_under umbrella'
3727 | expected:'D' | got:'A' | concept: 'stand_under umbrella'
3728 | expected:'B' | got:'B' | concept: 'ride skateboard'
3729 | expected:'B' | got:'C' | concept: 'ride skateboard'
3730 | expected:'D' | got:'C' | concept: 'ride skateboard'
3731 | expected:'D' | got:'C' | concept: 'ride skateboard'
3732 | expected:'C' | got:'C' | concept: 'grind skateboard'
3733 | expected:'D' | got:'D' | concept: 'grind skateboard'
3734 | expected:'B' | got:'B' | concept: 'grind skateboard'
3735 | expected:'A' | got:'A' | concept: 'grind skateboard'
3736 | expected:'A' | got:'A' | concept: 'grind snowboard'
3737 | expected:'B' | got:'A' | concept: 'grind snowboard'
3738 | expected:'A' | got:'B' | concept: 'grind snowboard'
3739 | expected:'C' | got:'D' | concept: 'grind snowboard'
3740 | expected:'B' | got:'D' | concept: 'sit_on skateboard'
3741 | expected:'B' | got:'B' | concept: 'sit_on skateboard'
3742 | expected:'C' | got:'D' | concept: 'sit_on skateboard'
3743 | expected:'D' | got:'D' | concept: 'sit_on skateboard'
3744 | expected:'D' | got:'D' | concept: 'hold pizza'
3745 | expected:'D' | got:'D' | concept: 'hold pizza'
3746 | expected:'A' | got:'A' | concept: 'hold pizza'
3747 | expected:'A' | got:'A' | concept: 'hold pizza'
3748 | expected:'A' | got:'A' | concept: 'hold dog'
3749 | expected:'A' | got:'A' | concept: 'hold dog'
3750 | expected:'A' | got:'A' | concept: 'hold dog'
3751 | expected:'C' | got:'C' | concept: 'hold dog'
3752 | expected:'B' | got:'B' | concept: 'hold knife'
3753 | expected:'B' | got:'B' | concept: 'hold knife'
3754 | expected:'A' | got:'A' | concept: 'hold knife'
3755 | expected:'D' | got:'D' | concept: 'hold knife'
3756 | expected:'C' | got:'C' | concept: 'hold mouse'
3757 | expected:'D' | got:'D' | concept: 'hold mouse'
3758 | expected:'A' | got:'A' | concept: 'hold mouse'
3759 | expected:'A' | got:'A' | concept: 'hold mouse'
3760 | expected:'C' | got:'C' | concept: 'hold toothbrush'
3761 | expected:'D' | got:'D' | concept: 'hold toothbrush'
3762 | expected:'A' | got:'A' | concept: 'hold toothbrush'
3763 | expected:'A' | got:'A' | concept: 'hold toothbrush'
3764 | expected:'C' | got:'INVALID' | concept: 'hold cake'
3765 | expected:'C' | got:'INVALID' | concept: 'hold cake'
3766 | expected:'C' | got:'C' | concept: 'hold cake'
3767 | expected:'D' | got:'D' | concept: 'hold cake'
3768 | expected:'A' | got:'A' | concept: 'hold dog'
3769 | expected:'C' | got:'C' | concept: 'hold dog'
3770 | expected:'A' | got:'A' | concept: 'hold dog'
3771 | expected:'C' | got:'C' | concept: 'hold dog'
3772 | expected:'B' | got:'B' | concept: 'hold banana'
3773 | expected:'C' | got:'C' | concept: 'hold banana'
3774 | expected:'A' | got:'A' | concept: 'hold banana'
3775 | expected:'B' | got:'B' | concept: 'hold banana'
3776 | expected:'B' | got:'B' | concept: 'clean microwave'
3777 | expected:'B' | got:'B' | concept: 'clean microwave'
3778 | expected:'C' | got:'C' | concept: 'clean microwave'
3779 | expected:'A' | got:'A' | concept: 'clean microwave'
3780 | expected:'A' | got:'A' | concept: 'clean keyboard'
3781 | expected:'C' | got:'C' | concept: 'clean keyboard'
3782 | expected:'C' | got:'C' | concept: 'clean keyboard'
3783 | expected:'D' | got:'A' | concept: 'clean keyboard'
3784 | expected:'D' | got:'D' | concept: 'clean toilet'
3785 | expected:'C' | got:'C' | concept: 'clean toilet'
3786 | expected:'A' | got:'A' | concept: 'clean toilet'
3787 | expected:'D' | got:'D' | concept: 'clean toilet'
3788 | expected:'A' | got:'A' | concept: 'clean refrigerator'
3789 | expected:'C' | got:'C' | concept: 'clean refrigerator'
3790 | expected:'C' | got:'C' | concept: 'clean refrigerator'
3791 | expected:'A' | got:'A' | concept: 'clean refrigerator'
3792 | expected:'A' | got:'A' | concept: 'ride skateboard'
3793 | expected:'A' | got:'A' | concept: 'ride skateboard'
3794 | expected:'C' | got:'C' | concept: 'ride skateboard'
3795 | expected:'D' | got:'D' | concept: 'ride skateboard'
3796 | expected:'C' | got:'C' | concept: 'ride bicycle'
3797 | expected:'A' | got:'A' | concept: 'ride bicycle'
3798 | expected:'B' | got:'B' | concept: 'ride bicycle'
3799 | expected:'D' | got:'D' | concept: 'ride bicycle'
3800 | expected:'B' | got:'B' | concept: 'ride snowboard'
3801 | expected:'A' | got:'A' | concept: 'ride snowboard'
3802 | expected:'D' | got:'D' | concept: 'ride snowboard'
3803 | expected:'D' | got:'D' | concept: 'ride snowboard'
3804 | expected:'C' | got:'C' | concept: 'ride elephant'
3805 | expected:'B' | got:'B' | concept: 'ride elephant'
3806 | expected:'D' | got:'D' | concept: 'ride elephant'
3807 | expected:'C' | got:'C' | concept: 'ride elephant'
3808 | expected:'C' | got:'C' | concept: 'eat pizza'
3809 | expected:'C' | got:'C' | concept: 'eat pizza'
3810 | expected:'A' | got:'A' | concept: 'eat pizza'
3811 | expected:'B' | got:'B' | concept: 'eat pizza'
3812 | expected:'B' | got:'C' | concept: 'make pizza'
3813 | expected:'B' | got:'A' | concept: 'make pizza'
3814 | expected:'B' | got:'B' | concept: 'make pizza'
3815 | expected:'B' | got:'B' | concept: 'make pizza'
3816 | expected:'C' | got:'C' | concept: 'cut pizza'
3817 | expected:'A' | got:'A' | concept: 'cut pizza'
3818 | expected:'D' | got:'D' | concept: 'cut pizza'
3819 | expected:'B' | got:'C' | concept: 'cut pizza'
3820 | expected:'B' | got:'B' | concept: 'hold pizza'
3821 | expected:'A' | got:'A' | concept: 'hold pizza'
3822 | expected:'A' | got:'D' | concept: 'hold pizza'
3823 | expected:'B' | got:'B' | concept: 'hold pizza'
3824 | expected:'A' | got:'A' | concept: 'ride bicycle'
3825 | expected:'D' | got:'D' | concept: 'ride bicycle'
3826 | expected:'A' | got:'A' | concept: 'ride bicycle'
3827 | expected:'A' | got:'A' | concept: 'ride bicycle'
3828 | expected:'D' | got:'D' | concept: 'ride skateboard'
3829 | expected:'C' | got:'C' | concept: 'ride skateboard'
3830 | expected:'D' | got:'D' | concept: 'ride skateboard'
3831 | expected:'C' | got:'C' | concept: 'ride skateboard'
3832 | expected:'D' | got:'D' | concept: 'ride elephant'
3833 | expected:'C' | got:'C' | concept: 'ride elephant'
3834 | expected:'B' | got:'B' | concept: 'ride elephant'
3835 | expected:'D' | got:'D' | concept: 'ride elephant'
3836 | expected:'D' | got:'D' | concept: 'ride motorcycle'
3837 | expected:'B' | got:'B' | concept: 'ride motorcycle'
3838 | expected:'D' | got:'D' | concept: 'ride motorcycle'
3839 | expected:'D' | got:'D' | concept: 'ride motorcycle'
3840 | expected:'D' | got:'D' | concept: 'hold spoon'
3841 | expected:'C' | got:'C' | concept: 'hold spoon'
3842 | expected:'B' | got:'B' | concept: 'hold spoon'
3843 | expected:'B' | got:'A' | concept: 'hold spoon'
3844 | expected:'C' | got:'C' | concept: 'hold cup'
3845 | expected:'B' | got:'B' | concept: 'hold cup'
3846 | expected:'A' | got:'A' | concept: 'hold cup'
3847 | expected:'B' | got:'B' | concept: 'hold cup'
3848 | expected:'C' | got:'C' | concept: 'hold skateboard'
3849 | expected:'B' | got:'B' | concept: 'hold skateboard'
3850 | expected:'B' | got:'B' | concept: 'hold skateboard'
3851 | expected:'A' | got:'A' | concept: 'hold skateboard'
3852 | expected:'C' | got:'C' | concept: 'hold orange'
3853 | expected:'A' | got:'A' | concept: 'hold orange'
3854 | expected:'B' | got:'B' | concept: 'hold orange'
3855 | expected:'A' | got:'A' | concept: 'hold orange'
3856 | expected:'B' | got:'B' | concept: 'hug horse'
3857 | expected:'B' | got:'B' | concept: 'hug horse'
3858 | expected:'D' | got:'D' | concept: 'hug horse'
3859 | expected:'D' | got:'D' | concept: 'hug horse'
3860 | expected:'D' | got:'D' | concept: 'hug dog'
3861 | expected:'D' | got:'D' | concept: 'hug dog'
3862 | expected:'B' | got:'B' | concept: 'hug dog'
3863 | expected:'A' | got:'A' | concept: 'hug dog'
3864 | expected:'D' | got:'A' | concept: 'pet cat'
3865 | expected:'A' | got:'A' | concept: 'pet cat'
3866 | expected:'A' | got:'A' | concept: 'pet cat'
3867 | expected:'C' | got:'C' | concept: 'pet cat'
3868 | expected:'D' | got:'A' | concept: 'hug cat'
3869 | expected:'B' | got:'B' | concept: 'hug cat'
3870 | expected:'C' | got:'C' | concept: 'hug cat'
3871 | expected:'B' | got:'B' | concept: 'hug cat'
3872 | expected:'D' | got:'D' | concept: 'hold book'
3873 | expected:'D' | got:'B' | concept: 'hold book'
3874 | expected:'B' | got:'B' | concept: 'hold book'
3875 | expected:'B' | got:'B' | concept: 'hold book'
3876 | expected:'D' | got:'D' | concept: 'hold tennis_racket'
3877 | expected:'B' | got:'B' | concept: 'hold tennis_racket'
3878 | expected:'A' | got:'A' | concept: 'hold tennis_racket'
3879 | expected:'A' | got:'A' | concept: 'hold tennis_racket'
3880 | expected:'B' | got:'B' | concept: 'hold handbag'
3881 | expected:'A' | got:'A' | concept: 'hold handbag'
3882 | expected:'C' | got:'C' | concept: 'hold handbag'
3883 | expected:'D' | got:'D' | concept: 'hold handbag'
3884 | expected:'B' | got:'B' | concept: 'hold cell_phone'
3885 | expected:'D' | got:'D' | concept: 'hold cell_phone'
3886 | expected:'D' | got:'D' | concept: 'hold cell_phone'
3887 | expected:'A' | got:'A' | concept: 'hold cell_phone'
3888 | expected:'B' | got:'B' | concept: 'sit_at dining_table'
3889 | expected:'A' | got:'A' | concept: 'sit_at dining_table'
3890 | expected:'B' | got:'B' | concept: 'sit_at dining_table'
3891 | expected:'B' | got:'B' | concept: 'sit_at dining_table'
3892 | expected:'A' | got:'A' | concept: 'direct airplane'
3893 | expected:'A' | got:'A' | concept: 'direct airplane'
3894 | expected:'A' | got:'A' | concept: 'direct airplane'
3895 | expected:'C' | got:'C' | concept: 'direct airplane'
3896 | expected:'C' | got:'C' | concept: 'type_on laptop'
3897 | expected:'D' | got:'D' | concept: 'type_on laptop'
3898 | expected:'B' | got:'B' | concept: 'type_on laptop'
3899 | expected:'D' | got:'D' | concept: 'type_on laptop'
3900 | expected:'D' | got:'D' | concept: 'kiss horse'
3901 | expected:'B' | got:'B' | concept: 'kiss horse'
3902 | expected:'C' | got:'C' | concept: 'kiss horse'
3903 | expected:'C' | got:'C' | concept: 'kiss horse'
3904 | expected:'C' | got:'C' | concept: 'carry suitcase'
3905 | expected:'B' | got:'C' | concept: 'carry suitcase'
3906 | expected:'B' | got:'C' | concept: 'carry suitcase'
3907 | expected:'A' | got:'A' | concept: 'carry suitcase'
3908 | expected:'C' | got:'B' | concept: 'carry handbag'
3909 | expected:'A' | got:'A' | concept: 'carry handbag'
3910 | expected:'D' | got:'B' | concept: 'carry handbag'
3911 | expected:'D' | got:'A' | concept: 'carry handbag'
3912 | expected:'B' | got:'B' | concept: 'hold handbag'
3913 | expected:'C' | got:'C' | concept: 'hold handbag'
3914 | expected:'B' | got:'B' | concept: 'hold handbag'
3915 | expected:'A' | got:'B' | concept: 'hold handbag'
3916 | expected:'A' | got:'A' | concept: 'carry surfboard'
3917 | expected:'A' | got:'A' | concept: 'carry surfboard'
3918 | expected:'C' | got:'C' | concept: 'carry surfboard'
3919 | expected:'C' | got:'C' | concept: 'carry surfboard'
3920 | expected:'A' | got:'A' | concept: 'drink_with cup'
3921 | expected:'B' | got:'B' | concept: 'drink_with cup'
3922 | expected:'C' | got:'C' | concept: 'drink_with cup'
3923 | expected:'C' | got:'A' | concept: 'drink_with cup'
3924 | expected:'B' | got:'A' | concept: 'hold cup'
3925 | expected:'C' | got:'B' | concept: 'hold cup'
3926 | expected:'C' | got:'C' | concept: 'hold cup'
3927 | expected:'C' | got:'D' | concept: 'hold cup'
3928 | expected:'D' | got:'B' | concept: 'drink_with bottle'
3929 | expected:'D' | got:'D' | concept: 'drink_with bottle'
3930 | expected:'C' | got:'B' | concept: 'drink_with bottle'
3931 | expected:'A' | got:'B' | concept: 'drink_with bottle'
3932 | expected:'A' | got:'D' | concept: 'hold bottle'
3933 | expected:'B' | got:'A' | concept: 'hold bottle'
3934 | expected:'A' | got:'A' | concept: 'hold bottle'
3935 | expected:'A' | got:'C' | concept: 'hold bottle'
3936 | expected:'B' | got:'B' | concept: 'lie_on couch'
3937 | expected:'C' | got:'C' | concept: 'lie_on couch'
3938 | expected:'D' | got:'B' | concept: 'lie_on couch'
3939 | expected:'D' | got:'D' | concept: 'lie_on couch'
3940 | expected:'B' | got:'B' | concept: 'lie_on bed'
3941 | expected:'B' | got:'B' | concept: 'lie_on bed'
3942 | expected:'C' | got:'C' | concept: 'lie_on bed'
3943 | expected:'C' | got:'C' | concept: 'lie_on bed'
3944 | expected:'A' | got:'A' | concept: 'sit_on couch'
3945 | expected:'D' | got:'D' | concept: 'sit_on couch'
3946 | expected:'B' | got:'B' | concept: 'sit_on couch'
3947 | expected:'C' | got:'C' | concept: 'sit_on couch'
3948 | expected:'D' | got:'B' | concept: 'lie_on bench'
3949 | expected:'D' | got:'B' | concept: 'lie_on bench'
3950 | expected:'C' | got:'C' | concept: 'lie_on bench'
3951 | expected:'B' | got:'B' | concept: 'lie_on bench'
3952 | expected:'D' | got:'C' | concept: 'hold bottle'
3953 | expected:'C' | got:'A' | concept: 'hold bottle'
3954 | expected:'A' | got:'B' | concept: 'hold bottle'
3955 | expected:'D' | got:'B' | concept: 'hold bottle'
3956 | expected:'D' | got:'D' | concept: 'drink_with bottle'
3957 | expected:'C' | got:'C' | concept: 'drink_with bottle'
3958 | expected:'C' | got:'C' | concept: 'drink_with bottle'
3959 | expected:'A' | got:'A' | concept: 'drink_with bottle'
3960 | expected:'C' | got:'D' | concept: 'drink_with cup'
3961 | expected:'C' | got:'C' | concept: 'drink_with cup'
3962 | expected:'C' | got:'A' | concept: 'drink_with cup'
3963 | expected:'B' | got:'B' | concept: 'drink_with cup'
3964 | expected:'C' | got:'B' | concept: 'hold pizza'
3965 | expected:'D' | got:'A' | concept: 'hold pizza'
3966 | expected:'D' | got:'D' | concept: 'hold pizza'
3967 | expected:'B' | got:'B' | concept: 'hold pizza'
3968 | expected:'B' | got:'B' | concept: 'carry suitcase'
3969 | expected:'D' | got:'A' | concept: 'carry suitcase'
3970 | expected:'C' | got:'C' | concept: 'carry suitcase'
3971 | expected:'A' | got:'A' | concept: 'carry suitcase'
3972 | expected:'A' | got:'A' | concept: 'hold handbag'
3973 | expected:'C' | got:'C' | concept: 'hold handbag'
3974 | expected:'B' | got:'B' | concept: 'hold handbag'
3975 | expected:'D' | got:'A' | concept: 'hold handbag'
3976 | expected:'D' | got:'D' | concept: 'carry handbag'
3977 | expected:'A' | got:'A' | concept: 'carry handbag'
3978 | expected:'D' | got:'B' | concept: 'carry handbag'
3979 | expected:'C' | got:'A' | concept: 'carry handbag'
3980 | expected:'A' | got:'A' | concept: 'carry surfboard'
3981 | expected:'A' | got:'A' | concept: 'carry surfboard'
3982 | expected:'A' | got:'A' | concept: 'carry surfboard'
3983 | expected:'C' | got:'C' | concept: 'carry surfboard'
3984 | expected:'A' | got:'A' | concept: 'pet horse'
3985 | expected:'A' | got:'A' | concept: 'pet horse'
3986 | expected:'D' | got:'D' | concept: 'pet horse'
3987 | expected:'C' | got:'C' | concept: 'pet horse'
3988 | expected:'D' | got:'D' | concept: 'pet sheep'
3989 | expected:'C' | got:'C' | concept: 'pet sheep'
3990 | expected:'B' | got:'B' | concept: 'pet sheep'
3991 | expected:'B' | got:'B' | concept: 'pet sheep'
3992 | expected:'D' | got:'D' | concept: 'pet dog'
3993 | expected:'C' | got:'C' | concept: 'pet dog'
3994 | expected:'C' | got:'C' | concept: 'pet dog'
3995 | expected:'B' | got:'B' | concept: 'pet dog'
3996 | expected:'D' | got:'A' | concept: 'shear sheep'
3997 | expected:'A' | got:'A' | concept: 'shear sheep'
3998 | expected:'A' | got:'C' | concept: 'shear sheep'
3999 | expected:'A' | got:'A' | concept: 'shear sheep'
4000 | expected:'A' | got:'B' | concept: 'hug dog'
4001 | expected:'A' | got:'A' | concept: 'hug dog'
4002 | expected:'A' | got:'D' | concept: 'hug dog'
4003 | expected:'D' | got:'D' | concept: 'hug dog'
4004 | expected:'C' | got:'C' | concept: 'kiss dog'
4005 | expected:'C' | got:'C' | concept: 'kiss dog'
4006 | expected:'D' | got:'D' | concept: 'kiss dog'
4007 | expected:'D' | got:'D' | concept: 'kiss dog'
4008 | expected:'D' | got:'C' | concept: 'train dog'
4009 | expected:'A' | got:'A' | concept: 'train dog'
4010 | expected:'A' | got:'C' | concept: 'train dog'
4011 | expected:'B' | got:'B' | concept: 'train dog'
4012 | expected:'C' | got:'C' | concept: 'pet dog'
4013 | expected:'D' | got:'D' | concept: 'pet dog'
4014 | expected:'B' | got:'B' | concept: 'pet dog'
4015 | expected:'C' | got:'C' | concept: 'pet dog'
4016 | expected:'D' | got:'D' | concept: 'repair bicycle'
4017 | expected:'D' | got:'D' | concept: 'repair bicycle'
4018 | expected:'B' | got:'B' | concept: 'repair bicycle'
4019 | expected:'A' | got:'D' | concept: 'repair bicycle'
4020 | expected:'B' | got:'C' | concept: 'walk bicycle'
4021 | expected:'D' | got:'A' | concept: 'walk bicycle'
4022 | expected:'C' | got:'C' | concept: 'walk bicycle'
4023 | expected:'B' | got:'B' | concept: 'walk bicycle'
4024 | expected:'C' | got:'C' | concept: 'ride bicycle'
4025 | expected:'B' | got:'B' | concept: 'ride bicycle'
4026 | expected:'B' | got:'A' | concept: 'ride bicycle'
4027 | expected:'C' | got:'C' | concept: 'ride bicycle'
4028 | expected:'C' | got:'C' | concept: 'straddle bicycle'
4029 | expected:'D' | got:'C' | concept: 'straddle bicycle'
4030 | expected:'B' | got:'A' | concept: 'straddle bicycle'
4031 | expected:'B' | got:'B' | concept: 'straddle bicycle'
4032 | expected:'A' | got:'A' | concept: 'pet horse'
4033 | expected:'A' | got:'A' | concept: 'pet horse'
4034 | expected:'B' | got:'B' | concept: 'pet horse'
4035 | expected:'A' | got:'A' | concept: 'pet horse'
4036 | expected:'B' | got:'B' | concept: 'pet dog'
4037 | expected:'C' | got:'C' | concept: 'pet dog'
4038 | expected:'C' | got:'C' | concept: 'pet dog'
4039 | expected:'D' | got:'D' | concept: 'pet dog'
4040 | expected:'B' | got:'B' | concept: 'shear sheep'
4041 | expected:'C' | got:'C' | concept: 'shear sheep'
4042 | expected:'C' | got:'A' | concept: 'shear sheep'
4043 | expected:'A' | got:'A' | concept: 'shear sheep'
4044 | expected:'C' | got:'C' | concept: 'pet sheep'
4045 | expected:'B' | got:'B' | concept: 'pet sheep'
4046 | expected:'C' | got:'C' | concept: 'pet sheep'
4047 | expected:'A' | got:'A' | concept: 'pet sheep'
4048 | expected:'D' | got:'D' | concept: 'ride horse'
4049 | expected:'C' | got:'C' | concept: 'ride horse'
4050 | expected:'D' | got:'D' | concept: 'ride horse'
4051 | expected:'C' | got:'C' | concept: 'ride horse'
4052 | expected:'C' | got:'C' | concept: 'pet horse'
4053 | expected:'D' | got:'D' | concept: 'pet horse'
4054 | expected:'B' | got:'A' | concept: 'pet horse'
4055 | expected:'B' | got:'B' | concept: 'pet horse'
4056 | expected:'D' | got:'D' | concept: 'kiss person'
4057 | expected:'D' | got:'D' | concept: 'kiss person'
4058 | expected:'B' | got:'B' | concept: 'kiss person'
4059 | expected:'D' | got:'D' | concept: 'kiss person'
4060 | expected:'D' | got:'D' | concept: 'kiss horse'
4061 | expected:'C' | got:'C' | concept: 'kiss horse'
4062 | expected:'B' | got:'B' | concept: 'kiss horse'
4063 | expected:'D' | got:'D' | concept: 'kiss horse'
4064 | expected:'D' | got:'D' | concept: 'hold spoon'
4065 | expected:'B' | got:'B' | concept: 'hold spoon'
4066 | expected:'A' | got:'A' | concept: 'hold spoon'
4067 | expected:'D' | got:'D' | concept: 'hold spoon'
4068 | expected:'C' | got:'C' | concept: 'hold hot_dog'
4069 | expected:'D' | got:'D' | concept: 'hold hot_dog'
4070 | expected:'D' | got:'D' | concept: 'hold hot_dog'
4071 | expected:'C' | got:'A' | concept: 'hold hot_dog'
4072 | expected:'B' | got:'B' | concept: 'swing tennis_racket'
4073 | expected:'C' | got:'C' | concept: 'swing tennis_racket'
4074 | expected:'A' | got:'A' | concept: 'swing tennis_racket'
4075 | expected:'D' | got:'D' | concept: 'swing tennis_racket'
4076 | expected:'C' | got:'A' | concept: 'hold tennis_racket'
4077 | expected:'C' | got:'D' | concept: 'hold tennis_racket'
4078 | expected:'B' | got:'A' | concept: 'hold tennis_racket'
4079 | expected:'B' | got:'D' | concept: 'hold tennis_racket'
4080 | expected:'D' | got:'D' | concept: 'hold skateboard'
4081 | expected:'C' | got:'C' | concept: 'hold skateboard'
4082 | expected:'A' | got:'A' | concept: 'hold skateboard'
4083 | expected:'B' | got:'B' | concept: 'hold skateboard'
4084 | expected:'B' | got:'D' | concept: 'sit_on skateboard'
4085 | expected:'A' | got:'D' | concept: 'sit_on skateboard'
4086 | expected:'D' | got:'D' | concept: 'sit_on skateboard'
4087 | expected:'C' | got:'D' | concept: 'sit_on skateboard'
4088 | expected:'D' | got:'D' | concept: 'hold cake'
4089 | expected:'B' | got:'B' | concept: 'hold cake'
4090 | expected:'B' | got:'B' | concept: 'hold cake'
4091 | expected:'B' | got:'B' | concept: 'hold cake'
4092 | expected:'B' | got:'B' | concept: 'hold tennis_racket'
4093 | expected:'D' | got:'D' | concept: 'hold tennis_racket'
4094 | expected:'B' | got:'B' | concept: 'hold tennis_racket'
4095 | expected:'A' | got:'A' | concept: 'hold tennis_racket'
4096 | expected:'C' | got:'C' | concept: 'hold pizza'
4097 | expected:'C' | got:'B' | concept: 'hold pizza'
4098 | expected:'B' | got:'D' | concept: 'hold pizza'
4099 | expected:'A' | got:'A' | concept: 'hold pizza'
4100 | expected:'A' | got:'A' | concept: 'cut pizza'
4101 | expected:'C' | got:'C' | concept: 'cut pizza'
4102 | expected:'D' | got:'D' | concept: 'cut pizza'
4103 | expected:'D' | got:'D' | concept: 'cut pizza'
4104 | expected:'A' | got:'A' | concept: 'eat pizza'
4105 | expected:'A' | got:'A' | concept: 'eat pizza'
4106 | expected:'A' | got:'A' | concept: 'eat pizza'
4107 | expected:'B' | got:'B' | concept: 'eat pizza'
4108 | expected:'A' | got:'C' | concept: 'make pizza'
4109 | expected:'C' | got:'B' | concept: 'make pizza'
4110 | expected:'D' | got:'B' | concept: 'make pizza'
4111 | expected:'C' | got:'C' | concept: 'make pizza'
4112 | expected:'D' | got:'C' | concept: 'walk horse'
4113 | expected:'A' | got:'A' | concept: 'walk horse'
4114 | expected:'D' | got:'D' | concept: 'walk horse'
4115 | expected:'D' | got:'C' | concept: 'walk horse'
4116 | expected:'D' | got:'D' | concept: 'kiss horse'
4117 | expected:'A' | got:'A' | concept: 'kiss horse'
4118 | expected:'C' | got:'C' | concept: 'kiss horse'
4119 | expected:'B' | got:'B' | concept: 'kiss horse'
4120 | expected:'C' | got:'C' | concept: 'kiss person'
4121 | expected:'C' | got:'C' | concept: 'kiss person'
4122 | expected:'A' | got:'A' | concept: 'kiss person'
4123 | expected:'D' | got:'D' | concept: 'kiss person'
4124 | expected:'B' | got:'B' | concept: 'ride horse'
4125 | expected:'A' | got:'A' | concept: 'ride horse'
4126 | expected:'A' | got:'A' | concept: 'ride horse'
4127 | expected:'B' | got:'B' | concept: 'ride horse'
4128 | expected:'D' | got:'D' | concept: 'repair bicycle'
4129 | expected:'A' | got:'A' | concept: 'repair bicycle'
4130 | expected:'A' | got:'A' | concept: 'repair bicycle'
4131 | expected:'D' | got:'D' | concept: 'repair bicycle'
4132 | expected:'C' | got:'C' | concept: 'wash bicycle'
4133 | expected:'A' | got:'D' | concept: 'wash bicycle'
4134 | expected:'D' | got:'C' | concept: 'wash bicycle'
4135 | expected:'D' | got:'D' | concept: 'wash bicycle'
4136 | expected:'B' | got:'C' | concept: 'straddle bicycle'
4137 | expected:'D' | got:'D' | concept: 'straddle bicycle'
4138 | expected:'C' | got:'C' | concept: 'straddle bicycle'
4139 | expected:'D' | got:'D' | concept: 'straddle bicycle'
4140 | expected:'D' | got:'D' | concept: 'jump bicycle'
4141 | expected:'D' | got:'D' | concept: 'jump bicycle'
4142 | expected:'A' | got:'A' | concept: 'jump bicycle'
4143 | expected:'B' | got:'B' | concept: 'jump bicycle'
4144 | expected:'C' | got:'D' | concept: 'hold cake'
4145 | expected:'C' | got:'INVALID' | concept: 'hold cake'
4146 | expected:'A' | got:'C' | concept: 'hold cake'
4147 | expected:'C' | got:'INVALID' | concept: 'hold cake'
4148 | expected:'D' | got:'D' | concept: 'cut cake'
4149 | expected:'A' | got:'A' | concept: 'cut cake'
4150 | expected:'B' | got:'B' | concept: 'cut cake'
4151 | expected:'A' | got:'A' | concept: 'cut cake'
4152 | expected:'C' | got:'C' | concept: 'cut pizza'
4153 | expected:'A' | got:'A' | concept: 'cut pizza'
4154 | expected:'C' | got:'C' | concept: 'cut pizza'
4155 | expected:'B' | got:'B' | concept: 'cut pizza'
4156 | expected:'D' | got:'C' | concept: 'eat pizza'
4157 | expected:'B' | got:'B' | concept: 'eat pizza'
4158 | expected:'D' | got:'D' | concept: 'eat pizza'
4159 | expected:'B' | got:'B' | concept: 'eat pizza'
4160 | expected:'D' | got:'D' | concept: 'operate microwave'
4161 | expected:'B' | got:'B' | concept: 'operate microwave'
4162 | expected:'C' | got:'C' | concept: 'operate microwave'
4163 | expected:'D' | got:'D' | concept: 'operate microwave'
4164 | expected:'A' | got:'A' | concept: 'clean keyboard'
4165 | expected:'A' | got:'A' | concept: 'clean keyboard'
4166 | expected:'D' | got:'A' | concept: 'clean keyboard'
4167 | expected:'C' | got:'C' | concept: 'clean keyboard'
4168 | expected:'A' | got:'A' | concept: 'open microwave'
4169 | expected:'D' | got:'A' | concept: 'open microwave'
4170 | expected:'A' | got:'A' | concept: 'open microwave'
4171 | expected:'A' | got:'C' | concept: 'open microwave'
4172 | expected:'D' | got:'D' | concept: 'clean microwave'
4173 | expected:'D' | got:'A' | concept: 'clean microwave'
4174 | expected:'B' | got:'B' | concept: 'clean microwave'
4175 | expected:'D' | got:'D' | concept: 'clean microwave'
4176 | expected:'B' | got:'C' | concept: 'hold cake'
4177 | expected:'A' | got:'INVALID' | concept: 'hold cake'
4178 | expected:'B' | got:'B' | concept: 'hold cake'
4179 | expected:'B' | got:'D' | concept: 'hold cake'
4180 | expected:'B' | got:'B' | concept: 'hold skateboard'
4181 | expected:'B' | got:'B' | concept: 'hold skateboard'
4182 | expected:'A' | got:'A' | concept: 'hold skateboard'
4183 | expected:'B' | got:'B' | concept: 'hold skateboard'
4184 | expected:'C' | got:'A' | concept: 'hold knife'
4185 | expected:'B' | got:'B' | concept: 'hold knife'
4186 | expected:'D' | got:'D' | concept: 'hold knife'
4187 | expected:'D' | got:'D' | concept: 'hold knife'
4188 | expected:'D' | got:'D' | concept: 'hold sports_ball'
4189 | expected:'B' | got:'B' | concept: 'hold sports_ball'
4190 | expected:'A' | got:'A' | concept: 'hold sports_ball'
4191 | expected:'A' | got:'A' | concept: 'hold sports_ball'
4192 | expected:'C' | got:'C' | concept: 'hold hot_dog'
4193 | expected:'A' | got:'C' | concept: 'hold hot_dog'
4194 | expected:'C' | got:'C' | concept: 'hold hot_dog'
4195 | expected:'D' | got:'B' | concept: 'hold hot_dog'
4196 | expected:'B' | got:'B' | concept: 'hold cell_phone'
4197 | expected:'A' | got:'A' | concept: 'hold cell_phone'
4198 | expected:'C' | got:'A' | concept: 'hold cell_phone'
4199 | expected:'D' | got:'D' | concept: 'hold cell_phone'
4200 | expected:'B' | got:'D' | concept: 'hold spoon'
4201 | expected:'C' | got:'C' | concept: 'hold spoon'
4202 | expected:'B' | got:'B' | concept: 'hold spoon'
4203 | expected:'C' | got:'C' | concept: 'hold spoon'
4204 | expected:'A' | got:'A' | concept: 'hold tennis_racket'
4205 | expected:'C' | got:'C' | concept: 'hold tennis_racket'
4206 | expected:'D' | got:'A' | concept: 'hold tennis_racket'
4207 | expected:'A' | got:'A' | concept: 'hold tennis_racket'
4208 | expected:'D' | got:'A' | concept: 'kiss dog'
4209 | expected:'B' | got:'B' | concept: 'kiss dog'
4210 | expected:'A' | got:'A' | concept: 'kiss dog'
4211 | expected:'C' | got:'C' | concept: 'kiss dog'
4212 | expected:'D' | got:'D' | concept: 'hug person'
4213 | expected:'A' | got:'D' | concept: 'hug person'
4214 | expected:'B' | got:'A' | concept: 'hug person'
4215 | expected:'C' | got:'C' | concept: 'hug person'
4216 | expected:'C' | got:'C' | concept: 'greet person'
4217 | expected:'D' | got:'D' | concept: 'greet person'
4218 | expected:'A' | got:'A' | concept: 'greet person'
4219 | expected:'D' | got:'D' | concept: 'greet person'
4220 | expected:'B' | got:'B' | concept: 'kiss person'
4221 | expected:'C' | got:'C' | concept: 'kiss person'
4222 | expected:'B' | got:'B' | concept: 'kiss person'
4223 | expected:'B' | got:'B' | concept: 'kiss person'
4224 | expected:'B' | got:'A' | concept: 'hold cake'
4225 | expected:'C' | got:'C' | concept: 'hold cake'
4226 | expected:'A' | got:'C' | concept: 'hold cake'
4227 | expected:'C' | got:'A' | concept: 'hold cake'
4228 | expected:'D' | got:'D' | concept: 'hold pizza'
4229 | expected:'D' | got:'D' | concept: 'hold pizza'
4230 | expected:'A' | got:'A' | concept: 'hold pizza'
4231 | expected:'B' | got:'B' | concept: 'hold pizza'
4232 | expected:'C' | got:'C' | concept: 'hold mouse'
4233 | expected:'A' | got:'A' | concept: 'hold mouse'
4234 | expected:'C' | got:'C' | concept: 'hold mouse'
4235 | expected:'D' | got:'D' | concept: 'hold mouse'
4236 | expected:'A' | got:'A' | concept: 'hold wine_glass'
4237 | expected:'A' | got:'A' | concept: 'hold wine_glass'
4238 | expected:'A' | got:'A' | concept: 'hold wine_glass'
4239 | expected:'D' | got:'A' | concept: 'hold wine_glass'
4240 | expected:'A' | got:'A' | concept: 'hold banana'
4241 | expected:'B' | got:'B' | concept: 'hold banana'
4242 | expected:'B' | got:'B' | concept: 'hold banana'
4243 | expected:'D' | got:'A' | concept: 'hold banana'
4244 | expected:'D' | got:'D' | concept: 'hold laptop'
4245 | expected:'D' | got:'D' | concept: 'hold laptop'
4246 | expected:'A' | got:'A' | concept: 'hold laptop'
4247 | expected:'B' | got:'B' | concept: 'hold laptop'
4248 | expected:'B' | got:'B' | concept: 'hold dog'
4249 | expected:'B' | got:'B' | concept: 'hold dog'
4250 | expected:'B' | got:'B' | concept: 'hold dog'
4251 | expected:'D' | got:'D' | concept: 'hold dog'
4252 | expected:'C' | got:'A' | concept: 'hold pizza'
4253 | expected:'C' | got:'C' | concept: 'hold pizza'
4254 | expected:'D' | got:'A' | concept: 'hold pizza'
4255 | expected:'D' | got:'A' | concept: 'hold pizza'
4256 | expected:'A' | got:'A' | concept: 'hold_and_about_to_eat apple'
4257 | expected:'C' | got:'C' | concept: 'hold_and_about_to_eat apple'
4258 | expected:'A' | got:'D' | concept: 'hold_and_about_to_eat apple'
4259 | expected:'B' | got:'A' | concept: 'hold_and_about_to_eat apple'
4260 | expected:'A' | got:'C' | concept: 'eat apple'
4261 | expected:'A' | got:'D' | concept: 'eat apple'
4262 | expected:'C' | got:'C' | concept: 'eat apple'
4263 | expected:'C' | got:'C' | concept: 'eat apple'
4264 | expected:'D' | got:'D' | concept: 'pick apple'
4265 | expected:'C' | got:'C' | concept: 'pick apple'
4266 | expected:'B' | got:'B' | concept: 'pick apple'
4267 | expected:'B' | got:'C' | concept: 'pick apple'
4268 | expected:'B' | got:'B' | concept: 'peel_or_cut apple'
4269 | expected:'A' | got:'A' | concept: 'peel_or_cut apple'
4270 | expected:'C' | got:'C' | concept: 'peel_or_cut apple'
4271 | expected:'A' | got:'A' | concept: 'peel_or_cut apple'
4272 | expected:'D' | got:'D' | concept: 'jump motorcycle'
4273 | expected:'C' | got:'C' | concept: 'jump motorcycle'
4274 | expected:'D' | got:'D' | concept: 'jump motorcycle'
4275 | expected:'B' | got:'B' | concept: 'jump motorcycle'
4276 | expected:'C' | got:'C' | concept: 'jump skateboard'
4277 | expected:'D' | got:'D' | concept: 'jump skateboard'
4278 | expected:'C' | got:'C' | concept: 'jump skateboard'
4279 | expected:'D' | got:'D' | concept: 'jump skateboard'
4280 | expected:'A' | got:'A' | concept: 'grind skateboard'
4281 | expected:'C' | got:'D' | concept: 'grind skateboard'
4282 | expected:'C' | got:'C' | concept: 'grind skateboard'
4283 | expected:'D' | got:'B' | concept: 'grind skateboard'
4284 | expected:'C' | got:'C' | concept: 'jump snowboard'
4285 | expected:'C' | got:'C' | concept: 'jump snowboard'
4286 | expected:'C' | got:'B' | concept: 'jump snowboard'
4287 | expected:'C' | got:'C' | concept: 'jump snowboard'
4288 | expected:'A' | got:'A' | concept: 'hold remote'
4289 | expected:'C' | got:'C' | concept: 'hold remote'
4290 | expected:'A' | got:'A' | concept: 'hold remote'
4291 | expected:'B' | got:'B' | concept: 'hold remote'
4292 | expected:'A' | got:'A' | concept: 'hold sports_ball'
4293 | expected:'A' | got:'A' | concept: 'hold sports_ball'
4294 | expected:'C' | got:'C' | concept: 'hold sports_ball'
4295 | expected:'C' | got:'C' | concept: 'hold sports_ball'
4296 | expected:'D' | got:'D' | concept: 'hold spoon'
4297 | expected:'C' | got:'C' | concept: 'hold spoon'
4298 | expected:'B' | got:'B' | concept: 'hold spoon'
4299 | expected:'B' | got:'A' | concept: 'hold spoon'
4300 | expected:'A' | got:'A' | concept: 'hold pizza'
4301 | expected:'C' | got:'C' | concept: 'hold pizza'
4302 | expected:'C' | got:'C' | concept: 'hold pizza'
4303 | expected:'B' | got:'B' | concept: 'hold pizza'
4304 | expected:'B' | got:'B' | concept: 'ride skis'
4305 | expected:'A' | got:'A' | concept: 'ride skis'
4306 | expected:'C' | got:'C' | concept: 'ride skis'
4307 | expected:'C' | got:'C' | concept: 'ride skis'
4308 | expected:'C' | got:'C' | concept: 'ride horse'
4309 | expected:'C' | got:'C' | concept: 'ride horse'
4310 | expected:'B' | got:'B' | concept: 'ride horse'
4311 | expected:'B' | got:'B' | concept: 'ride horse'
4312 | expected:'C' | got:'C' | concept: 'ride bicycle'
4313 | expected:'C' | got:'C' | concept: 'ride bicycle'
4314 | expected:'A' | got:'A' | concept: 'ride bicycle'
4315 | expected:'A' | got:'B' | concept: 'ride bicycle'
4316 | expected:'D' | got:'A' | concept: 'straddle bicycle'
4317 | expected:'C' | got:'B' | concept: 'straddle bicycle'
4318 | expected:'C' | got:'B' | concept: 'straddle bicycle'
4319 | expected:'A' | got:'C' | concept: 'straddle bicycle'
4320 | expected:'A' | got:'A' | concept: 'jump skateboard'
4321 | expected:'A' | got:'A' | concept: 'jump skateboard'
4322 | expected:'C' | got:'C' | concept: 'jump skateboard'
4323 | expected:'A' | got:'A' | concept: 'jump skateboard'
4324 | expected:'D' | got:'A' | concept: 'ride skateboard'
4325 | expected:'A' | got:'A' | concept: 'ride skateboard'
4326 | expected:'C' | got:'C' | concept: 'ride skateboard'
4327 | expected:'D' | got:'D' | concept: 'ride skateboard'
4328 | expected:'B' | got:'B' | concept: 'grind snowboard'
4329 | expected:'D' | got:'C' | concept: 'grind snowboard'
4330 | expected:'D' | got:'B' | concept: 'grind snowboard'
4331 | expected:'B' | got:'A' | concept: 'grind snowboard'
4332 | expected:'D' | got:'C' | concept: 'grind skateboard'
4333 | expected:'C' | got:'B' | concept: 'grind skateboard'
4334 | expected:'B' | got:'B' | concept: 'grind skateboard'
4335 | expected:'D' | got:'C' | concept: 'grind skateboard'
4336 | expected:'A' | got:'A' | concept: 'walk cow'
4337 | expected:'B' | got:'B' | concept: 'walk cow'
4338 | expected:'C' | got:'C' | concept: 'walk cow'
4339 | expected:'D' | got:'A' | concept: 'walk cow'
4340 | expected:'D' | got:'B' | concept: 'train dog'
4341 | expected:'A' | got:'C' | concept: 'train dog'
4342 | expected:'A' | got:'C' | concept: 'train dog'
4343 | expected:'A' | got:'A' | concept: 'train dog'
4344 | expected:'C' | got:'C' | concept: 'walk dog'
4345 | expected:'C' | got:'B' | concept: 'walk dog'
4346 | expected:'B' | got:'B' | concept: 'walk dog'
4347 | expected:'B' | got:'B' | concept: 'walk dog'
4348 | expected:'D' | got:'D' | concept: 'pet dog'
4349 | expected:'D' | got:'D' | concept: 'pet dog'
4350 | expected:'D' | got:'D' | concept: 'pet dog'
4351 | expected:'D' | got:'D' | concept: 'pet dog'
4352 | expected:'B' | got:'B' | concept: 'carry surfboard'
4353 | expected:'C' | got:'B' | concept: 'carry surfboard'
4354 | expected:'D' | got:'B' | concept: 'carry surfboard'
4355 | expected:'B' | got:'B' | concept: 'carry surfboard'
4356 | expected:'D' | got:'A' | concept: 'carry suitcase'
4357 | expected:'D' | got:'C' | concept: 'carry suitcase'
4358 | expected:'B' | got:'B' | concept: 'carry suitcase'
4359 | expected:'A' | got:'A' | concept: 'carry suitcase'
4360 | expected:'C' | got:'C' | concept: 'ride surfboard'
4361 | expected:'D' | got:'D' | concept: 'ride surfboard'
4362 | expected:'B' | got:'B' | concept: 'ride surfboard'
4363 | expected:'B' | got:'B' | concept: 'ride surfboard'
4364 | expected:'C' | got:'C' | concept: 'carry handbag'
4365 | expected:'D' | got:'D' | concept: 'carry handbag'
4366 | expected:'D' | got:'A' | concept: 'carry handbag'
4367 | expected:'B' | got:'B' | concept: 'carry handbag'
4368 | expected:'C' | got:'C' | concept: 'inspect motorcycle'
4369 | expected:'C' | got:'C' | concept: 'inspect motorcycle'
4370 | expected:'A' | got:'A' | concept: 'inspect motorcycle'
4371 | expected:'A' | got:'A' | concept: 'inspect motorcycle'
4372 | expected:'B' | got:'B' | concept: 'inspect oven'
4373 | expected:'D' | got:'D' | concept: 'inspect oven'
4374 | expected:'D' | got:'D' | concept: 'inspect oven'
4375 | expected:'D' | got:'D' | concept: 'inspect oven'
4376 | expected:'C' | got:'C' | concept: 'clean oven'
4377 | expected:'A' | got:'A' | concept: 'clean oven'
4378 | expected:'C' | got:'C' | concept: 'clean oven'
4379 | expected:'B' | got:'B' | concept: 'clean oven'
4380 | expected:'D' | got:'D' | concept: 'sit_on motorcycle'
4381 | expected:'B' | got:'C' | concept: 'sit_on motorcycle'
4382 | expected:'A' | got:'A' | concept: 'sit_on motorcycle'
4383 | expected:'B' | got:'B' | concept: 'sit_on motorcycle'
4384 | expected:'B' | got:'B' | concept: 'carry surfboard'
4385 | expected:'B' | got:'A' | concept: 'carry surfboard'
4386 | expected:'B' | got:'B' | concept: 'carry surfboard'
4387 | expected:'B' | got:'B' | concept: 'carry surfboard'
4388 | expected:'D' | got:'A' | concept: 'carry handbag'
4389 | expected:'A' | got:'A' | concept: 'carry handbag'
4390 | expected:'B' | got:'B' | concept: 'carry handbag'
4391 | expected:'B' | got:'B' | concept: 'carry handbag'
4392 | expected:'A' | got:'A' | concept: 'ride surfboard'
4393 | expected:'B' | got:'B' | concept: 'ride surfboard'
4394 | expected:'C' | got:'C' | concept: 'ride surfboard'
4395 | expected:'B' | got:'B' | concept: 'ride surfboard'
4396 | expected:'C' | got:'C' | concept: 'carry suitcase'
4397 | expected:'B' | got:'C' | concept: 'carry suitcase'
4398 | expected:'D' | got:'C' | concept: 'carry suitcase'
4399 | expected:'C' | got:'B' | concept: 'carry suitcase'
4400 | expected:'B' | got:'B' | concept: 'hold remote'
4401 | expected:'C' | got:'C' | concept: 'hold remote'
4402 | expected:'D' | got:'D' | concept: 'hold remote'
4403 | expected:'D' | got:'D' | concept: 'hold remote'
4404 | expected:'B' | got:'B' | concept: 'hold pizza'
4405 | expected:'C' | got:'C' | concept: 'hold pizza'
4406 | expected:'C' | got:'A' | concept: 'hold pizza'
4407 | expected:'C' | got:'C' | concept: 'hold pizza'
4408 | expected:'A' | got:'C' | concept: 'hold spoon'
4409 | expected:'D' | got:'B' | concept: 'hold spoon'
4410 | expected:'B' | got:'A' | concept: 'hold spoon'
4411 | expected:'A' | got:'A' | concept: 'hold spoon'
4412 | expected:'D' | got:'C' | concept: 'lick_or_sip spoon'
4413 | expected:'A' | got:'A' | concept: 'lick_or_sip spoon'
4414 | expected:'C' | got:'C' | concept: 'lick_or_sip spoon'
4415 | expected:'B' | got:'B' | concept: 'lick_or_sip spoon'
4416 | expected:'C' | got:'C' | concept: 'hold knife'
4417 | expected:'D' | got:'D' | concept: 'hold knife'
4418 | expected:'A' | got:'A' | concept: 'hold knife'
4419 | expected:'A' | got:'B' | concept: 'hold knife'
4420 | expected:'D' | got:'D' | concept: 'hold cup'
4421 | expected:'B' | got:'B' | concept: 'hold cup'
4422 | expected:'C' | got:'C' | concept: 'hold cup'
4423 | expected:'D' | got:'C' | concept: 'hold cup'
4424 | expected:'B' | got:'B' | concept: 'hold bottle'
4425 | expected:'D' | got:'B' | concept: 'hold bottle'
4426 | expected:'C' | got:'A' | concept: 'hold bottle'
4427 | expected:'C' | got:'C' | concept: 'hold bottle'
4428 | expected:'C' | got:'C' | concept: 'hold orange'
4429 | expected:'B' | got:'B' | concept: 'hold orange'
4430 | expected:'C' | got:'C' | concept: 'hold orange'
4431 | expected:'C' | got:'C' | concept: 'hold orange'
4432 | expected:'D' | got:'D' | concept: 'ride horse'
4433 | expected:'D' | got:'D' | concept: 'ride horse'
4434 | expected:'C' | got:'C' | concept: 'ride horse'
4435 | expected:'A' | got:'A' | concept: 'ride horse'
4436 | expected:'A' | got:'A' | concept: 'pet horse'
4437 | expected:'D' | got:'D' | concept: 'pet horse'
4438 | expected:'A' | got:'A' | concept: 'pet horse'
4439 | expected:'A' | got:'A' | concept: 'pet horse'
4440 | expected:'C' | got:'C' | concept: 'kiss horse'
4441 | expected:'B' | got:'B' | concept: 'kiss horse'
4442 | expected:'B' | got:'C' | concept: 'kiss horse'
4443 | expected:'D' | got:'B' | concept: 'kiss horse'
4444 | expected:'D' | got:'D' | concept: 'pet sheep'
4445 | expected:'D' | got:'D' | concept: 'pet sheep'
4446 | expected:'C' | got:'C' | concept: 'pet sheep'
4447 | expected:'D' | got:'D' | concept: 'pet sheep'
4448 | expected:'D' | got:'B' | concept: 'peel orange'
4449 | expected:'C' | got:'C' | concept: 'peel orange'
4450 | expected:'B' | got:'C' | concept: 'peel orange'
4451 | expected:'B' | got:'C' | concept: 'peel orange'
4452 | expected:'B' | got:'B' | concept: 'eat orange'
4453 | expected:'D' | got:'D' | concept: 'eat orange'
4454 | expected:'A' | got:'A' | concept: 'eat orange'
4455 | expected:'A' | got:'A' | concept: 'eat orange'
4456 | expected:'C' | got:'C' | concept: 'squeeze orange'
4457 | expected:'C' | got:'C' | concept: 'squeeze orange'
4458 | expected:'B' | got:'D' | concept: 'squeeze orange'
4459 | expected:'A' | got:'A' | concept: 'squeeze orange'
4460 | expected:'D' | got:'D' | concept: 'peel banana'
4461 | expected:'C' | got:'C' | concept: 'peel banana'
4462 | expected:'A' | got:'A' | concept: 'peel banana'
4463 | expected:'B' | got:'B' | concept: 'peel banana'
4464 | expected:'B' | got:'B' | concept: 'clean toilet'
4465 | expected:'D' | got:'D' | concept: 'clean toilet'
4466 | expected:'C' | got:'C' | concept: 'clean toilet'
4467 | expected:'D' | got:'D' | concept: 'clean toilet'
4468 | expected:'B' | got:'B' | concept: 'clean oven'
4469 | expected:'B' | got:'B' | concept: 'clean oven'
4470 | expected:'B' | got:'B' | concept: 'clean oven'
4471 | expected:'D' | got:'D' | concept: 'clean oven'
4472 | expected:'D' | got:'A' | concept: 'clean microwave'
4473 | expected:'C' | got:'C' | concept: 'clean microwave'
4474 | expected:'C' | got:'C' | concept: 'clean microwave'
4475 | expected:'A' | got:'A' | concept: 'clean microwave'
4476 | expected:'D' | got:'A' | concept: 'clean keyboard'
4477 | expected:'A' | got:'A' | concept: 'clean keyboard'
4478 | expected:'A' | got:'A' | concept: 'clean keyboard'
4479 | expected:'A' | got:'A' | concept: 'clean keyboard'
4480 | expected:'D' | got:'D' | concept: 'peel_or_cut apple'
4481 | expected:'B' | got:'B' | concept: 'peel_or_cut apple'
4482 | expected:'D' | got:'D' | concept: 'peel_or_cut apple'
4483 | expected:'D' | got:'A' | concept: 'peel_or_cut apple'
4484 | expected:'C' | got:'C' | concept: 'eat apple'
4485 | expected:'D' | got:'D' | concept: 'eat apple'
4486 | expected:'C' | got:'C' | concept: 'eat apple'
4487 | expected:'C' | got:'C' | concept: 'eat apple'
4488 | expected:'D' | got:'D' | concept: 'eat banana'
4489 | expected:'A' | got:'A' | concept: 'eat banana'
4490 | expected:'D' | got:'D' | concept: 'eat banana'
4491 | expected:'B' | got:'B' | concept: 'eat banana'
4492 | expected:'D' | got:'D' | concept: 'eat hot_dog'
4493 | expected:'B' | got:'B' | concept: 'eat hot_dog'
4494 | expected:'D' | got:'D' | concept: 'eat hot_dog'
4495 | expected:'A' | got:'D' | concept: 'eat hot_dog'
4496 | expected:'D' | got:'D' | concept: 'ride elephant'
4497 | expected:'A' | got:'A' | concept: 'ride elephant'
4498 | expected:'C' | got:'C' | concept: 'ride elephant'
4499 | expected:'B' | got:'B' | concept: 'ride elephant'
4500 | expected:'D' | got:'D' | concept: 'ride horse'
4501 | expected:'D' | got:'D' | concept: 'ride horse'
4502 | expected:'C' | got:'C' | concept: 'ride horse'
4503 | expected:'A' | got:'A' | concept: 'ride horse'
4504 | expected:'C' | got:'C' | concept: 'ride surfboard'
4505 | expected:'B' | got:'B' | concept: 'ride surfboard'
4506 | expected:'D' | got:'D' | concept: 'ride surfboard'
4507 | expected:'D' | got:'D' | concept: 'ride surfboard'
4508 | expected:'D' | got:'D' | concept: 'ride snowboard'
4509 | expected:'A' | got:'A' | concept: 'ride snowboard'
4510 | expected:'C' | got:'C' | concept: 'ride snowboard'
4511 | expected:'C' | got:'C' | concept: 'ride snowboard'
4512 | expected:'C' | got:'A' | concept: 'hold toothbrush'
4513 | expected:'B' | got:'C' | concept: 'hold toothbrush'
4514 | expected:'C' | got:'C' | concept: 'hold toothbrush'
4515 | expected:'A' | got:'A' | concept: 'hold toothbrush'
4516 | expected:'A' | got:'A' | concept: 'hold book'
4517 | expected:'A' | got:'A' | concept: 'hold book'
4518 | expected:'A' | got:'A' | concept: 'hold book'
4519 | expected:'C' | got:'C' | concept: 'hold book'
4520 | expected:'A' | got:'D' | concept: 'hold kite'
4521 | expected:'C' | got:'C' | concept: 'hold kite'
4522 | expected:'D' | got:'A' | concept: 'hold kite'
4523 | expected:'C' | got:'C' | concept: 'hold kite'
4524 | expected:'A' | got:'A' | concept: 'hold sports_ball'
4525 | expected:'D' | got:'D' | concept: 'hold sports_ball'
4526 | expected:'C' | got:'C' | concept: 'hold sports_ball'
4527 | expected:'B' | got:'C' | concept: 'hold sports_ball'
4528 | expected:'A' | got:'A' | concept: 'sit_on skateboard'
4529 | expected:'D' | got:'D' | concept: 'sit_on skateboard'
4530 | expected:'B' | got:'B' | concept: 'sit_on skateboard'
4531 | expected:'C' | got:'C' | concept: 'sit_on skateboard'
4532 | expected:'A' | got:'A' | concept: 'stand_on chair'
4533 | expected:'A' | got:'D' | concept: 'stand_on chair'
4534 | expected:'A' | got:'A' | concept: 'stand_on chair'
4535 | expected:'D' | got:'B' | concept: 'stand_on chair'
4536 | expected:'B' | got:'B' | concept: 'sit_on chair'
4537 | expected:'D' | got:'D' | concept: 'sit_on chair'
4538 | expected:'A' | got:'A' | concept: 'sit_on chair'
4539 | expected:'D' | got:'C' | concept: 'sit_on chair'
4540 | expected:'C' | got:'C' | concept: 'lie_on_like chair'
4541 | expected:'D' | got:'B' | concept: 'lie_on_like chair'
4542 | expected:'B' | got:'B' | concept: 'lie_on_like chair'
4543 | expected:'D' | got:'D' | concept: 'lie_on_like chair'
4544 | expected:'C' | got:'C' | concept: 'hold donut'
4545 | expected:'B' | got:'B' | concept: 'hold donut'
4546 | expected:'D' | got:'D' | concept: 'hold donut'
4547 | expected:'B' | got:'C' | concept: 'hold donut'
4548 | expected:'A' | got:'A' | concept: 'hold sports_ball'
4549 | expected:'D' | got:'D' | concept: 'hold sports_ball'
4550 | expected:'D' | got:'A' | concept: 'hold sports_ball'
4551 | expected:'D' | got:'C' | concept: 'hold sports_ball'
4552 | expected:'C' | got:'C' | concept: 'drink_with cup'
4553 | expected:'A' | got:'C' | concept: 'drink_with cup'
4554 | expected:'C' | got:'C' | concept: 'drink_with cup'
4555 | expected:'D' | got:'D' | concept: 'drink_with cup'
4556 | expected:'B' | got:'C' | concept: 'hold cup'
4557 | expected:'A' | got:'B' | concept: 'hold cup'
4558 | expected:'A' | got:'A' | concept: 'hold cup'
4559 | expected:'D' | got:'D' | concept: 'hold cup'
4560 | expected:'B' | got:'B' | concept: 'hold kite'
4561 | expected:'C' | got:'C' | concept: 'hold kite'
4562 | expected:'D' | got:'D' | concept: 'hold kite'
4563 | expected:'D' | got:'D' | concept: 'hold kite'
4564 | expected:'A' | got:'A' | concept: 'hold pizza'
4565 | expected:'B' | got:'B' | concept: 'hold pizza'
4566 | expected:'A' | got:'A' | concept: 'hold pizza'
4567 | expected:'A' | got:'A' | concept: 'hold pizza'
4568 | expected:'C' | got:'C' | concept: 'hold mouse'
4569 | expected:'C' | got:'C' | concept: 'hold mouse'
4570 | expected:'A' | got:'A' | concept: 'hold mouse'
4571 | expected:'D' | got:'D' | concept: 'hold mouse'
4572 | expected:'A' | got:'A' | concept: 'hold donut'
4573 | expected:'D' | got:'D' | concept: 'hold donut'
4574 | expected:'A' | got:'A' | concept: 'hold donut'
4575 | expected:'A' | got:'A' | concept: 'hold donut'
4576 | expected:'B' | got:'B' | concept: 'ride snowboard'
4577 | expected:'B' | got:'B' | concept: 'ride snowboard'
4578 | expected:'D' | got:'D' | concept: 'ride snowboard'
4579 | expected:'A' | got:'C' | concept: 'ride snowboard'
4580 | expected:'C' | got:'C' | concept: 'jump snowboard'
4581 | expected:'B' | got:'C' | concept: 'jump snowboard'
4582 | expected:'D' | got:'D' | concept: 'jump snowboard'
4583 | expected:'B' | got:'C' | concept: 'jump snowboard'
4584 | expected:'D' | got:'D' | concept: 'jump skateboard'
4585 | expected:'A' | got:'A' | concept: 'jump skateboard'
4586 | expected:'A' | got:'A' | concept: 'jump skateboard'
4587 | expected:'C' | got:'C' | concept: 'jump skateboard'
4588 | expected:'A' | got:'A' | concept: 'jump motorcycle'
4589 | expected:'D' | got:'D' | concept: 'jump motorcycle'
4590 | expected:'C' | got:'C' | concept: 'jump motorcycle'
4591 | expected:'A' | got:'A' | concept: 'jump motorcycle'
4592 | expected:'A' | got:'A' | concept: 'drive train'
4593 | expected:'C' | got:'C' | concept: 'drive train'
4594 | expected:'C' | got:'C' | concept: 'drive train'
4595 | expected:'B' | got:'B' | concept: 'drive train'
4596 | expected:'D' | got:'D' | concept: 'swing tennis_racket'
4597 | expected:'B' | got:'B' | concept: 'swing tennis_racket'
4598 | expected:'D' | got:'D' | concept: 'swing tennis_racket'
4599 | expected:'D' | got:'A' | concept: 'swing tennis_racket'
4600 | expected:'C' | got:'C' | concept: 'board train'
4601 | expected:'A' | got:'A' | concept: 'board train'
4602 | expected:'D' | got:'D' | concept: 'board train'
4603 | expected:'C' | got:'C' | concept: 'board train'
4604 | expected:'C' | got:'C' | concept: 'hold laptop'
4605 | expected:'C' | got:'C' | concept: 'hold laptop'
4606 | expected:'D' | got:'A' | concept: 'hold laptop'
4607 | expected:'A' | got:'A' | concept: 'hold laptop'
4608 | expected:'C' | got:'C' | concept: 'push motorcycle'
4609 | expected:'B' | got:'B' | concept: 'push motorcycle'
4610 | expected:'B' | got:'B' | concept: 'push motorcycle'
4611 | expected:'C' | got:'C' | concept: 'push motorcycle'
4612 | expected:'D' | got:'D' | concept: 'jump motorcycle'
4613 | expected:'A' | got:'A' | concept: 'jump motorcycle'
4614 | expected:'B' | got:'B' | concept: 'jump motorcycle'
4615 | expected:'A' | got:'A' | concept: 'jump motorcycle'
4616 | expected:'D' | got:'D' | concept: 'wash car'
4617 | expected:'A' | got:'A' | concept: 'wash car'
4618 | expected:'A' | got:'A' | concept: 'wash car'
4619 | expected:'A' | got:'A' | concept: 'wash car'
4620 | expected:'C' | got:'C' | concept: 'wash motorcycle'
4621 | expected:'A' | got:'A' | concept: 'wash motorcycle'
4622 | expected:'C' | got:'C' | concept: 'wash motorcycle'
4623 | expected:'C' | got:'C' | concept: 'wash motorcycle'
4624 | expected:'C' | got:'C' | concept: 'sit_on skateboard'
4625 | expected:'A' | got:'A' | concept: 'sit_on skateboard'
4626 | expected:'D' | got:'D' | concept: 'sit_on skateboard'
4627 | expected:'C' | got:'C' | concept: 'sit_on skateboard'
4628 | expected:'D' | got:'D' | concept: 'sit_on chair'
4629 | expected:'B' | got:'B' | concept: 'sit_on chair'
4630 | expected:'A' | got:'C' | concept: 'sit_on chair'
4631 | expected:'B' | got:'B' | concept: 'sit_on chair'
4632 | expected:'B' | got:'B' | concept: 'sit_on couch'
4633 | expected:'C' | got:'C' | concept: 'sit_on couch'
4634 | expected:'B' | got:'B' | concept: 'sit_on couch'
4635 | expected:'D' | got:'D' | concept: 'sit_on couch'
4636 | expected:'D' | got:'D' | concept: 'sit_on bed'
4637 | expected:'C' | got:'C' | concept: 'sit_on bed'
4638 | expected:'A' | got:'A' | concept: 'sit_on bed'
4639 | expected:'D' | got:'D' | concept: 'sit_on bed'
4640 | expected:'B' | got:'B' | concept: 'eat donut'
4641 | expected:'D' | got:'D' | concept: 'eat donut'
4642 | expected:'A' | got:'A' | concept: 'eat donut'
4643 | expected:'C' | got:'C' | concept: 'eat donut'
4644 | expected:'B' | got:'B' | concept: 'eat hot_dog'
4645 | expected:'D' | got:'D' | concept: 'eat hot_dog'
4646 | expected:'B' | got:'B' | concept: 'eat hot_dog'
4647 | expected:'D' | got:'D' | concept: 'eat hot_dog'
4648 | expected:'A' | got:'A' | concept: 'eat sandwich'
4649 | expected:'C' | got:'C' | concept: 'eat sandwich'
4650 | expected:'B' | got:'B' | concept: 'eat sandwich'
4651 | expected:'A' | got:'A' | concept: 'eat sandwich'
4652 | expected:'C' | got:'D' | concept: 'eat pizza'
4653 | expected:'D' | got:'D' | concept: 'eat pizza'
4654 | expected:'A' | got:'D' | concept: 'eat pizza'
4655 | expected:'A' | got:'A' | concept: 'eat pizza'
4656 | expected:'B' | got:'D' | concept: 'hold orange'
4657 | expected:'B' | got:'B' | concept: 'hold orange'
4658 | expected:'A' | got:'A' | concept: 'hold orange'
4659 | expected:'D' | got:'A' | concept: 'hold orange'
4660 | expected:'D' | got:'A' | concept: 'hold apple'
4661 | expected:'B' | got:'B' | concept: 'hold apple'
4662 | expected:'B' | got:'A' | concept: 'hold apple'
4663 | expected:'C' | got:'C' | concept: 'hold apple'
4664 | expected:'C' | got:'C' | concept: 'squeeze orange'
4665 | expected:'D' | got:'A' | concept: 'squeeze orange'
4666 | expected:'B' | got:'B' | concept: 'squeeze orange'
4667 | expected:'C' | got:'C' | concept: 'squeeze orange'
4668 | expected:'B' | got:'B' | concept: 'hold sandwich'
4669 | expected:'A' | got:'A' | concept: 'hold sandwich'
4670 | expected:'C' | got:'C' | concept: 'hold sandwich'
4671 | expected:'C' | got:'C' | concept: 'hold sandwich'
4672 | expected:'A' | got:'A' | concept: 'jump snowboard'
4673 | expected:'A' | got:'A' | concept: 'jump snowboard'
4674 | expected:'B' | got:'B' | concept: 'jump snowboard'
4675 | expected:'C' | got:'C' | concept: 'jump snowboard'
4676 | expected:'D' | got:'D' | concept: 'grind snowboard'
4677 | expected:'C' | got:'C' | concept: 'grind snowboard'
4678 | expected:'D' | got:'A' | concept: 'grind snowboard'
4679 | expected:'C' | got:'B' | concept: 'grind snowboard'
4680 | expected:'D' | got:'D' | concept: 'ride snowboard'
4681 | expected:'C' | got:'C' | concept: 'ride snowboard'
4682 | expected:'B' | got:'B' | concept: 'ride snowboard'
4683 | expected:'D' | got:'C' | concept: 'ride snowboard'
4684 | expected:'C' | got:'C' | concept: 'jump motorcycle'
4685 | expected:'D' | got:'D' | concept: 'jump motorcycle'
4686 | expected:'C' | got:'C' | concept: 'jump motorcycle'
4687 | expected:'A' | got:'A' | concept: 'jump motorcycle'
4688 | expected:'A' | got:'B' | concept: 'lie_on bed'
4689 | expected:'B' | got:'C' | concept: 'lie_on bed'
4690 | expected:'A' | got:'A' | concept: 'lie_on bed'
4691 | expected:'C' | got:'C' | concept: 'lie_on bed'
4692 | expected:'B' | got:'B' | concept: 'lie_on couch'
4693 | expected:'A' | got:'A' | concept: 'lie_on couch'
4694 | expected:'A' | got:'A' | concept: 'lie_on couch'
4695 | expected:'D' | got:'C' | concept: 'lie_on couch'
4696 | expected:'D' | got:'D' | concept: 'sit_on bench'
4697 | expected:'A' | got:'A' | concept: 'sit_on bench'
4698 | expected:'D' | got:'D' | concept: 'sit_on bench'
4699 | expected:'B' | got:'B' | concept: 'sit_on bench'
4700 | expected:'D' | got:'B' | concept: 'lie_on bench'
4701 | expected:'D' | got:'B' | concept: 'lie_on bench'
4702 | expected:'D' | got:'C' | concept: 'lie_on bench'
4703 | expected:'D' | got:'D' | concept: 'lie_on bench'
4704 | expected:'B' | got:'B' | concept: 'clean oven'
4705 | expected:'B' | got:'B' | concept: 'clean oven'
4706 | expected:'C' | got:'B' | concept: 'clean oven'
4707 | expected:'B' | got:'B' | concept: 'clean oven'
4708 | expected:'B' | got:'C' | concept: 'operate microwave'
4709 | expected:'B' | got:'B' | concept: 'operate microwave'
4710 | expected:'A' | got:'B' | concept: 'operate microwave'
4711 | expected:'B' | got:'C' | concept: 'operate microwave'
4712 | expected:'C' | got:'C' | concept: 'clean microwave'
4713 | expected:'B' | got:'C' | concept: 'clean microwave'
4714 | expected:'B' | got:'B' | concept: 'clean microwave'
4715 | expected:'D' | got:'A' | concept: 'clean microwave'
4716 | expected:'B' | got:'B' | concept: 'open microwave'
4717 | expected:'B' | got:'A' | concept: 'open microwave'
4718 | expected:'A' | got:'C' | concept: 'open microwave'
4719 | expected:'D' | got:'B' | concept: 'open microwave'
4720 | expected:'A' | got:'A' | concept: 'hold cake'
4721 | expected:'C' | got:'A' | concept: 'hold cake'
4722 | expected:'B' | got:'A' | concept: 'hold cake'
4723 | expected:'C' | got:'C' | concept: 'hold cake'
4724 | expected:'D' | got:'A' | concept: 'hold wine_glass'
4725 | expected:'A' | got:'A' | concept: 'hold wine_glass'
4726 | expected:'A' | got:'A' | concept: 'hold wine_glass'
4727 | expected:'C' | got:'C' | concept: 'hold wine_glass'
4728 | expected:'D' | got:'A' | concept: 'hold banana'
4729 | expected:'C' | got:'C' | concept: 'hold banana'
4730 | expected:'A' | got:'A' | concept: 'hold banana'
4731 | expected:'B' | got:'B' | concept: 'hold banana'
4732 | expected:'D' | got:'D' | concept: 'hold knife'
4733 | expected:'B' | got:'B' | concept: 'hold knife'
4734 | expected:'D' | got:'D' | concept: 'hold knife'
4735 | expected:'D' | got:'D' | concept: 'hold knife'
4736 | expected:'A' | got:'A' | concept: 'walk dog'
4737 | expected:'B' | got:'B' | concept: 'walk dog'
4738 | expected:'A' | got:'A' | concept: 'walk dog'
4739 | expected:'A' | got:'A' | concept: 'walk dog'
4740 | expected:'C' | got:'C' | concept: 'walk horse'
4741 | expected:'D' | got:'C' | concept: 'walk horse'
4742 | expected:'A' | got:'A' | concept: 'walk horse'
4743 | expected:'D' | got:'A' | concept: 'walk horse'
4744 | expected:'C' | got:'C' | concept: 'hug dog'
4745 | expected:'A' | got:'A' | concept: 'hug dog'
4746 | expected:'A' | got:'A' | concept: 'hug dog'
4747 | expected:'A' | got:'A' | concept: 'hug dog'
4748 | expected:'C' | got:'C' | concept: 'walk bicycle'
4749 | expected:'D' | got:'A' | concept: 'walk bicycle'
4750 | expected:'A' | got:'A' | concept: 'walk bicycle'
4751 | expected:'B' | got:'B' | concept: 'walk bicycle'
4752 | expected:'B' | got:'B' | concept: 'kiss horse'
4753 | expected:'D' | got:'D' | concept: 'kiss horse'
4754 | expected:'D' | got:'D' | concept: 'kiss horse'
4755 | expected:'B' | got:'B' | concept: 'kiss horse'
4756 | expected:'A' | got:'A' | concept: 'kiss person'
4757 | expected:'A' | got:'C' | concept: 'kiss person'
4758 | expected:'A' | got:'A' | concept: 'kiss person'
4759 | expected:'D' | got:'D' | concept: 'kiss person'
4760 | expected:'C' | got:'D' | concept: 'hug person'
4761 | expected:'D' | got:'D' | concept: 'hug person'
4762 | expected:'D' | got:'D' | concept: 'hug person'
4763 | expected:'D' | got:'D' | concept: 'hug person'
4764 | expected:'A' | got:'A' | concept: 'kiss dog'
4765 | expected:'A' | got:'A' | concept: 'kiss dog'
4766 | expected:'D' | got:'D' | concept: 'kiss dog'
4767 | expected:'D' | got:'D' | concept: 'kiss dog'
4768 | expected:'C' | got:'C' | concept: 'kiss dog'
4769 | expected:'D' | got:'D' | concept: 'kiss dog'
4770 | expected:'C' | got:'C' | concept: 'kiss dog'
4771 | expected:'D' | got:'D' | concept: 'kiss dog'
4772 | expected:'B' | got:'B' | concept: 'train dog'
4773 | expected:'A' | got:'A' | concept: 'train dog'
4774 | expected:'C' | got:'C' | concept: 'train dog'
4775 | expected:'A' | got:'D' | concept: 'train dog'
4776 | expected:'B' | got:'D' | concept: 'walk dog'
4777 | expected:'C' | got:'D' | concept: 'walk dog'
4778 | expected:'B' | got:'B' | concept: 'walk dog'
4779 | expected:'B' | got:'B' | concept: 'walk dog'
4780 | expected:'A' | got:'A' | concept: 'pet dog'
4781 | expected:'D' | got:'B' | concept: 'pet dog'
4782 | expected:'D' | got:'D' | concept: 'pet dog'
4783 | expected:'A' | got:'A' | concept: 'pet dog'
4784 | expected:'C' | got:'C' | concept: 'eat apple'
4785 | expected:'C' | got:'C' | concept: 'eat apple'
4786 | expected:'C' | got:'C' | concept: 'eat apple'
4787 | expected:'C' | got:'C' | concept: 'eat apple'
4788 | expected:'A' | got:'A' | concept: 'eat pizza'
4789 | expected:'A' | got:'A' | concept: 'eat pizza'
4790 | expected:'C' | got:'C' | concept: 'eat pizza'
4791 | expected:'A' | got:'D' | concept: 'eat pizza'
4792 | expected:'B' | got:'B' | concept: 'eat hot_dog'
4793 | expected:'D' | got:'D' | concept: 'eat hot_dog'
4794 | expected:'A' | got:'D' | concept: 'eat hot_dog'
4795 | expected:'D' | got:'D' | concept: 'eat hot_dog'
4796 | expected:'B' | got:'B' | concept: 'eat donut'
4797 | expected:'A' | got:'A' | concept: 'eat donut'
4798 | expected:'D' | got:'D' | concept: 'eat donut'
4799 | expected:'A' | got:'A' | concept: 'eat donut'
4800 | expected:'C' | got:'C' | concept: 'ride motorcycle'
4801 | expected:'B' | got:'B' | concept: 'ride motorcycle'
4802 | expected:'B' | got:'B' | concept: 'ride motorcycle'
4803 | expected:'C' | got:'C' | concept: 'ride motorcycle'
4804 | expected:'B' | got:'D' | concept: 'straddle motorcycle'
4805 | expected:'C' | got:'C' | concept: 'straddle motorcycle'
4806 | expected:'C' | got:'C' | concept: 'straddle motorcycle'
4807 | expected:'B' | got:'B' | concept: 'straddle motorcycle'
4808 | expected:'A' | got:'B' | concept: 'turn motorcycle'
4809 | expected:'C' | got:'C' | concept: 'turn motorcycle'
4810 | expected:'B' | got:'D' | concept: 'turn motorcycle'
4811 | expected:'B' | got:'D' | concept: 'turn motorcycle'
4812 | expected:'A' | got:'B' | concept: 'push motorcycle'
4813 | expected:'C' | got:'C' | concept: 'push motorcycle'
4814 | expected:'A' | got:'A' | concept: 'push motorcycle'
4815 | expected:'A' | got:'D' | concept: 'push motorcycle'
4816 | expected:'C' | got:'C' | concept: 'pick apple'
4817 | expected:'B' | got:'B' | concept: 'pick apple'
4818 | expected:'C' | got:'C' | concept: 'pick apple'
4819 | expected:'B' | got:'B' | concept: 'pick apple'
4820 | expected:'D' | got:'B' | concept: 'eat apple'
4821 | expected:'D' | got:'D' | concept: 'eat apple'
4822 | expected:'C' | got:'C' | concept: 'eat apple'
4823 | expected:'B' | got:'D' | concept: 'eat apple'
4824 | expected:'A' | got:'A' | concept: 'hold_and_about_to_eat apple'
4825 | expected:'D' | got:'D' | concept: 'hold_and_about_to_eat apple'
4826 | expected:'A' | got:'A' | concept: 'hold_and_about_to_eat apple'
4827 | expected:'D' | got:'A' | concept: 'hold_and_about_to_eat apple'
4828 | expected:'D' | got:'B' | concept: 'peel_or_cut apple'
4829 | expected:'C' | got:'B' | concept: 'peel_or_cut apple'
4830 | expected:'A' | got:'A' | concept: 'peel_or_cut apple'
4831 | expected:'A' | got:'B' | concept: 'peel_or_cut apple'
4832 | expected:'D' | got:'D' | concept: 'peel_or_cut apple'
4833 | expected:'B' | got:'B' | concept: 'peel_or_cut apple'
4834 | expected:'A' | got:'A' | concept: 'peel_or_cut apple'
4835 | expected:'A' | got:'A' | concept: 'peel_or_cut apple'
4836 | expected:'D' | got:'D' | concept: 'hold_and_about_to_eat apple'
4837 | expected:'A' | got:'D' | concept: 'hold_and_about_to_eat apple'
4838 | expected:'D' | got:'D' | concept: 'hold_and_about_to_eat apple'
4839 | expected:'D' | got:'D' | concept: 'hold_and_about_to_eat apple'
4840 | expected:'B' | got:'D' | concept: 'eat apple'
4841 | expected:'C' | got:'C' | concept: 'eat apple'
4842 | expected:'B' | got:'C' | concept: 'eat apple'
4843 | expected:'D' | got:'A' | concept: 'eat apple'
4844 | expected:'D' | got:'D' | concept: 'pick apple'
4845 | expected:'B' | got:'B' | concept: 'pick apple'
4846 | expected:'A' | got:'A' | concept: 'pick apple'
4847 | expected:'D' | got:'A' | concept: 'pick apple'
4848 | expected:'A' | got:'C' | concept: 'lie_on bed'
4849 | expected:'A' | got:'A' | concept: 'lie_on bed'
4850 | expected:'A' | got:'A' | concept: 'lie_on bed'
4851 | expected:'B' | got:'B' | concept: 'lie_on bed'
4852 | expected:'D' | got:'C' | concept: 'lie_on couch'
4853 | expected:'A' | got:'A' | concept: 'lie_on couch'
4854 | expected:'C' | got:'C' | concept: 'lie_on couch'
4855 | expected:'D' | got:'C' | concept: 'lie_on couch'
4856 | expected:'C' | got:'C' | concept: 'lie_on bench'
4857 | expected:'C' | got:'C' | concept: 'lie_on bench'
4858 | expected:'B' | got:'B' | concept: 'lie_on bench'
4859 | expected:'C' | got:'B' | concept: 'lie_on bench'
4860 | expected:'D' | got:'C' | concept: 'sit_on bed'
4861 | expected:'D' | got:'D' | concept: 'sit_on bed'
4862 | expected:'D' | got:'B' | concept: 'sit_on bed'
4863 | expected:'D' | got:'D' | concept: 'sit_on bed'
4864 | expected:'B' | got:'B' | concept: 'stand_on chair'
4865 | expected:'B' | got:'B' | concept: 'stand_on chair'
4866 | expected:'A' | got:'D' | concept: 'stand_on chair'
4867 | expected:'D' | got:'A' | concept: 'stand_on chair'
4868 | expected:'A' | got:'A' | concept: 'stand_on boat'
4869 | expected:'C' | got:'C' | concept: 'stand_on boat'
4870 | expected:'C' | got:'C' | concept: 'stand_on boat'
4871 | expected:'D' | got:'D' | concept: 'stand_on boat'
4872 | expected:'A' | got:'A' | concept: 'sit_on chair'
4873 | expected:'A' | got:'A' | concept: 'sit_on chair'
4874 | expected:'D' | got:'D' | concept: 'sit_on chair'
4875 | expected:'B' | got:'B' | concept: 'sit_on chair'
4876 | expected:'D' | got:'D' | concept: 'lie_on_like chair'
4877 | expected:'D' | got:'A' | concept: 'lie_on_like chair'
4878 | expected:'C' | got:'C' | concept: 'lie_on_like chair'
4879 | expected:'A' | got:'D' | concept: 'lie_on_like chair'
4880 | expected:'D' | got:'D' | concept: 'sit_on bed'
4881 | expected:'A' | got:'A' | concept: 'sit_on bed'
4882 | expected:'C' | got:'C' | concept: 'sit_on bed'
4883 | expected:'A' | got:'A' | concept: 'sit_on bed'
4884 | expected:'B' | got:'B' | concept: 'ride skateboard'
4885 | expected:'B' | got:'B' | concept: 'ride skateboard'
4886 | expected:'D' | got:'D' | concept: 'ride skateboard'
4887 | expected:'C' | got:'C' | concept: 'ride skateboard'
4888 | expected:'A' | got:'A' | concept: 'sit_on skateboard'
4889 | expected:'B' | got:'A' | concept: 'sit_on skateboard'
4890 | expected:'A' | got:'A' | concept: 'sit_on skateboard'
4891 | expected:'B' | got:'B' | concept: 'sit_on skateboard'
4892 | expected:'C' | got:'C' | concept: 'sit_on chair'
4893 | expected:'A' | got:'A' | concept: 'sit_on chair'
4894 | expected:'D' | got:'D' | concept: 'sit_on chair'
4895 | expected:'C' | got:'C' | concept: 'sit_on chair'
4896 | expected:'D' | got:'D' | concept: 'hold kite'
4897 | expected:'A' | got:'A' | concept: 'hold kite'
4898 | expected:'C' | got:'C' | concept: 'hold kite'
4899 | expected:'D' | got:'D' | concept: 'hold kite'
4900 | expected:'B' | got:'B' | concept: 'hug dog'
4901 | expected:'A' | got:'A' | concept: 'hug dog'
4902 | expected:'A' | got:'B' | concept: 'hug dog'
4903 | expected:'B' | got:'B' | concept: 'hug dog'
4904 | expected:'A' | got:'A' | concept: 'hold toothbrush'
4905 | expected:'D' | got:'B' | concept: 'hold toothbrush'
4906 | expected:'A' | got:'A' | concept: 'hold toothbrush'
4907 | expected:'D' | got:'D' | concept: 'hold toothbrush'
4908 | expected:'A' | got:'A' | concept: 'hold dog'
4909 | expected:'A' | got:'C' | concept: 'hold dog'
4910 | expected:'C' | got:'D' | concept: 'hold dog'
4911 | expected:'D' | got:'C' | concept: 'hold dog'
4912 | expected:'A' | got:'A' | concept: 'repair bicycle'
4913 | expected:'B' | got:'B' | concept: 'repair bicycle'
4914 | expected:'B' | got:'B' | concept: 'repair bicycle'
4915 | expected:'D' | got:'A' | concept: 'repair bicycle'
4916 | expected:'A' | got:'A' | concept: 'sit_on truck'
4917 | expected:'A' | got:'A' | concept: 'sit_on truck'
4918 | expected:'D' | got:'D' | concept: 'sit_on truck'
4919 | expected:'D' | got:'D' | concept: 'sit_on truck'
4920 | expected:'D' | got:'A' | concept: 'load truck'
4921 | expected:'D' | got:'B' | concept: 'load truck'
4922 | expected:'D' | got:'D' | concept: 'load truck'
4923 | expected:'B' | got:'B' | concept: 'load truck'
4924 | expected:'B' | got:'B' | concept: 'repair truck'
4925 | expected:'D' | got:'D' | concept: 'repair truck'
4926 | expected:'B' | got:'B' | concept: 'repair truck'
4927 | expected:'A' | got:'A' | concept: 'repair truck'
4928 | expected:'B' | got:'B' | concept: 'clean keyboard'
4929 | expected:'C' | got:'C' | concept: 'clean keyboard'
4930 | expected:'A' | got:'A' | concept: 'clean keyboard'
4931 | expected:'D' | got:'D' | concept: 'clean keyboard'
4932 | expected:'D' | got:'D' | concept: 'clean oven'
4933 | expected:'A' | got:'A' | concept: 'clean oven'
4934 | expected:'A' | got:'A' | concept: 'clean oven'
4935 | expected:'A' | got:'A' | concept: 'clean oven'
4936 | expected:'D' | got:'D' | concept: 'clean toilet'
4937 | expected:'B' | got:'B' | concept: 'clean toilet'
4938 | expected:'A' | got:'A' | concept: 'clean toilet'
4939 | expected:'D' | got:'D' | concept: 'clean toilet'
4940 | expected:'B' | got:'B' | concept: 'clean microwave'
4941 | expected:'C' | got:'C' | concept: 'clean microwave'
4942 | expected:'A' | got:'A' | concept: 'clean microwave'
4943 | expected:'A' | got:'A' | concept: 'clean microwave'
4944 | expected:'A' | got:'A' | concept: 'jump horse'
4945 | expected:'B' | got:'B' | concept: 'jump horse'
4946 | expected:'C' | got:'C' | concept: 'jump horse'
4947 | expected:'D' | got:'D' | concept: 'jump horse'
4948 | expected:'D' | got:'D' | concept: 'hug horse'
4949 | expected:'A' | got:'C' | concept: 'hug horse'
4950 | expected:'C' | got:'C' | concept: 'hug horse'
4951 | expected:'C' | got:'A' | concept: 'hug horse'
4952 | expected:'D' | got:'D' | concept: 'kiss horse'
4953 | expected:'C' | got:'C' | concept: 'kiss horse'
4954 | expected:'A' | got:'D' | concept: 'kiss horse'
4955 | expected:'D' | got:'D' | concept: 'kiss horse'
4956 | expected:'B' | got:'B' | concept: 'feed horse'
4957 | expected:'A' | got:'C' | concept: 'feed horse'
4958 | expected:'A' | got:'A' | concept: 'feed horse'
4959 | expected:'A' | got:'A' | concept: 'feed horse'
4960 | expected:'C' | got:'C' | concept: 'wash motorcycle'
4961 | expected:'B' | got:'B' | concept: 'wash motorcycle'
4962 | expected:'D' | got:'D' | concept: 'wash motorcycle'
4963 | expected:'B' | got:'B' | concept: 'wash motorcycle'
4964 | expected:'A' | got:'A' | concept: 'jump motorcycle'
4965 | expected:'A' | got:'A' | concept: 'jump motorcycle'
4966 | expected:'C' | got:'C' | concept: 'jump motorcycle'
4967 | expected:'C' | got:'C' | concept: 'jump motorcycle'
4968 | expected:'C' | got:'C' | concept: 'jump snowboard'
4969 | expected:'D' | got:'C' | concept: 'jump snowboard'
4970 | expected:'B' | got:'B' | concept: 'jump snowboard'
4971 | expected:'A' | got:'A' | concept: 'jump snowboard'
4972 | expected:'D' | got:'D' | concept: 'jump skateboard'
4973 | expected:'D' | got:'D' | concept: 'jump skateboard'
4974 | expected:'B' | got:'B' | concept: 'jump skateboard'
4975 | expected:'D' | got:'D' | concept: 'jump skateboard'
4976 | expected:'D' | got:'A' | concept: 'adjust_or_tie tie'
4977 | expected:'B' | got:'B' | concept: 'adjust_or_tie tie'
4978 | expected:'B' | got:'B' | concept: 'adjust_or_tie tie'
4979 | expected:'A' | got:'A' | concept: 'adjust_or_tie tie'
4980 | expected:'D' | got:'D' | concept: 'block sports_ball'
4981 | expected:'B' | got:'B' | concept: 'block sports_ball'
4982 | expected:'C' | got:'C' | concept: 'block sports_ball'
4983 | expected:'B' | got:'B' | concept: 'block sports_ball'
4984 | expected:'B' | got:'D' | concept: 'wear tie'
4985 | expected:'B' | got:'A' | concept: 'wear tie'
4986 | expected:'A' | got:'B' | concept: 'wear tie'
4987 | expected:'D' | got:'D' | concept: 'wear tie'
4988 | expected:'D' | got:'A' | concept: 'wear backpack'
4989 | expected:'A' | got:'A' | concept: 'wear backpack'
4990 | expected:'D' | got:'D' | concept: 'wear backpack'
4991 | expected:'A' | got:'A' | concept: 'wear backpack'
4992 | expected:'B' | got:'B' | concept: 'repair bicycle'
4993 | expected:'A' | got:'A' | concept: 'repair bicycle'
4994 | expected:'C' | got:'A' | concept: 'repair bicycle'
4995 | expected:'C' | got:'C' | concept: 'repair bicycle'
4996 | expected:'D' | got:'D' | concept: 'sit_on truck'
4997 | expected:'A' | got:'A' | concept: 'sit_on truck'
4998 | expected:'A' | got:'A' | concept: 'sit_on truck'
4999 | expected:'B' | got:'B' | concept: 'sit_on truck'
5000 | expected:'B' | got:'B' | concept: 'load truck'
5001 | expected:'B' | got:'B' | concept: 'load truck'
5002 | expected:'B' | got:'D' | concept: 'load truck'
5003 | expected:'A' | got:'A' | concept: 'load truck'
5004 | expected:'D' | got:'A' | concept: 'repair truck'
5005 | expected:'D' | got:'D' | concept: 'repair truck'
5006 | expected:'B' | got:'B' | concept: 'repair truck'
5007 | expected:'D' | got:'D' | concept: 'repair truck'
5008 | expected:'C' | got:'C' | concept: 'walk bicycle'
5009 | expected:'C' | got:'C' | concept: 'walk bicycle'
5010 | expected:'A' | got:'A' | concept: 'walk bicycle'
5011 | expected:'C' | got:'C' | concept: 'walk bicycle'
5012 | expected:'C' | got:'C' | concept: 'repair bicycle'
5013 | expected:'B' | got:'B' | concept: 'repair bicycle'
5014 | expected:'D' | got:'D' | concept: 'repair bicycle'
5015 | expected:'D' | got:'D' | concept: 'repair bicycle'
5016 | expected:'B' | got:'B' | concept: 'walk horse'
5017 | expected:'B' | got:'B' | concept: 'walk horse'
5018 | expected:'B' | got:'B' | concept: 'walk horse'
5019 | expected:'B' | got:'B' | concept: 'walk horse'
5020 | expected:'A' | got:'A' | concept: 'walk dog'
5021 | expected:'C' | got:'C' | concept: 'walk dog'
5022 | expected:'A' | got:'A' | concept: 'walk dog'
5023 | expected:'B' | got:'B' | concept: 'walk dog'
5024 | expected:'A' | got:'A' | concept: 'sit_on couch'
5025 | expected:'B' | got:'B' | concept: 'sit_on couch'
5026 | expected:'B' | got:'B' | concept: 'sit_on couch'
5027 | expected:'B' | got:'B' | concept: 'sit_on couch'
5028 | expected:'D' | got:'D' | concept: 'sit_on skateboard'
5029 | expected:'B' | got:'B' | concept: 'sit_on skateboard'
5030 | expected:'A' | got:'A' | concept: 'sit_on skateboard'
5031 | expected:'D' | got:'D' | concept: 'sit_on skateboard'
5032 | expected:'C' | got:'C' | concept: 'sit_on motorcycle'
5033 | expected:'B' | got:'B' | concept: 'sit_on motorcycle'
5034 | expected:'A' | got:'A' | concept: 'sit_on motorcycle'
5035 | expected:'A' | got:'A' | concept: 'sit_on motorcycle'
5036 | expected:'C' | got:'C' | concept: 'sit_on bench'
5037 | expected:'C' | got:'C' | concept: 'sit_on bench'
5038 | expected:'A' | got:'A' | concept: 'sit_on bench'
5039 | expected:'B' | got:'B' | concept: 'sit_on bench'
5040 | expected:'B' | got:'B' | concept: 'lie_on bench'
5041 | expected:'C' | got:'B' | concept: 'lie_on bench'
5042 | expected:'A' | got:'A' | concept: 'lie_on bench'
5043 | expected:'C' | got:'B' | concept: 'lie_on bench'
5044 | expected:'D' | got:'C' | concept: 'lie_on couch'
5045 | expected:'D' | got:'C' | concept: 'lie_on couch'
5046 | expected:'A' | got:'A' | concept: 'lie_on couch'
5047 | expected:'A' | got:'A' | concept: 'lie_on couch'
5048 | expected:'C' | got:'D' | concept: 'sit_on bed'
5049 | expected:'D' | got:'D' | concept: 'sit_on bed'
5050 | expected:'B' | got:'B' | concept: 'sit_on bed'
5051 | expected:'C' | got:'C' | concept: 'sit_on bed'
5052 | expected:'C' | got:'C' | concept: 'lie_on bed'
5053 | expected:'C' | got:'C' | concept: 'lie_on bed'
5054 | expected:'C' | got:'C' | concept: 'lie_on bed'
5055 | expected:'C' | got:'C' | concept: 'lie_on bed'
5056 | expected:'B' | got:'B' | concept: 'hold toothbrush'
5057 | expected:'A' | got:'A' | concept: 'hold toothbrush'
5058 | expected:'B' | got:'B' | concept: 'hold toothbrush'
5059 | expected:'D' | got:'D' | concept: 'hold toothbrush'
5060 | expected:'D' | got:'C' | concept: 'hold cell_phone'
5061 | expected:'A' | got:'A' | concept: 'hold cell_phone'
5062 | expected:'A' | got:'A' | concept: 'hold cell_phone'
5063 | expected:'D' | got:'D' | concept: 'hold cell_phone'
5064 | expected:'B' | got:'B' | concept: 'hold remote'
5065 | expected:'C' | got:'C' | concept: 'hold remote'
5066 | expected:'D' | got:'D' | concept: 'hold remote'
5067 | expected:'B' | got:'B' | concept: 'hold remote'
5068 | expected:'B' | got:'B' | concept: 'hold banana'
5069 | expected:'B' | got:'B' | concept: 'hold banana'
5070 | expected:'C' | got:'C' | concept: 'hold banana'
5071 | expected:'C' | got:'C' | concept: 'hold banana'
5072 | expected:'D' | got:'D' | concept: 'hug person'
5073 | expected:'B' | got:'C' | concept: 'hug person'
5074 | expected:'A' | got:'D' | concept: 'hug person'
5075 | expected:'A' | got:'C' | concept: 'hug person'
5076 | expected:'B' | got:'B' | concept: 'kiss person'
5077 | expected:'A' | got:'A' | concept: 'kiss person'
5078 | expected:'B' | got:'B' | concept: 'kiss person'
5079 | expected:'A' | got:'A' | concept: 'kiss person'
5080 | expected:'B' | got:'B' | concept: 'kiss horse'
5081 | expected:'C' | got:'C' | concept: 'kiss horse'
5082 | expected:'C' | got:'C' | concept: 'kiss horse'
5083 | expected:'C' | got:'C' | concept: 'kiss horse'
5084 | expected:'C' | got:'C' | concept: 'greet person'
5085 | expected:'A' | got:'A' | concept: 'greet person'
5086 | expected:'D' | got:'D' | concept: 'greet person'
5087 | expected:'C' | got:'C' | concept: 'greet person'
5088 | expected:'B' | got:'B' | concept: 'carry handbag'
5089 | expected:'A' | got:'A' | concept: 'carry handbag'
5090 | expected:'D' | got:'A' | concept: 'carry handbag'
5091 | expected:'B' | got:'A' | concept: 'carry handbag'
5092 | expected:'D' | got:'D' | concept: 'carry suitcase'
5093 | expected:'D' | got:'D' | concept: 'carry suitcase'
5094 | expected:'D' | got:'D' | concept: 'carry suitcase'
5095 | expected:'A' | got:'A' | concept: 'carry suitcase'
5096 | expected:'A' | got:'A' | concept: 'carry surfboard'
5097 | expected:'A' | got:'A' | concept: 'carry surfboard'
5098 | expected:'B' | got:'B' | concept: 'carry surfboard'
5099 | expected:'B' | got:'A' | concept: 'carry surfboard'
5100 | expected:'A' | got:'D' | concept: 'drag suitcase'
5101 | expected:'C' | got:'C' | concept: 'drag suitcase'
5102 | expected:'C' | got:'C' | concept: 'drag suitcase'
5103 | expected:'A' | got:'D' | concept: 'drag suitcase'
5104 | expected:'C' | got:'C' | concept: 'cut pizza'
5105 | expected:'C' | got:'C' | concept: 'cut pizza'
5106 | expected:'C' | got:'C' | concept: 'cut pizza'
5107 | expected:'C' | got:'C' | concept: 'cut pizza'
5108 | expected:'B' | got:'D' | concept: 'hold pizza'
5109 | expected:'B' | got:'C' | concept: 'hold pizza'
5110 | expected:'C' | got:'B' | concept: 'hold pizza'
5111 | expected:'D' | got:'A' | concept: 'hold pizza'
5112 | expected:'A' | got:'A' | concept: 'eat pizza'
5113 | expected:'D' | got:'D' | concept: 'eat pizza'
5114 | expected:'D' | got:'D' | concept: 'eat pizza'
5115 | expected:'A' | got:'A' | concept: 'eat pizza'
5116 | expected:'B' | got:'B' | concept: 'cut cake'
5117 | expected:'B' | got:'B' | concept: 'cut cake'
5118 | expected:'B' | got:'B' | concept: 'cut cake'
5119 | expected:'B' | got:'B' | concept: 'cut cake'
5120 | expected:'A' | got:'A' | concept: 'hold handbag'
5121 | expected:'A' | got:'A' | concept: 'hold handbag'
5122 | expected:'B' | got:'B' | concept: 'hold handbag'
5123 | expected:'D' | got:'A' | concept: 'hold handbag'
5124 | expected:'A' | got:'A' | concept: 'hold bottle'
5125 | expected:'C' | got:'C' | concept: 'hold bottle'
5126 | expected:'B' | got:'B' | concept: 'hold bottle'
5127 | expected:'B' | got:'A' | concept: 'hold bottle'
5128 | expected:'B' | got:'B' | concept: 'hold toothbrush'
5129 | expected:'D' | got:'D' | concept: 'hold toothbrush'
5130 | expected:'D' | got:'B' | concept: 'hold toothbrush'
5131 | expected:'B' | got:'B' | concept: 'hold toothbrush'
5132 | expected:'A' | got:'A' | concept: 'hold orange'
5133 | expected:'A' | got:'A' | concept: 'hold orange'
5134 | expected:'D' | got:'A' | concept: 'hold orange'
5135 | expected:'A' | got:'A' | concept: 'hold orange'
5136 | expected:'A' | got:'A' | concept: 'greet person'
5137 | expected:'C' | got:'C' | concept: 'greet person'
5138 | expected:'D' | got:'D' | concept: 'greet person'
5139 | expected:'C' | got:'C' | concept: 'greet person'
5140 | expected:'A' | got:'A' | concept: 'kiss dog'
5141 | expected:'D' | got:'D' | concept: 'kiss dog'
5142 | expected:'C' | got:'C' | concept: 'kiss dog'
5143 | expected:'B' | got:'B' | concept: 'kiss dog'
5144 | expected:'A' | got:'A' | concept: 'kiss horse'
5145 | expected:'C' | got:'C' | concept: 'kiss horse'
5146 | expected:'B' | got:'B' | concept: 'kiss horse'
5147 | expected:'C' | got:'C' | concept: 'kiss horse'
5148 | expected:'C' | got:'C' | concept: 'kiss person'
5149 | expected:'B' | got:'B' | concept: 'kiss person'
5150 | expected:'A' | got:'A' | concept: 'kiss person'
5151 | expected:'C' | got:'C' | concept: 'kiss person'
5152 | expected:'C' | got:'C' | concept: 'hold mouse'
5153 | expected:'C' | got:'C' | concept: 'hold mouse'
5154 | expected:'B' | got:'B' | concept: 'hold mouse'
5155 | expected:'A' | got:'A' | concept: 'hold mouse'
5156 | expected:'C' | got:'C' | concept: 'hold handbag'
5157 | expected:'A' | got:'A' | concept: 'hold handbag'
5158 | expected:'A' | got:'A' | concept: 'hold handbag'
5159 | expected:'C' | got:'C' | concept: 'hold handbag'
5160 | expected:'B' | got:'B' | concept: 'hold knife'
5161 | expected:'A' | got:'A' | concept: 'hold knife'
5162 | expected:'A' | got:'A' | concept: 'hold knife'
5163 | expected:'B' | got:'B' | concept: 'hold knife'
5164 | expected:'B' | got:'B' | concept: 'hold orange'
5165 | expected:'C' | got:'A' | concept: 'hold orange'
5166 | expected:'A' | got:'A' | concept: 'hold orange'
5167 | expected:'B' | got:'B' | concept: 'hold orange'
5168 | expected:'A' | got:'A' | concept: 'hold handbag'
5169 | expected:'B' | got:'B' | concept: 'hold handbag'
5170 | expected:'D' | got:'A' | concept: 'hold handbag'
5171 | expected:'A' | got:'A' | concept: 'hold handbag'
5172 | expected:'C' | got:'C' | concept: 'hold dog'
5173 | expected:'D' | got:'D' | concept: 'hold dog'
5174 | expected:'D' | got:'D' | concept: 'hold dog'
5175 | expected:'C' | got:'C' | concept: 'hold dog'
5176 | expected:'C' | got:'C' | concept: 'hold kite'
5177 | expected:'A' | got:'A' | concept: 'hold kite'
5178 | expected:'B' | got:'B' | concept: 'hold kite'
5179 | expected:'A' | got:'A' | concept: 'hold kite'
5180 | expected:'A' | got:'A' | concept: 'hold bottle'
5181 | expected:'C' | got:'C' | concept: 'hold bottle'
5182 | expected:'B' | got:'B' | concept: 'hold bottle'
5183 | expected:'B' | got:'B' | concept: 'hold bottle'
5184 | expected:'D' | got:'D' | concept: 'grind skateboard'
5185 | expected:'A' | got:'A' | concept: 'grind skateboard'
5186 | expected:'B' | got:'B' | concept: 'grind skateboard'
5187 | expected:'A' | got:'A' | concept: 'grind skateboard'
5188 | expected:'A' | got:'D' | concept: 'grind snowboard'
5189 | expected:'B' | got:'B' | concept: 'grind snowboard'
5190 | expected:'A' | got:'B' | concept: 'grind snowboard'
5191 | expected:'D' | got:'C' | concept: 'grind snowboard'
5192 | expected:'B' | got:'B' | concept: 'ride snowboard'
5193 | expected:'B' | got:'B' | concept: 'ride snowboard'
5194 | expected:'B' | got:'C' | concept: 'ride snowboard'
5195 | expected:'C' | got:'C' | concept: 'ride snowboard'
5196 | expected:'C' | got:'C' | concept: 'jump snowboard'
5197 | expected:'B' | got:'B' | concept: 'jump snowboard'
5198 | expected:'C' | got:'C' | concept: 'jump snowboard'
5199 | expected:'C' | got:'C' | concept: 'jump snowboard'
5200 | expected:'D' | got:'D' | concept: 'hold donut'
5201 | expected:'B' | got:'A' | concept: 'hold donut'
5202 | expected:'D' | got:'D' | concept: 'hold donut'
5203 | expected:'B' | got:'B' | concept: 'hold donut'
5204 | expected:'C' | got:'C' | concept: 'hold sandwich'
5205 | expected:'D' | got:'D' | concept: 'hold sandwich'
5206 | expected:'C' | got:'C' | concept: 'hold sandwich'
5207 | expected:'A' | got:'A' | concept: 'hold sandwich'
5208 | expected:'A' | got:'A' | concept: 'hold cell_phone'
5209 | expected:'C' | got:'C' | concept: 'hold cell_phone'
5210 | expected:'D' | got:'C' | concept: 'hold cell_phone'
5211 | expected:'C' | got:'C' | concept: 'hold cell_phone'
5212 | expected:'D' | got:'B' | concept: 'hold bottle'
5213 | expected:'D' | got:'D' | concept: 'hold bottle'
5214 | expected:'B' | got:'B' | concept: 'hold bottle'
5215 | expected:'A' | got:'A' | concept: 'hold bottle'
5216 | expected:'A' | got:'A' | concept: 'jump snowboard'
5217 | expected:'D' | got:'D' | concept: 'jump snowboard'
5218 | expected:'B' | got:'B' | concept: 'jump snowboard'
5219 | expected:'C' | got:'C' | concept: 'jump snowboard'
5220 | expected:'B' | got:'B' | concept: 'jump horse'
5221 | expected:'C' | got:'C' | concept: 'jump horse'
5222 | expected:'C' | got:'C' | concept: 'jump horse'
5223 | expected:'B' | got:'B' | concept: 'jump horse'
5224 | expected:'B' | got:'B' | concept: 'jump motorcycle'
5225 | expected:'D' | got:'D' | concept: 'jump motorcycle'
5226 | expected:'B' | got:'B' | concept: 'jump motorcycle'
5227 | expected:'C' | got:'C' | concept: 'jump motorcycle'
5228 | expected:'B' | got:'B' | concept: 'jump skateboard'
5229 | expected:'B' | got:'B' | concept: 'jump skateboard'
5230 | expected:'D' | got:'D' | concept: 'jump skateboard'
5231 | expected:'A' | got:'A' | concept: 'jump skateboard'
5232 | expected:'A' | got:'A' | concept: 'adjust_or_tie tie'
5233 | expected:'A' | got:'A' | concept: 'adjust_or_tie tie'
5234 | expected:'C' | got:'C' | concept: 'adjust_or_tie tie'
5235 | expected:'B' | got:'B' | concept: 'adjust_or_tie tie'
5236 | expected:'A' | got:'A' | concept: 'wear backpack'
5237 | expected:'D' | got:'D' | concept: 'wear backpack'
5238 | expected:'B' | got:'B' | concept: 'wear backpack'
5239 | expected:'B' | got:'B' | concept: 'wear backpack'
5240 | expected:'B' | got:'B' | concept: 'row boat'
5241 | expected:'C' | got:'C' | concept: 'row boat'
5242 | expected:'D' | got:'A' | concept: 'row boat'
5243 | expected:'B' | got:'A' | concept: 'row boat'
5244 | expected:'B' | got:'D' | concept: 'wear tie'
5245 | expected:'A' | got:'D' | concept: 'wear tie'
5246 | expected:'A' | got:'D' | concept: 'wear tie'
5247 | expected:'C' | got:'C' | concept: 'wear tie'
5248 | expected:'A' | got:'A' | concept: 'clean keyboard'
5249 | expected:'D' | got:'D' | concept: 'clean keyboard'
5250 | expected:'C' | got:'C' | concept: 'clean keyboard'
5251 | expected:'D' | got:'D' | concept: 'clean keyboard'
5252 | expected:'B' | got:'B' | concept: 'clean oven'
5253 | expected:'A' | got:'D' | concept: 'clean oven'
5254 | expected:'C' | got:'C' | concept: 'clean oven'
5255 | expected:'C' | got:'C' | concept: 'clean oven'
5256 | expected:'D' | got:'D' | concept: 'clean microwave'
5257 | expected:'C' | got:'C' | concept: 'clean microwave'
5258 | expected:'C' | got:'C' | concept: 'clean microwave'
5259 | expected:'D' | got:'A' | concept: 'clean microwave'
5260 | expected:'A' | got:'A' | concept: 'clean refrigerator'
5261 | expected:'D' | got:'D' | concept: 'clean refrigerator'
5262 | expected:'B' | got:'B' | concept: 'clean refrigerator'
5263 | expected:'B' | got:'B' | concept: 'clean refrigerator'
5264 | expected:'C' | got:'C' | concept: 'cut_with knife'
5265 | expected:'C' | got:'C' | concept: 'cut_with knife'
5266 | expected:'C' | got:'A' | concept: 'cut_with knife'
5267 | expected:'D' | got:'C' | concept: 'cut_with knife'
5268 | expected:'B' | got:'B' | concept: 'cut_with scissors'
5269 | expected:'A' | got:'B' | concept: 'cut_with scissors'
5270 | expected:'B' | got:'C' | concept: 'cut_with scissors'
5271 | expected:'B' | got:'C' | concept: 'cut_with scissors'
5272 | expected:'C' | got:'C' | concept: 'hold knife'
5273 | expected:'A' | got:'D' | concept: 'hold knife'
5274 | expected:'C' | got:'B' | concept: 'hold knife'
5275 | expected:'A' | got:'D' | concept: 'hold knife'
5276 | expected:'D' | got:'A' | concept: 'hold scissors'
5277 | expected:'A' | got:'D' | concept: 'hold scissors'
5278 | expected:'C' | got:'A' | concept: 'hold scissors'
5279 | expected:'B' | got:'B' | concept: 'hold scissors'
5280 | expected:'D' | got:'D' | concept: 'sit_on motorcycle'
5281 | expected:'A' | got:'A' | concept: 'sit_on motorcycle'
5282 | expected:'C' | got:'C' | concept: 'sit_on motorcycle'
5283 | expected:'D' | got:'A' | concept: 'sit_on motorcycle'
5284 | expected:'D' | got:'D' | concept: 'inspect motorcycle'
5285 | expected:'C' | got:'C' | concept: 'inspect motorcycle'
5286 | expected:'A' | got:'A' | concept: 'inspect motorcycle'
5287 | expected:'A' | got:'A' | concept: 'inspect motorcycle'
5288 | expected:'C' | got:'C' | concept: 'ride motorcycle'
5289 | expected:'C' | got:'C' | concept: 'ride motorcycle'
5290 | expected:'A' | got:'C' | concept: 'ride motorcycle'
5291 | expected:'C' | got:'C' | concept: 'ride motorcycle'
5292 | expected:'D' | got:'D' | concept: 'sit_on chair'
5293 | expected:'C' | got:'C' | concept: 'sit_on chair'
5294 | expected:'C' | got:'C' | concept: 'sit_on chair'
5295 | expected:'D' | got:'D' | concept: 'sit_on chair'
5296 | expected:'D' | got:'A' | concept: 'hold apple'
5297 | expected:'D' | got:'A' | concept: 'hold apple'
5298 | expected:'C' | got:'C' | concept: 'hold apple'
5299 | expected:'A' | got:'A' | concept: 'hold apple'
5300 | expected:'D' | got:'D' | concept: 'hold toothbrush'
5301 | expected:'B' | got:'B' | concept: 'hold toothbrush'
5302 | expected:'A' | got:'C' | concept: 'hold toothbrush'
5303 | expected:'A' | got:'A' | concept: 'hold toothbrush'
5304 | expected:'A' | got:'B' | concept: 'hold cake'
5305 | expected:'D' | got:'D' | concept: 'hold cake'
5306 | expected:'D' | got:'D' | concept: 'hold cake'
5307 | expected:'C' | got:'C' | concept: 'hold cake'
5308 | expected:'D' | got:'C' | concept: 'hold scissors'
5309 | expected:'D' | got:'B' | concept: 'hold scissors'
5310 | expected:'C' | got:'D' | concept: 'hold scissors'
5311 | expected:'B' | got:'C' | concept: 'hold scissors'
5312 | expected:'D' | got:'D' | concept: 'hold laptop'
5313 | expected:'D' | got:'D' | concept: 'hold laptop'
5314 | expected:'D' | got:'D' | concept: 'hold laptop'
5315 | expected:'A' | got:'A' | concept: 'hold laptop'
5316 | expected:'D' | got:'D' | concept: 'hold remote'
5317 | expected:'B' | got:'B' | concept: 'hold remote'
5318 | expected:'D' | got:'D' | concept: 'hold remote'
5319 | expected:'C' | got:'C' | concept: 'hold remote'
5320 | expected:'A' | got:'B' | concept: 'hold spoon'
5321 | expected:'D' | got:'D' | concept: 'hold spoon'
5322 | expected:'C' | got:'C' | concept: 'hold spoon'
5323 | expected:'C' | got:'A' | concept: 'hold spoon'
5324 | expected:'D' | got:'D' | concept: 'hold tennis_racket'
5325 | expected:'B' | got:'B' | concept: 'hold tennis_racket'
5326 | expected:'C' | got:'C' | concept: 'hold tennis_racket'
5327 | expected:'A' | got:'A' | concept: 'hold tennis_racket'
5328 | expected:'D' | got:'D' | concept: 'hold skateboard'
5329 | expected:'B' | got:'B' | concept: 'hold skateboard'
5330 | expected:'A' | got:'A' | concept: 'hold skateboard'
5331 | expected:'D' | got:'D' | concept: 'hold skateboard'
5332 | expected:'B' | got:'B' | concept: 'sit_on motorcycle'
5333 | expected:'B' | got:'B' | concept: 'sit_on motorcycle'
5334 | expected:'A' | got:'A' | concept: 'sit_on motorcycle'
5335 | expected:'B' | got:'B' | concept: 'sit_on motorcycle'
5336 | expected:'B' | got:'B' | concept: 'sit_on bed'
5337 | expected:'D' | got:'D' | concept: 'sit_on bed'
5338 | expected:'D' | got:'D' | concept: 'sit_on bed'
5339 | expected:'D' | got:'D' | concept: 'sit_on bed'
5340 | expected:'D' | got:'D' | concept: 'sit_on skateboard'
5341 | expected:'A' | got:'A' | concept: 'sit_on skateboard'
5342 | expected:'A' | got:'A' | concept: 'sit_on skateboard'
5343 | expected:'A' | got:'A' | concept: 'sit_on skateboard'
5344 | expected:'C' | got:'A' | concept: 'point_at_camera remote'
5345 | expected:'C' | got:'D' | concept: 'point_at_camera remote'
5346 | expected:'A' | got:'C' | concept: 'point_at_camera remote'
5347 | expected:'A' | got:'B' | concept: 'point_at_camera remote'
5348 | expected:'A' | got:'A' | concept: 'hold remote'
5349 | expected:'B' | got:'B' | concept: 'hold remote'
5350 | expected:'A' | got:'A' | concept: 'hold remote'
5351 | expected:'C' | got:'C' | concept: 'hold remote'
5352 | expected:'A' | got:'A' | concept: 'hold apple'
5353 | expected:'A' | got:'A' | concept: 'hold apple'
5354 | expected:'C' | got:'C' | concept: 'hold apple'
5355 | expected:'A' | got:'A' | concept: 'hold apple'
5356 | expected:'B' | got:'B' | concept: 'hold cell_phone'
5357 | expected:'B' | got:'B' | concept: 'hold cell_phone'
5358 | expected:'B' | got:'B' | concept: 'hold cell_phone'
5359 | expected:'D' | got:'C' | concept: 'hold cell_phone'
5360 | expected:'D' | got:'D' | concept: 'ride horse'
5361 | expected:'D' | got:'D' | concept: 'ride horse'
5362 | expected:'B' | got:'B' | concept: 'ride horse'
5363 | expected:'C' | got:'C' | concept: 'ride horse'
5364 | expected:'B' | got:'B' | concept: 'ride surfboard'
5365 | expected:'A' | got:'A' | concept: 'ride surfboard'
5366 | expected:'C' | got:'C' | concept: 'ride surfboard'
5367 | expected:'D' | got:'D' | concept: 'ride surfboard'
5368 | expected:'C' | got:'C' | concept: 'ride bicycle'
5369 | expected:'C' | got:'C' | concept: 'ride bicycle'
5370 | expected:'D' | got:'D' | concept: 'ride bicycle'
5371 | expected:'B' | got:'B' | concept: 'ride bicycle'
5372 | expected:'D' | got:'D' | concept: 'ride motorcycle'
5373 | expected:'D' | got:'D' | concept: 'ride motorcycle'
5374 | expected:'C' | got:'C' | concept: 'ride motorcycle'
5375 | expected:'C' | got:'C' | concept: 'ride motorcycle'
5376 | expected:'C' | got:'C' | concept: 'squeeze orange'
5377 | expected:'C' | got:'C' | concept: 'squeeze orange'
5378 | expected:'C' | got:'C' | concept: 'squeeze orange'
5379 | expected:'B' | got:'B' | concept: 'squeeze orange'
5380 | expected:'A' | got:'A' | concept: 'hold scissors'
5381 | expected:'A' | got:'A' | concept: 'hold scissors'
5382 | expected:'D' | got:'D' | concept: 'hold scissors'
5383 | expected:'A' | got:'A' | concept: 'hold scissors'
5384 | expected:'B' | got:'B' | concept: 'hold orange'
5385 | expected:'B' | got:'B' | concept: 'hold orange'
5386 | expected:'A' | got:'B' | concept: 'hold orange'
5387 | expected:'A' | got:'D' | concept: 'hold orange'
5388 | expected:'C' | got:'C' | concept: 'hold hot_dog'
5389 | expected:'D' | got:'C' | concept: 'hold hot_dog'
5390 | expected:'C' | got:'C' | concept: 'hold hot_dog'
5391 | expected:'C' | got:'C' | concept: 'hold hot_dog'
5392 | expected:'B' | got:'B' | concept: 'hold skateboard'
5393 | expected:'D' | got:'D' | concept: 'hold skateboard'
5394 | expected:'D' | got:'D' | concept: 'hold skateboard'
5395 | expected:'C' | got:'C' | concept: 'hold skateboard'
5396 | expected:'A' | got:'D' | concept: 'swing tennis_racket'
5397 | expected:'B' | got:'D' | concept: 'swing tennis_racket'
5398 | expected:'D' | got:'D' | concept: 'swing tennis_racket'
5399 | expected:'D' | got:'D' | concept: 'swing tennis_racket'
5400 | expected:'C' | got:'B' | concept: 'hold tennis_racket'
5401 | expected:'C' | got:'C' | concept: 'hold tennis_racket'
5402 | expected:'A' | got:'B' | concept: 'hold tennis_racket'
5403 | expected:'B' | got:'D' | concept: 'hold tennis_racket'
5404 | expected:'C' | got:'C' | concept: 'hold laptop'
5405 | expected:'A' | got:'A' | concept: 'hold laptop'
5406 | expected:'A' | got:'A' | concept: 'hold laptop'
5407 | expected:'C' | got:'C' | concept: 'hold laptop'
5408 | expected:'C' | got:'C' | concept: 'hold scissors'
5409 | expected:'A' | got:'A' | concept: 'hold scissors'
5410 | expected:'A' | got:'A' | concept: 'hold scissors'
5411 | expected:'A' | got:'A' | concept: 'hold scissors'
5412 | expected:'D' | got:'A' | concept: 'hold handbag'
5413 | expected:'B' | got:'B' | concept: 'hold handbag'
5414 | expected:'A' | got:'A' | concept: 'hold handbag'
5415 | expected:'C' | got:'C' | concept: 'hold handbag'
5416 | expected:'A' | got:'A' | concept: 'hold remote'
5417 | expected:'C' | got:'C' | concept: 'hold remote'
5418 | expected:'D' | got:'D' | concept: 'hold remote'
5419 | expected:'C' | got:'C' | concept: 'hold remote'
5420 | expected:'B' | got:'B' | concept: 'hold book'
5421 | expected:'B' | got:'B' | concept: 'hold book'
5422 | expected:'C' | got:'C' | concept: 'hold book'
5423 | expected:'C' | got:'C' | concept: 'hold book'
5424 | expected:'C' | got:'D' | concept: 'kiss horse'
5425 | expected:'B' | got:'B' | concept: 'kiss horse'
5426 | expected:'D' | got:'A' | concept: 'kiss horse'
5427 | expected:'D' | got:'D' | concept: 'kiss horse'
5428 | expected:'B' | got:'C' | concept: 'walk horse'
5429 | expected:'A' | got:'C' | concept: 'walk horse'
5430 | expected:'B' | got:'B' | concept: 'walk horse'
5431 | expected:'B' | got:'B' | concept: 'walk horse'
5432 | expected:'D' | got:'D' | concept: 'walk dog'
5433 | expected:'B' | got:'B' | concept: 'walk dog'
5434 | expected:'B' | got:'B' | concept: 'walk dog'
5435 | expected:'B' | got:'B' | concept: 'walk dog'
5436 | expected:'D' | got:'D' | concept: 'pet horse'
5437 | expected:'D' | got:'D' | concept: 'pet horse'
5438 | expected:'C' | got:'C' | concept: 'pet horse'
5439 | expected:'A' | got:'A' | concept: 'pet horse'
5440 | expected:'A' | got:'A' | concept: 'wash bicycle'
5441 | expected:'B' | got:'B' | concept: 'wash bicycle'
5442 | expected:'A' | got:'B' | concept: 'wash bicycle'
5443 | expected:'D' | got:'A' | concept: 'wash bicycle'
5444 | expected:'B' | got:'B' | concept: 'repair truck'
5445 | expected:'C' | got:'C' | concept: 'repair truck'
5446 | expected:'C' | got:'C' | concept: 'repair truck'
5447 | expected:'C' | got:'C' | concept: 'repair truck'
5448 | expected:'C' | got:'C' | concept: 'repair bicycle'
5449 | expected:'D' | got:'A' | concept: 'repair bicycle'
5450 | expected:'C' | got:'C' | concept: 'repair bicycle'
5451 | expected:'C' | got:'C' | concept: 'repair bicycle'
5452 | expected:'C' | got:'C' | concept: 'ride bicycle'
5453 | expected:'C' | got:'D' | concept: 'ride bicycle'
5454 | expected:'D' | got:'B' | concept: 'ride bicycle'
5455 | expected:'A' | got:'A' | concept: 'ride bicycle'
5456 | expected:'B' | got:'B' | concept: 'hold skateboard'
5457 | expected:'C' | got:'C' | concept: 'hold skateboard'
5458 | expected:'A' | got:'INVALID' | concept: 'hold skateboard'
5459 | expected:'D' | got:'D' | concept: 'hold skateboard'
5460 | expected:'D' | got:'D' | concept: 'jump skateboard'
5461 | expected:'B' | got:'B' | concept: 'jump skateboard'
5462 | expected:'C' | got:'C' | concept: 'jump skateboard'
5463 | expected:'B' | got:'B' | concept: 'jump skateboard'
5464 | expected:'B' | got:'B' | concept: 'sit_on skateboard'
5465 | expected:'B' | got:'B' | concept: 'sit_on skateboard'
5466 | expected:'A' | got:'A' | concept: 'sit_on skateboard'
5467 | expected:'A' | got:'A' | concept: 'sit_on skateboard'
5468 | expected:'A' | got:'A' | concept: 'jump motorcycle'
5469 | expected:'A' | got:'A' | concept: 'jump motorcycle'
5470 | expected:'A' | got:'A' | concept: 'jump motorcycle'
5471 | expected:'B' | got:'B' | concept: 'jump motorcycle'
5472 | expected:'C' | got:'C' | concept: 'repair bicycle'
5473 | expected:'D' | got:'A' | concept: 'repair bicycle'
5474 | expected:'B' | got:'B' | concept: 'repair bicycle'
5475 | expected:'A' | got:'A' | concept: 'repair bicycle'
5476 | expected:'D' | got:'A' | concept: 'load truck'
5477 | expected:'B' | got:'B' | concept: 'load truck'
5478 | expected:'A' | got:'A' | concept: 'load truck'
5479 | expected:'A' | got:'A' | concept: 'load truck'
5480 | expected:'D' | got:'D' | concept: 'repair truck'
5481 | expected:'B' | got:'B' | concept: 'repair truck'
5482 | expected:'D' | got:'D' | concept: 'repair truck'
5483 | expected:'B' | got:'B' | concept: 'repair truck'
5484 | expected:'C' | got:'C' | concept: 'sit_on truck'
5485 | expected:'A' | got:'A' | concept: 'sit_on truck'
5486 | expected:'B' | got:'B' | concept: 'sit_on truck'
5487 | expected:'A' | got:'A' | concept: 'sit_on truck'
5488 | expected:'A' | got:'D' | concept: 'hold knife'
5489 | expected:'D' | got:'B' | concept: 'hold knife'
5490 | expected:'A' | got:'A' | concept: 'hold knife'
5491 | expected:'A' | got:'B' | concept: 'hold knife'
5492 | expected:'A' | got:'C' | concept: 'wield knife'
5493 | expected:'A' | got:'A' | concept: 'wield knife'
5494 | expected:'D' | got:'C' | concept: 'wield knife'
5495 | expected:'C' | got:'B' | concept: 'wield knife'
5496 | expected:'C' | got:'C' | concept: 'hold laptop'
5497 | expected:'C' | got:'C' | concept: 'hold laptop'
5498 | expected:'D' | got:'D' | concept: 'hold laptop'
5499 | expected:'C' | got:'C' | concept: 'hold laptop'
5500 | expected:'B' | got:'B' | concept: 'hold bottle'
5501 | expected:'D' | got:'B' | concept: 'hold bottle'
5502 | expected:'C' | got:'B' | concept: 'hold bottle'
5503 | expected:'A' | got:'A' | concept: 'hold bottle'
5504 | expected:'B' | got:'B' | concept: 'greet person'
5505 | expected:'C' | got:'C' | concept: 'greet person'
5506 | expected:'B' | got:'C' | concept: 'greet person'
5507 | expected:'A' | got:'A' | concept: 'greet person'
5508 | expected:'C' | got:'D' | concept: 'hug person'
5509 | expected:'A' | got:'D' | concept: 'hug person'
5510 | expected:'A' | got:'C' | concept: 'hug person'
5511 | expected:'C' | got:'D' | concept: 'hug person'
5512 | expected:'C' | got:'C' | concept: 'kiss person'
5513 | expected:'A' | got:'A' | concept: 'kiss person'
5514 | expected:'D' | got:'D' | concept: 'kiss person'
5515 | expected:'B' | got:'B' | concept: 'kiss person'
5516 | expected:'C' | got:'C' | concept: 'kiss dog'
5517 | expected:'C' | got:'C' | concept: 'kiss dog'
5518 | expected:'D' | got:'D' | concept: 'kiss dog'
5519 | expected:'B' | got:'B' | concept: 'kiss dog'
5520 | expected:'B' | got:'B' | concept: 'pet dog'
5521 | expected:'B' | got:'B' | concept: 'pet dog'
5522 | expected:'C' | got:'C' | concept: 'pet dog'
5523 | expected:'D' | got:'D' | concept: 'pet dog'
5524 | expected:'A' | got:'A' | concept: 'shear sheep'
5525 | expected:'D' | got:'A' | concept: 'shear sheep'
5526 | expected:'D' | got:'D' | concept: 'shear sheep'
5527 | expected:'A' | got:'A' | concept: 'shear sheep'
5528 | expected:'C' | got:'C' | concept: 'pet horse'
5529 | expected:'A' | got:'A' | concept: 'pet horse'
5530 | expected:'C' | got:'C' | concept: 'pet horse'
5531 | expected:'C' | got:'C' | concept: 'pet horse'
5532 | expected:'C' | got:'C' | concept: 'pet sheep'
5533 | expected:'A' | got:'A' | concept: 'pet sheep'
5534 | expected:'A' | got:'A' | concept: 'pet sheep'
5535 | expected:'B' | got:'D' | concept: 'pet sheep'
5536 | expected:'B' | got:'B' | concept: 'hold wine_glass'
5537 | expected:'B' | got:'B' | concept: 'hold wine_glass'
5538 | expected:'A' | got:'A' | concept: 'hold wine_glass'
5539 | expected:'C' | got:'C' | concept: 'hold wine_glass'
5540 | expected:'C' | got:'C' | concept: 'hold cake'
5541 | expected:'C' | got:'C' | concept: 'hold cake'
5542 | expected:'A' | got:'B' | concept: 'hold cake'
5543 | expected:'D' | got:'C' | concept: 'hold cake'
5544 | expected:'B' | got:'B' | concept: 'hold scissors'
5545 | expected:'A' | got:'A' | concept: 'hold scissors'
5546 | expected:'A' | got:'A' | concept: 'hold scissors'
5547 | expected:'B' | got:'B' | concept: 'hold scissors'
5548 | expected:'C' | got:'INVALID' | concept: 'hold sports_ball'
5549 | expected:'D' | got:'D' | concept: 'hold sports_ball'
5550 | expected:'C' | got:'C' | concept: 'hold sports_ball'
5551 | expected:'D' | got:'D' | concept: 'hold sports_ball'
5552 | expected:'B' | got:'B' | concept: 'hold skateboard'
5553 | expected:'D' | got:'D' | concept: 'hold skateboard'
5554 | expected:'D' | got:'D' | concept: 'hold skateboard'
5555 | expected:'C' | got:'C' | concept: 'hold skateboard'
5556 | expected:'D' | got:'D' | concept: 'hold apple'
5557 | expected:'A' | got:'A' | concept: 'hold apple'
5558 | expected:'C' | got:'C' | concept: 'hold apple'
5559 | expected:'A' | got:'A' | concept: 'hold apple'
5560 | expected:'C' | got:'C' | concept: 'hold orange'
5561 | expected:'B' | got:'B' | concept: 'hold orange'
5562 | expected:'B' | got:'B' | concept: 'hold orange'
5563 | expected:'A' | got:'A' | concept: 'hold orange'
5564 | expected:'A' | got:'A' | concept: 'hold kite'
5565 | expected:'D' | got:'D' | concept: 'hold kite'
5566 | expected:'A' | got:'A' | concept: 'hold kite'
5567 | expected:'B' | got:'B' | concept: 'hold kite'
5568 | expected:'A' | got:'A' | concept: 'hug dog'
5569 | expected:'C' | got:'C' | concept: 'hug dog'
5570 | expected:'B' | got:'B' | concept: 'hug dog'
5571 | expected:'C' | got:'C' | concept: 'hug dog'
5572 | expected:'A' | got:'C' | concept: 'train dog'
5573 | expected:'B' | got:'B' | concept: 'train dog'
5574 | expected:'C' | got:'C' | concept: 'train dog'
5575 | expected:'B' | got:'A' | concept: 'train dog'
5576 | expected:'D' | got:'D' | concept: 'walk dog'
5577 | expected:'A' | got:'A' | concept: 'walk dog'
5578 | expected:'C' | got:'C' | concept: 'walk dog'
5579 | expected:'D' | got:'D' | concept: 'walk dog'
5580 | expected:'C' | got:'C' | concept: 'hug horse'
5581 | expected:'A' | got:'A' | concept: 'hug horse'
5582 | expected:'A' | got:'A' | concept: 'hug horse'
5583 | expected:'A' | got:'A' | concept: 'hug horse'
5584 | expected:'B' | got:'A' | concept: 'watch tv'
5585 | expected:'C' | got:'A' | concept: 'watch tv'
5586 | expected:'C' | got:'C' | concept: 'watch tv'
5587 | expected:'B' | got:'A' | concept: 'watch tv'
5588 | expected:'C' | got:'C' | concept: 'control tv'
5589 | expected:'D' | got:'D' | concept: 'control tv'
5590 | expected:'A' | got:'A' | concept: 'control tv'
5591 | expected:'B' | got:'B' | concept: 'control tv'
5592 | expected:'C' | got:'C' | concept: 'clean keyboard'
5593 | expected:'D' | got:'D' | concept: 'clean keyboard'
5594 | expected:'C' | got:'C' | concept: 'clean keyboard'
5595 | expected:'A' | got:'A' | concept: 'clean keyboard'
5596 | expected:'B' | got:'B' | concept: 'push motorcycle'
5597 | expected:'A' | got:'A' | concept: 'push motorcycle'
5598 | expected:'A' | got:'A' | concept: 'push motorcycle'
5599 | expected:'D' | got:'D' | concept: 'push motorcycle'
5600 | expected:'D' | got:'D' | concept: 'ride skis'
5601 | expected:'D' | got:'D' | concept: 'ride skis'
5602 | expected:'D' | got:'D' | concept: 'ride skis'
5603 | expected:'C' | got:'C' | concept: 'ride skis'
5604 | expected:'B' | got:'B' | concept: 'repair bicycle'
5605 | expected:'B' | got:'B' | concept: 'repair bicycle'
5606 | expected:'C' | got:'C' | concept: 'repair bicycle'
5607 | expected:'A' | got:'A' | concept: 'repair bicycle'
5608 | expected:'B' | got:'B' | concept: 'ride horse'
5609 | expected:'C' | got:'C' | concept: 'ride horse'
5610 | expected:'C' | got:'C' | concept: 'ride horse'
5611 | expected:'B' | got:'B' | concept: 'ride horse'
5612 | expected:'B' | got:'B' | concept: 'ride bicycle'
5613 | expected:'C' | got:'C' | concept: 'ride bicycle'
5614 | expected:'D' | got:'D' | concept: 'ride bicycle'
5615 | expected:'A' | got:'A' | concept: 'ride bicycle'
5616 | expected:'D' | got:'INVALID' | concept: 'eat apple'
5617 | expected:'C' | got:'C' | concept: 'eat apple'
5618 | expected:'C' | got:'C' | concept: 'eat apple'
5619 | expected:'B' | got:'B' | concept: 'eat apple'
5620 | expected:'A' | got:'A' | concept: 'eat sandwich'
5621 | expected:'B' | got:'B' | concept: 'eat sandwich'
5622 | expected:'D' | got:'D' | concept: 'eat sandwich'
5623 | expected:'D' | got:'D' | concept: 'eat sandwich'
5624 | expected:'C' | got:'C' | concept: 'eat pizza'
5625 | expected:'B' | got:'B' | concept: 'eat pizza'
5626 | expected:'D' | got:'B' | concept: 'eat pizza'
5627 | expected:'A' | got:'B' | concept: 'eat pizza'
5628 | expected:'A' | got:'A' | concept: 'hold sandwich'
5629 | expected:'D' | got:'B' | concept: 'hold sandwich'
5630 | expected:'B' | got:'D' | concept: 'hold sandwich'
5631 | expected:'C' | got:'C' | concept: 'hold sandwich'
5632 | expected:'B' | got:'B' | concept: 'jump snowboard'
5633 | expected:'A' | got:'A' | concept: 'jump snowboard'
5634 | expected:'B' | got:'B' | concept: 'jump snowboard'
5635 | expected:'C' | got:'C' | concept: 'jump snowboard'
5636 | expected:'A' | got:'A' | concept: 'jump horse'
5637 | expected:'A' | got:'A' | concept: 'jump horse'
5638 | expected:'D' | got:'D' | concept: 'jump horse'
5639 | expected:'A' | got:'A' | concept: 'jump horse'
5640 | expected:'C' | got:'C' | concept: 'jump skateboard'
5641 | expected:'B' | got:'B' | concept: 'jump skateboard'
5642 | expected:'A' | got:'A' | concept: 'jump skateboard'
5643 | expected:'B' | got:'B' | concept: 'jump skateboard'
5644 | expected:'C' | got:'C' | concept: 'sit_on skateboard'
5645 | expected:'A' | got:'A' | concept: 'sit_on skateboard'
5646 | expected:'D' | got:'D' | concept: 'sit_on skateboard'
5647 | expected:'B' | got:'B' | concept: 'sit_on skateboard'
5648 | expected:'D' | got:'D' | concept: 'hold cup'
5649 | expected:'A' | got:'A' | concept: 'hold cup'
5650 | expected:'D' | got:'C' | concept: 'hold cup'
5651 | expected:'C' | got:'C' | concept: 'hold cup'
5652 | expected:'B' | got:'B' | concept: 'hold kite'
5653 | expected:'C' | got:'C' | concept: 'hold kite'
5654 | expected:'D' | got:'D' | concept: 'hold kite'
5655 | expected:'D' | got:'D' | concept: 'hold kite'
5656 | expected:'D' | got:'D' | concept: 'hold spoon'
5657 | expected:'D' | got:'D' | concept: 'hold spoon'
5658 | expected:'A' | got:'A' | concept: 'hold spoon'
5659 | expected:'B' | got:'B' | concept: 'hold spoon'
5660 | expected:'C' | got:'C' | concept: 'hold mouse'
5661 | expected:'B' | got:'B' | concept: 'hold mouse'
5662 | expected:'D' | got:'D' | concept: 'hold mouse'
5663 | expected:'B' | got:'C' | concept: 'hold mouse'
5664 | expected:'D' | got:'D' | concept: 'hold dog'
5665 | expected:'B' | got:'B' | concept: 'hold dog'
5666 | expected:'D' | got:'D' | concept: 'hold dog'
5667 | expected:'A' | got:'D' | concept: 'hold dog'
5668 | expected:'A' | got:'A' | concept: 'walk dog'
5669 | expected:'B' | got:'B' | concept: 'walk dog'
5670 | expected:'A' | got:'A' | concept: 'walk dog'
5671 | expected:'A' | got:'C' | concept: 'walk dog'
5672 | expected:'A' | got:'A' | concept: 'kiss dog'
5673 | expected:'B' | got:'B' | concept: 'kiss dog'
5674 | expected:'D' | got:'D' | concept: 'kiss dog'
5675 | expected:'D' | got:'D' | concept: 'kiss dog'
5676 | expected:'D' | got:'D' | concept: 'pet dog'
5677 | expected:'C' | got:'C' | concept: 'pet dog'
5678 | expected:'D' | got:'D' | concept: 'pet dog'
5679 | expected:'B' | got:'B' | concept: 'pet dog'
5680 | expected:'D' | got:'D' | concept: 'ride bicycle'
5681 | expected:'B' | got:'B' | concept: 'ride bicycle'
5682 | expected:'A' | got:'A' | concept: 'ride bicycle'
5683 | expected:'D' | got:'D' | concept: 'ride bicycle'
5684 | expected:'C' | got:'C' | concept: 'ride skateboard'
5685 | expected:'C' | got:'C' | concept: 'ride skateboard'
5686 | expected:'C' | got:'C' | concept: 'ride skateboard'
5687 | expected:'A' | got:'A' | concept: 'ride skateboard'
5688 | expected:'A' | got:'A' | concept: 'ride motorcycle'
5689 | expected:'D' | got:'D' | concept: 'ride motorcycle'
5690 | expected:'D' | got:'D' | concept: 'ride motorcycle'
5691 | expected:'B' | got:'B' | concept: 'ride motorcycle'
5692 | expected:'D' | got:'D' | concept: 'ride elephant'
5693 | expected:'C' | got:'C' | concept: 'ride elephant'
5694 | expected:'A' | got:'A' | concept: 'ride elephant'
5695 | expected:'A' | got:'A' | concept: 'ride elephant'
5696 | expected:'D' | got:'A' | concept: 'hold sandwich'
5697 | expected:'C' | got:'C' | concept: 'hold sandwich'
5698 | expected:'B' | got:'B' | concept: 'hold sandwich'
5699 | expected:'A' | got:'A' | concept: 'hold sandwich'
5700 | expected:'B' | got:'B' | concept: 'hold book'
5701 | expected:'C' | got:'C' | concept: 'hold book'
5702 | expected:'B' | got:'B' | concept: 'hold book'
5703 | expected:'D' | got:'D' | concept: 'hold book'
5704 | expected:'B' | got:'B' | concept: 'hold dog'
5705 | expected:'C' | got:'C' | concept: 'hold dog'
5706 | expected:'A' | got:'A' | concept: 'hold dog'
5707 | expected:'A' | got:'A' | concept: 'hold dog'
5708 | expected:'A' | got:'A' | concept: 'hold skateboard'
5709 | expected:'D' | got:'A' | concept: 'hold skateboard'
5710 | expected:'C' | got:'C' | concept: 'hold skateboard'
5711 | expected:'B' | got:'B' | concept: 'hold skateboard'
5712 | expected:'D' | got:'C' | concept: 'hold cell_phone'
5713 | expected:'D' | got:'C' | concept: 'hold cell_phone'
5714 | expected:'B' | got:'B' | concept: 'hold cell_phone'
5715 | expected:'C' | got:'B' | concept: 'hold cell_phone'
5716 | expected:'B' | got:'B' | concept: 'hold remote'
5717 | expected:'A' | got:'A' | concept: 'hold remote'
5718 | expected:'A' | got:'A' | concept: 'hold remote'
5719 | expected:'B' | got:'B' | concept: 'hold remote'
5720 | expected:'C' | got:'C' | concept: 'hold wine_glass'
5721 | expected:'A' | got:'A' | concept: 'hold wine_glass'
5722 | expected:'D' | got:'A' | concept: 'hold wine_glass'
5723 | expected:'A' | got:'A' | concept: 'hold wine_glass'
5724 | expected:'D' | got:'C' | concept: 'point_at_camera remote'
5725 | expected:'A' | got:'C' | concept: 'point_at_camera remote'
5726 | expected:'D' | got:'D' | concept: 'point_at_camera remote'
5727 | expected:'D' | got:'A' | concept: 'point_at_camera remote'
5728 | expected:'A' | got:'A' | concept: 'ride motorcycle'
5729 | expected:'C' | got:'C' | concept: 'ride motorcycle'
5730 | expected:'D' | got:'D' | concept: 'ride motorcycle'
5731 | expected:'C' | got:'C' | concept: 'ride motorcycle'
5732 | expected:'A' | got:'A' | concept: 'ride bicycle'
5733 | expected:'A' | got:'A' | concept: 'ride bicycle'
5734 | expected:'D' | got:'D' | concept: 'ride bicycle'
5735 | expected:'B' | got:'B' | concept: 'ride bicycle'
5736 | expected:'D' | got:'D' | concept: 'ride surfboard'
5737 | expected:'C' | got:'C' | concept: 'ride surfboard'
5738 | expected:'C' | got:'C' | concept: 'ride surfboard'
5739 | expected:'C' | got:'C' | concept: 'ride surfboard'
5740 | expected:'C' | got:'C' | concept: 'ride skis'
5741 | expected:'A' | got:'A' | concept: 'ride skis'
5742 | expected:'D' | got:'D' | concept: 'ride skis'
5743 | expected:'A' | got:'A' | concept: 'ride skis'
5744 | expected:'A' | got:'A' | concept: 'hold remote'
5745 | expected:'A' | got:'A' | concept: 'hold remote'
5746 | expected:'D' | got:'D' | concept: 'hold remote'
5747 | expected:'B' | got:'B' | concept: 'hold remote'
5748 | expected:'B' | got:'A' | concept: 'hold book'
5749 | expected:'D' | got:'D' | concept: 'hold book'
5750 | expected:'C' | got:'C' | concept: 'hold book'
5751 | expected:'C' | got:'C' | concept: 'hold book'
5752 | expected:'D' | got:'C' | concept: 'hold laptop'
5753 | expected:'B' | got:'B' | concept: 'hold laptop'
5754 | expected:'C' | got:'C' | concept: 'hold laptop'
5755 | expected:'D' | got:'D' | concept: 'hold laptop'
5756 | expected:'D' | got:'D' | concept: 'hold sports_ball'
5757 | expected:'C' | got:'C' | concept: 'hold sports_ball'
5758 | expected:'C' | got:'D' | concept: 'hold sports_ball'
5759 | expected:'A' | got:'A' | concept: 'hold sports_ball'
5760 | expected:'B' | got:'B' | concept: 'hold knife'
5761 | expected:'D' | got:'D' | concept: 'hold knife'
5762 | expected:'A' | got:'C' | concept: 'hold knife'
5763 | expected:'C' | got:'D' | concept: 'hold knife'
5764 | expected:'B' | got:'D' | concept: 'lick knife'
5765 | expected:'C' | got:'C' | concept: 'lick knife'
5766 | expected:'A' | got:'D' | concept: 'lick knife'
5767 | expected:'A' | got:'C' | concept: 'lick knife'
5768 | expected:'C' | got:'A' | concept: 'wield knife'
5769 | expected:'A' | got:'A' | concept: 'wield knife'
5770 | expected:'D' | got:'D' | concept: 'wield knife'
5771 | expected:'A' | got:'C' | concept: 'wield knife'
5772 | expected:'C' | got:'C' | concept: 'cut_with knife'
5773 | expected:'A' | got:'A' | concept: 'cut_with knife'
5774 | expected:'B' | got:'B' | concept: 'cut_with knife'
5775 | expected:'B' | got:'A' | concept: 'cut_with knife'
5776 | expected:'C' | got:'C' | concept: 'feed horse'
5777 | expected:'A' | got:'A' | concept: 'feed horse'
5778 | expected:'B' | got:'B' | concept: 'feed horse'
5779 | expected:'C' | got:'C' | concept: 'feed horse'
5780 | expected:'D' | got:'D' | concept: 'jump horse'
5781 | expected:'A' | got:'A' | concept: 'jump horse'
5782 | expected:'B' | got:'B' | concept: 'jump horse'
5783 | expected:'C' | got:'D' | concept: 'jump horse'
5784 | expected:'D' | got:'D' | concept: 'hug horse'
5785 | expected:'C' | got:'D' | concept: 'hug horse'
5786 | expected:'C' | got:'C' | concept: 'hug horse'
5787 | expected:'D' | got:'A' | concept: 'hug horse'
5788 | expected:'B' | got:'B' | concept: 'ride horse'
5789 | expected:'C' | got:'C' | concept: 'ride horse'
5790 | expected:'D' | got:'D' | concept: 'ride horse'
5791 | expected:'A' | got:'A' | concept: 'ride horse'
5792 | expected:'A' | got:'C' | concept: 'hold cake'
5793 | expected:'D' | got:'A' | concept: 'hold cake'
5794 | expected:'B' | got:'B' | concept: 'hold cake'
5795 | expected:'B' | got:'C' | concept: 'hold cake'
5796 | expected:'B' | got:'B' | concept: 'cut pizza'
5797 | expected:'D' | got:'D' | concept: 'cut pizza'
5798 | expected:'D' | got:'D' | concept: 'cut pizza'
5799 | expected:'B' | got:'B' | concept: 'cut pizza'
5800 | expected:'D' | got:'C' | concept: 'hold orange'
5801 | expected:'A' | got:'A' | concept: 'hold orange'
5802 | expected:'C' | got:'C' | concept: 'hold orange'
5803 | expected:'D' | got:'A' | concept: 'hold orange'
5804 | expected:'B' | got:'B' | concept: 'cut cake'
5805 | expected:'A' | got:'A' | concept: 'cut cake'
5806 | expected:'B' | got:'B' | concept: 'cut cake'
5807 | expected:'C' | got:'C' | concept: 'cut cake'
5808 | expected:'C' | got:'C' | concept: 'hold bottle'
5809 | expected:'C' | got:'C' | concept: 'hold bottle'
5810 | expected:'D' | got:'B' | concept: 'hold bottle'
5811 | expected:'B' | got:'C' | concept: 'hold bottle'
5812 | expected:'C' | got:'A' | concept: 'hold orange'
5813 | expected:'A' | got:'C' | concept: 'hold orange'
5814 | expected:'A' | got:'A' | concept: 'hold orange'
5815 | expected:'C' | got:'C' | concept: 'hold orange'
5816 | expected:'B' | got:'B' | concept: 'hold cup'
5817 | expected:'C' | got:'D' | concept: 'hold cup'
5818 | expected:'C' | got:'C' | concept: 'hold cup'
5819 | expected:'A' | got:'A' | concept: 'hold cup'
5820 | expected:'B' | got:'B' | concept: 'hold remote'
5821 | expected:'A' | got:'A' | concept: 'hold remote'
5822 | expected:'B' | got:'B' | concept: 'hold remote'
5823 | expected:'B' | got:'B' | concept: 'hold remote'
5824 | expected:'D' | got:'D' | concept: 'jump horse'
5825 | expected:'A' | got:'A' | concept: 'jump horse'
5826 | expected:'D' | got:'D' | concept: 'jump horse'
5827 | expected:'B' | got:'B' | concept: 'jump horse'
5828 | expected:'D' | got:'D' | concept: 'direct airplane'
5829 | expected:'B' | got:'B' | concept: 'direct airplane'
5830 | expected:'A' | got:'A' | concept: 'direct airplane'
5831 | expected:'B' | got:'B' | concept: 'direct airplane'
5832 | expected:'A' | got:'A' | concept: 'wield knife'
5833 | expected:'C' | got:'C' | concept: 'wield knife'
5834 | expected:'C' | got:'C' | concept: 'wield knife'
5835 | expected:'C' | got:'C' | concept: 'wield knife'
5836 | expected:'D' | got:'D' | concept: 'sit_on chair'
5837 | expected:'B' | got:'B' | concept: 'sit_on chair'
5838 | expected:'A' | got:'A' | concept: 'sit_on chair'
5839 | expected:'D' | got:'D' | concept: 'sit_on chair'
5840 | expected:'A' | got:'A' | concept: 'ride skateboard'
5841 | expected:'B' | got:'B' | concept: 'ride skateboard'
5842 | expected:'A' | got:'A' | concept: 'ride skateboard'
5843 | expected:'D' | got:'D' | concept: 'ride skateboard'
5844 | expected:'A' | got:'A' | concept: 'ride surfboard'
5845 | expected:'C' | got:'C' | concept: 'ride surfboard'
5846 | expected:'B' | got:'B' | concept: 'ride surfboard'
5847 | expected:'B' | got:'B' | concept: 'ride surfboard'
5848 | expected:'C' | got:'C' | concept: 'carry surfboard'
5849 | expected:'A' | got:'A' | concept: 'carry surfboard'
5850 | expected:'A' | got:'A' | concept: 'carry surfboard'
5851 | expected:'A' | got:'A' | concept: 'carry surfboard'
5852 | expected:'A' | got:'A' | concept: 'carry suitcase'
5853 | expected:'A' | got:'A' | concept: 'carry suitcase'
5854 | expected:'C' | got:'C' | concept: 'carry suitcase'
5855 | expected:'D' | got:'D' | concept: 'carry suitcase'
5856 | expected:'A' | got:'A' | concept: 'eat banana'
5857 | expected:'B' | got:'B' | concept: 'eat banana'
5858 | expected:'C' | got:'C' | concept: 'eat banana'
5859 | expected:'D' | got:'D' | concept: 'eat banana'
5860 | expected:'A' | got:'A' | concept: 'eat pizza'
5861 | expected:'A' | got:'A' | concept: 'eat pizza'
5862 | expected:'C' | got:'C' | concept: 'eat pizza'
5863 | expected:'D' | got:'D' | concept: 'eat pizza'
5864 | expected:'A' | got:'D' | concept: 'cut pizza'
5865 | expected:'A' | got:'C' | concept: 'cut pizza'
5866 | expected:'C' | got:'C' | concept: 'cut pizza'
5867 | expected:'D' | got:'D' | concept: 'cut pizza'
5868 | expected:'A' | got:'A' | concept: 'eat donut'
5869 | expected:'C' | got:'C' | concept: 'eat donut'
5870 | expected:'B' | got:'B' | concept: 'eat donut'
5871 | expected:'A' | got:'A' | concept: 'eat donut'
5872 | expected:'A' | got:'A' | concept: 'hug horse'
5873 | expected:'A' | got:'A' | concept: 'hug horse'
5874 | expected:'C' | got:'C' | concept: 'hug horse'
5875 | expected:'A' | got:'A' | concept: 'hug horse'
5876 | expected:'C' | got:'C' | concept: 'kiss horse'
5877 | expected:'D' | got:'D' | concept: 'kiss horse'
5878 | expected:'C' | got:'C' | concept: 'kiss horse'
5879 | expected:'C' | got:'C' | concept: 'kiss horse'
5880 | expected:'B' | got:'B' | concept: 'walk horse'
5881 | expected:'B' | got:'B' | concept: 'walk horse'
5882 | expected:'C' | got:'C' | concept: 'walk horse'
5883 | expected:'D' | got:'D' | concept: 'walk horse'
5884 | expected:'A' | got:'A' | concept: 'walk dog'
5885 | expected:'A' | got:'A' | concept: 'walk dog'
5886 | expected:'A' | got:'A' | concept: 'walk dog'
5887 | expected:'A' | got:'A' | concept: 'walk dog'
5888 | expected:'B' | got:'B' | concept: 'hug person'
5889 | expected:'A' | got:'B' | concept: 'hug person'
5890 | expected:'C' | got:'C' | concept: 'hug person'
5891 | expected:'C' | got:'C' | concept: 'hug person'
5892 | expected:'C' | got:'C' | concept: 'kiss person'
5893 | expected:'A' | got:'A' | concept: 'kiss person'
5894 | expected:'B' | got:'B' | concept: 'kiss person'
5895 | expected:'C' | got:'C' | concept: 'kiss person'
5896 | expected:'D' | got:'D' | concept: 'greet person'
5897 | expected:'C' | got:'C' | concept: 'greet person'
5898 | expected:'D' | got:'D' | concept: 'greet person'
5899 | expected:'A' | got:'A' | concept: 'greet person'
5900 | expected:'C' | got:'C' | concept: 'kiss horse'
5901 | expected:'C' | got:'C' | concept: 'kiss horse'
5902 | expected:'C' | got:'C' | concept: 'kiss horse'
5903 | expected:'C' | got:'C' | concept: 'kiss horse'
5904 | expected:'D' | got:'D' | concept: 'clean oven'
5905 | expected:'A' | got:'A' | concept: 'clean oven'
5906 | expected:'B' | got:'B' | concept: 'clean oven'
5907 | expected:'D' | got:'D' | concept: 'clean oven'
5908 | expected:'C' | got:'A' | concept: 'clean microwave'
5909 | expected:'A' | got:'B' | concept: 'clean microwave'
5910 | expected:'A' | got:'A' | concept: 'clean microwave'
5911 | expected:'B' | got:'B' | concept: 'clean microwave'
5912 | expected:'B' | got:'B' | concept: 'operate microwave'
5913 | expected:'B' | got:'A' | concept: 'operate microwave'
5914 | expected:'B' | got:'A' | concept: 'operate microwave'
5915 | expected:'C' | got:'C' | concept: 'operate microwave'
5916 | expected:'D' | got:'A' | concept: 'open microwave'
5917 | expected:'C' | got:'C' | concept: 'open microwave'
5918 | expected:'A' | got:'A' | concept: 'open microwave'
5919 | expected:'B' | got:'D' | concept: 'open microwave'
5920 | expected:'A' | got:'A' | concept: 'hold sports_ball'
5921 | expected:'A' | got:'A' | concept: 'hold sports_ball'
5922 | expected:'A' | got:'A' | concept: 'hold sports_ball'
5923 | expected:'B' | got:'B' | concept: 'hold sports_ball'
5924 | expected:'D' | got:'D' | concept: 'hold remote'
5925 | expected:'C' | got:'C' | concept: 'hold remote'
5926 | expected:'A' | got:'A' | concept: 'hold remote'
5927 | expected:'C' | got:'C' | concept: 'hold remote'
5928 | expected:'A' | got:'A' | concept: 'hold dog'
5929 | expected:'C' | got:'C' | concept: 'hold dog'
5930 | expected:'A' | got:'A' | concept: 'hold dog'
5931 | expected:'D' | got:'D' | concept: 'hold dog'
5932 | expected:'D' | got:'D' | concept: 'hold spoon'
5933 | expected:'B' | got:'B' | concept: 'hold spoon'
5934 | expected:'D' | got:'D' | concept: 'hold spoon'
5935 | expected:'C' | got:'A' | concept: 'hold spoon'
5936 | expected:'C' | got:'B' | concept: 'hold handbag'
5937 | expected:'A' | got:'A' | concept: 'hold handbag'
5938 | expected:'C' | got:'C' | concept: 'hold handbag'
5939 | expected:'D' | got:'A' | concept: 'hold handbag'
5940 | expected:'B' | got:'B' | concept: 'hold apple'
5941 | expected:'D' | got:'A' | concept: 'hold apple'
5942 | expected:'D' | got:'D' | concept: 'hold apple'
5943 | expected:'B' | got:'B' | concept: 'hold apple'
5944 | expected:'D' | got:'A' | concept: 'hold laptop'
5945 | expected:'C' | got:'C' | concept: 'hold laptop'
5946 | expected:'A' | got:'A' | concept: 'hold laptop'
5947 | expected:'D' | got:'D' | concept: 'hold laptop'
5948 | expected:'C' | got:'C' | concept: 'hold book'
5949 | expected:'C' | got:'C' | concept: 'hold book'
5950 | expected:'A' | got:'A' | concept: 'hold book'
5951 | expected:'B' | got:'B' | concept: 'hold book'
5952 | expected:'B' | got:'B' | concept: 'hold mouse'
5953 | expected:'C' | got:'C' | concept: 'hold mouse'
5954 | expected:'B' | got:'B' | concept: 'hold mouse'
5955 | expected:'C' | got:'C' | concept: 'hold mouse'
5956 | expected:'A' | got:'C' | concept: 'hold cake'
5957 | expected:'D' | got:'D' | concept: 'hold cake'
5958 | expected:'B' | got:'B' | concept: 'hold cake'
5959 | expected:'B' | got:'D' | concept: 'hold cake'
5960 | expected:'D' | got:'D' | concept: 'hold scissors'
5961 | expected:'C' | got:'INVALID' | concept: 'hold scissors'
5962 | expected:'C' | got:'C' | concept: 'hold scissors'
5963 | expected:'A' | got:'A' | concept: 'hold scissors'
5964 | expected:'D' | got:'D' | concept: 'hold skateboard'
5965 | expected:'C' | got:'C' | concept: 'hold skateboard'
5966 | expected:'C' | got:'C' | concept: 'hold skateboard'
5967 | expected:'D' | got:'D' | concept: 'hold skateboard'
5968 | expected:'D' | got:'C' | concept: 'hold cup'
5969 | expected:'B' | got:'B' | concept: 'hold cup'
5970 | expected:'A' | got:'A' | concept: 'hold cup'
5971 | expected:'D' | got:'D' | concept: 'hold cup'
5972 | expected:'D' | got:'D' | concept: 'hold skateboard'
5973 | expected:'A' | got:'A' | concept: 'hold skateboard'
5974 | expected:'A' | got:'A' | concept: 'hold skateboard'
5975 | expected:'A' | got:'A' | concept: 'hold skateboard'
5976 | expected:'D' | got:'D' | concept: 'hold dog'
5977 | expected:'C' | got:'C' | concept: 'hold dog'
5978 | expected:'B' | got:'B' | concept: 'hold dog'
5979 | expected:'C' | got:'C' | concept: 'hold dog'
5980 | expected:'B' | got:'A' | concept: 'hold sports_ball'
5981 | expected:'D' | got:'D' | concept: 'hold sports_ball'
5982 | expected:'C' | got:'C' | concept: 'hold sports_ball'
5983 | expected:'A' | got:'A' | concept: 'hold sports_ball'
5984 | expected:'B' | got:'D' | concept: 'sit_on skateboard'
5985 | expected:'B' | got:'C' | concept: 'sit_on skateboard'
5986 | expected:'B' | got:'B' | concept: 'sit_on skateboard'
5987 | expected:'A' | got:'D' | concept: 'sit_on skateboard'
5988 | expected:'D' | got:'C' | concept: 'jump snowboard'
5989 | expected:'B' | got:'B' | concept: 'jump snowboard'
5990 | expected:'A' | got:'A' | concept: 'jump snowboard'
5991 | expected:'D' | got:'C' | concept: 'jump snowboard'
5992 | expected:'A' | got:'A' | concept: 'jump skateboard'
5993 | expected:'C' | got:'C' | concept: 'jump skateboard'
5994 | expected:'D' | got:'D' | concept: 'jump skateboard'
5995 | expected:'A' | got:'A' | concept: 'jump skateboard'
5996 | expected:'A' | got:'A' | concept: 'hold skateboard'
5997 | expected:'C' | got:'C' | concept: 'hold skateboard'
5998 | expected:'A' | got:'A' | concept: 'hold skateboard'
5999 | expected:'B' | got:'B' | concept: 'hold skateboard'
6000 | expected:'A' | got:'A' | concept: 'sit_on bed'
6001 | expected:'B' | got:'B' | concept: 'sit_on bed'
6002 | expected:'D' | got:'D' | concept: 'sit_on bed'
6003 | expected:'A' | got:'A' | concept: 'sit_on bed'
6004 | expected:'D' | got:'D' | concept: 'sit_on chair'
6005 | expected:'C' | got:'C' | concept: 'sit_on chair'
6006 | expected:'B' | got:'B' | concept: 'sit_on chair'
6007 | expected:'D' | got:'D' | concept: 'sit_on chair'
6008 | expected:'B' | got:'B' | concept: 'sit_on couch'
6009 | expected:'B' | got:'D' | concept: 'sit_on couch'
6010 | expected:'A' | got:'A' | concept: 'sit_on couch'
6011 | expected:'D' | got:'D' | concept: 'sit_on couch'
6012 | expected:'D' | got:'D' | concept: 'sit_on truck'
6013 | expected:'C' | got:'C' | concept: 'sit_on truck'
6014 | expected:'A' | got:'A' | concept: 'sit_on truck'
6015 | expected:'A' | got:'A' | concept: 'sit_on truck'
6016 | expected:'B' | got:'B' | concept: 'ride surfboard'
6017 | expected:'B' | got:'B' | concept: 'ride surfboard'
6018 | expected:'B' | got:'B' | concept: 'ride surfboard'
6019 | expected:'D' | got:'D' | concept: 'ride surfboard'
6020 | expected:'A' | got:'A' | concept: 'ride horse'
6021 | expected:'C' | got:'C' | concept: 'ride horse'
6022 | expected:'D' | got:'D' | concept: 'ride horse'
6023 | expected:'B' | got:'B' | concept: 'ride horse'
6024 | expected:'C' | got:'C' | concept: 'ride skateboard'
6025 | expected:'C' | got:'C' | concept: 'ride skateboard'
6026 | expected:'A' | got:'A' | concept: 'ride skateboard'
6027 | expected:'A' | got:'A' | concept: 'ride skateboard'
6028 | expected:'C' | got:'C' | concept: 'sit_on skateboard'
6029 | expected:'D' | got:'B' | concept: 'sit_on skateboard'
6030 | expected:'D' | got:'D' | concept: 'sit_on skateboard'
6031 | expected:'D' | got:'D' | concept: 'sit_on skateboard'
6032 | expected:'D' | got:'D' | concept: 'straddle motorcycle'
6033 | expected:'C' | got:'C' | concept: 'straddle motorcycle'
6034 | expected:'C' | got:'C' | concept: 'straddle motorcycle'
6035 | expected:'A' | got:'A' | concept: 'straddle motorcycle'
6036 | expected:'B' | got:'B' | concept: 'wash car'
6037 | expected:'A' | got:'A' | concept: 'wash car'
6038 | expected:'A' | got:'A' | concept: 'wash car'
6039 | expected:'C' | got:'A' | concept: 'wash car'
6040 | expected:'D' | got:'D' | concept: 'push motorcycle'
6041 | expected:'A' | got:'A' | concept: 'push motorcycle'
6042 | expected:'B' | got:'B' | concept: 'push motorcycle'
6043 | expected:'B' | got:'B' | concept: 'push motorcycle'
6044 | expected:'D' | got:'B' | concept: 'wash motorcycle'
6045 | expected:'C' | got:'C' | concept: 'wash motorcycle'
6046 | expected:'D' | got:'D' | concept: 'wash motorcycle'
6047 | expected:'D' | got:'D' | concept: 'wash motorcycle'
6048 | expected:'A' | got:'C' | concept: 'type_on laptop'
6049 | expected:'B' | got:'A' | concept: 'type_on laptop'
6050 | expected:'B' | got:'B' | concept: 'type_on laptop'
6051 | expected:'D' | got:'B' | concept: 'type_on laptop'
6052 | expected:'D' | got:'A' | concept: 'type_on keyboard'
6053 | expected:'C' | got:'C' | concept: 'type_on keyboard'
6054 | expected:'B' | got:'B' | concept: 'type_on keyboard'
6055 | expected:'C' | got:'C' | concept: 'type_on keyboard'
6056 | expected:'C' | got:'C' | concept: 'read laptop'
6057 | expected:'B' | got:'B' | concept: 'read laptop'
6058 | expected:'A' | got:'C' | concept: 'read laptop'
6059 | expected:'A' | got:'B' | concept: 'read laptop'
6060 | expected:'D' | got:'A' | concept: 'hold laptop'
6061 | expected:'C' | got:'B' | concept: 'hold laptop'
6062 | expected:'B' | got:'A' | concept: 'hold laptop'
6063 | expected:'A' | got:'C' | concept: 'hold laptop'
6064 | expected:'C' | got:'C' | concept: 'repair truck'
6065 | expected:'B' | got:'B' | concept: 'repair truck'
6066 | expected:'D' | got:'D' | concept: 'repair truck'
6067 | expected:'A' | got:'A' | concept: 'repair truck'
6068 | expected:'D' | got:'D' | concept: 'load truck'
6069 | expected:'D' | got:'D' | concept: 'load truck'
6070 | expected:'B' | got:'A' | concept: 'load truck'
6071 | expected:'A' | got:'A' | concept: 'load truck'
6072 | expected:'A' | got:'A' | concept: 'sit_on truck'
6073 | expected:'D' | got:'D' | concept: 'sit_on truck'
6074 | expected:'B' | got:'B' | concept: 'sit_on truck'
6075 | expected:'A' | got:'A' | concept: 'sit_on truck'
6076 | expected:'D' | got:'A' | concept: 'repair bicycle'
6077 | expected:'D' | got:'A' | concept: 'repair bicycle'
6078 | expected:'B' | got:'B' | concept: 'repair bicycle'
6079 | expected:'A' | got:'A' | concept: 'repair bicycle'
6080 | expected:'D' | got:'D' | concept: 'hold laptop'
6081 | expected:'D' | got:'B' | concept: 'hold laptop'
6082 | expected:'D' | got:'D' | concept: 'hold laptop'
6083 | expected:'C' | got:'C' | concept: 'hold laptop'
6084 | expected:'C' | got:'C' | concept: 'hold wine_glass'
6085 | expected:'A' | got:'A' | concept: 'hold wine_glass'
6086 | expected:'B' | got:'B' | concept: 'hold wine_glass'
6087 | expected:'C' | got:'C' | concept: 'hold wine_glass'
6088 | expected:'A' | got:'A' | concept: 'hold banana'
6089 | expected:'D' | got:'A' | concept: 'hold banana'
6090 | expected:'C' | got:'C' | concept: 'hold banana'
6091 | expected:'C' | got:'A' | concept: 'hold banana'
6092 | expected:'B' | got:'B' | concept: 'hold book'
6093 | expected:'D' | got:'B' | concept: 'hold book'
6094 | expected:'B' | got:'B' | concept: 'hold book'
6095 | expected:'D' | got:'D' | concept: 'hold book'
6096 | expected:'D' | got:'D' | concept: 'ride surfboard'
6097 | expected:'C' | got:'C' | concept: 'ride surfboard'
6098 | expected:'D' | got:'D' | concept: 'ride surfboard'
6099 | expected:'B' | got:'B' | concept: 'ride surfboard'
6100 | expected:'C' | got:'C' | concept: 'ride skateboard'
6101 | expected:'B' | got:'B' | concept: 'ride skateboard'
6102 | expected:'D' | got:'D' | concept: 'ride skateboard'
6103 | expected:'B' | got:'B' | concept: 'ride skateboard'
6104 | expected:'A' | got:'A' | concept: 'ride horse'
6105 | expected:'B' | got:'B' | concept: 'ride horse'
6106 | expected:'D' | got:'D' | concept: 'ride horse'
6107 | expected:'A' | got:'A' | concept: 'ride horse'
6108 | expected:'B' | got:'B' | concept: 'ride elephant'
6109 | expected:'B' | got:'B' | concept: 'ride elephant'
6110 | expected:'B' | got:'B' | concept: 'ride elephant'
6111 | expected:'C' | got:'C' | concept: 'ride elephant'
6112 | expected:'B' | got:'B' | concept: 'clean refrigerator'
6113 | expected:'C' | got:'C' | concept: 'clean refrigerator'
6114 | expected:'D' | got:'D' | concept: 'clean refrigerator'
6115 | expected:'C' | got:'C' | concept: 'clean refrigerator'
6116 | expected:'D' | got:'C' | concept: 'clean microwave'
6117 | expected:'D' | got:'A' | concept: 'clean microwave'
6118 | expected:'C' | got:'D' | concept: 'clean microwave'
6119 | expected:'D' | got:'B' | concept: 'clean microwave'
6120 | expected:'B' | got:'C' | concept: 'operate microwave'
6121 | expected:'D' | got:'A' | concept: 'operate microwave'
6122 | expected:'D' | got:'A' | concept: 'operate microwave'
6123 | expected:'A' | got:'A' | concept: 'operate microwave'
6124 | expected:'D' | got:'D' | concept: 'open microwave'
6125 | expected:'B' | got:'B' | concept: 'open microwave'
6126 | expected:'B' | got:'B' | concept: 'open microwave'
6127 | expected:'D' | got:'B' | concept: 'open microwave'
6128 | expected:'B' | got:'B' | concept: 'hold apple'
6129 | expected:'C' | got:'C' | concept: 'hold apple'
6130 | expected:'D' | got:'D' | concept: 'hold apple'
6131 | expected:'B' | got:'B' | concept: 'hold apple'
6132 | expected:'C' | got:'C' | concept: 'hold sports_ball'
6133 | expected:'B' | got:'B' | concept: 'hold sports_ball'
6134 | expected:'A' | got:'INVALID' | concept: 'hold sports_ball'
6135 | expected:'D' | got:'D' | concept: 'hold sports_ball'
6136 | expected:'B' | got:'B' | concept: 'hold toothbrush'
6137 | expected:'D' | got:'D' | concept: 'hold toothbrush'
6138 | expected:'A' | got:'A' | concept: 'hold toothbrush'
6139 | expected:'C' | got:'C' | concept: 'hold toothbrush'
6140 | expected:'A' | got:'A' | concept: 'hold scissors'
6141 | expected:'D' | got:'D' | concept: 'hold scissors'
6142 | expected:'B' | got:'B' | concept: 'hold scissors'
6143 | expected:'D' | got:'C' | concept: 'hold scissors'
6144 | expected:'D' | got:'A' | concept: 'repair bicycle'
6145 | expected:'C' | got:'C' | concept: 'repair bicycle'
6146 | expected:'C' | got:'C' | concept: 'repair bicycle'
6147 | expected:'D' | got:'A' | concept: 'repair bicycle'
6148 | expected:'C' | got:'C' | concept: 'repair truck'
6149 | expected:'C' | got:'C' | concept: 'repair truck'
6150 | expected:'A' | got:'A' | concept: 'repair truck'
6151 | expected:'B' | got:'B' | concept: 'repair truck'
6152 | expected:'C' | got:'C' | concept: 'ride bicycle'
6153 | expected:'C' | got:'C' | concept: 'ride bicycle'
6154 | expected:'C' | got:'C' | concept: 'ride bicycle'
6155 | expected:'B' | got:'B' | concept: 'ride bicycle'
6156 | expected:'D' | got:'D' | concept: 'sit_on truck'
6157 | expected:'B' | got:'B' | concept: 'sit_on truck'
6158 | expected:'C' | got:'C' | concept: 'sit_on truck'
6159 | expected:'B' | got:'A' | concept: 'sit_on truck'
6160 | expected:'D' | got:'D' | concept: 'inspect motorcycle'
6161 | expected:'D' | got:'D' | concept: 'inspect motorcycle'
6162 | expected:'D' | got:'D' | concept: 'inspect motorcycle'
6163 | expected:'B' | got:'B' | concept: 'inspect motorcycle'
6164 | expected:'C' | got:'A' | concept: 'turn motorcycle'
6165 | expected:'A' | got:'D' | concept: 'turn motorcycle'
6166 | expected:'D' | got:'A' | concept: 'turn motorcycle'
6167 | expected:'A' | got:'B' | concept: 'turn motorcycle'
6168 | expected:'A' | got:'A' | concept: 'ride motorcycle'
6169 | expected:'D' | got:'D' | concept: 'ride motorcycle'
6170 | expected:'B' | got:'B' | concept: 'ride motorcycle'
6171 | expected:'D' | got:'D' | concept: 'ride motorcycle'
6172 | expected:'A' | got:'A' | concept: 'wash motorcycle'
6173 | expected:'C' | got:'C' | concept: 'wash motorcycle'
6174 | expected:'A' | got:'A' | concept: 'wash motorcycle'
6175 | expected:'C' | got:'C' | concept: 'wash motorcycle'
6176 | expected:'D' | got:'A' | concept: 'hold apple'
6177 | expected:'B' | got:'B' | concept: 'hold apple'
6178 | expected:'D' | got:'D' | concept: 'hold apple'
6179 | expected:'D' | got:'D' | concept: 'hold apple'
6180 | expected:'D' | got:'A' | concept: 'hold banana'
6181 | expected:'A' | got:'A' | concept: 'hold banana'
6182 | expected:'A' | got:'A' | concept: 'hold banana'
6183 | expected:'D' | got:'A' | concept: 'hold banana'
6184 | expected:'B' | got:'B' | concept: 'hold skateboard'
6185 | expected:'B' | got:'B' | concept: 'hold skateboard'
6186 | expected:'A' | got:'A' | concept: 'hold skateboard'
6187 | expected:'B' | got:'B' | concept: 'hold skateboard'
6188 | expected:'B' | got:'B' | concept: 'hold kite'
6189 | expected:'C' | got:'C' | concept: 'hold kite'
6190 | expected:'A' | got:'A' | concept: 'hold kite'
6191 | expected:'D' | got:'D' | concept: 'hold kite'
6192 | expected:'A' | got:'A' | concept: 'jump snowboard'
6193 | expected:'D' | got:'A' | concept: 'jump snowboard'
6194 | expected:'A' | got:'A' | concept: 'jump snowboard'
6195 | expected:'A' | got:'A' | concept: 'jump snowboard'
6196 | expected:'D' | got:'D' | concept: 'sit_on bench'
6197 | expected:'C' | got:'C' | concept: 'sit_on bench'
6198 | expected:'A' | got:'A' | concept: 'sit_on bench'
6199 | expected:'B' | got:'B' | concept: 'sit_on bench'
6200 | expected:'C' | got:'C' | concept: 'eat_at dining_table'
6201 | expected:'A' | got:'C' | concept: 'eat_at dining_table'
6202 | expected:'B' | got:'D' | concept: 'eat_at dining_table'
6203 | expected:'C' | got:'C' | concept: 'eat_at dining_table'
6204 | expected:'A' | got:'D' | concept: 'sit_at dining_table'
6205 | expected:'D' | got:'D' | concept: 'sit_at dining_table'
6206 | expected:'A' | got:'B' | concept: 'sit_at dining_table'
6207 | expected:'B' | got:'C' | concept: 'sit_at dining_table'
6208 | expected:'C' | got:'C' | concept: 'hold knife'
6209 | expected:'A' | got:'C' | concept: 'hold knife'
6210 | expected:'D' | got:'D' | concept: 'hold knife'
6211 | expected:'A' | got:'A' | concept: 'hold knife'
6212 | expected:'B' | got:'B' | concept: 'hold skateboard'
6213 | expected:'B' | got:'B' | concept: 'hold skateboard'
6214 | expected:'B' | got:'B' | concept: 'hold skateboard'
6215 | expected:'C' | got:'C' | concept: 'hold skateboard'
6216 | expected:'A' | got:'A' | concept: 'hold cake'
6217 | expected:'A' | got:'A' | concept: 'hold cake'
6218 | expected:'B' | got:'INVALID' | concept: 'hold cake'
6219 | expected:'A' | got:'A' | concept: 'hold cake'
6220 | expected:'B' | got:'B' | concept: 'hold banana'
6221 | expected:'D' | got:'A' | concept: 'hold banana'
6222 | expected:'C' | got:'C' | concept: 'hold banana'
6223 | expected:'A' | got:'A' | concept: 'hold banana'
6224 | expected:'C' | got:'C' | concept: 'sit_on motorcycle'
6225 | expected:'C' | got:'C' | concept: 'sit_on motorcycle'
6226 | expected:'C' | got:'C' | concept: 'sit_on motorcycle'
6227 | expected:'C' | got:'C' | concept: 'sit_on motorcycle'
6228 | expected:'C' | got:'C' | concept: 'sit_on bench'
6229 | expected:'A' | got:'A' | concept: 'sit_on bench'
6230 | expected:'C' | got:'C' | concept: 'sit_on bench'
6231 | expected:'B' | got:'B' | concept: 'sit_on bench'
6232 | expected:'B' | got:'B' | concept: 'sit_on_with_multiple_person bench'
6233 | expected:'C' | got:'C' | concept: 'sit_on_with_multiple_person bench'
6234 | expected:'A' | got:'A' | concept: 'sit_on_with_multiple_person bench'
6235 | expected:'B' | got:'B' | concept: 'sit_on_with_multiple_person bench'
6236 | expected:'A' | got:'A' | concept: 'sit_on bed'
6237 | expected:'D' | got:'D' | concept: 'sit_on bed'
6238 | expected:'C' | got:'C' | concept: 'sit_on bed'
6239 | expected:'B' | got:'B' | concept: 'sit_on bed'
6240 | expected:'D' | got:'D' | concept: 'greet person'
6241 | expected:'A' | got:'D' | concept: 'greet person'
6242 | expected:'A' | got:'A' | concept: 'greet person'
6243 | expected:'D' | got:'C' | concept: 'greet person'
6244 | expected:'D' | got:'D' | concept: 'kiss person'
6245 | expected:'A' | got:'A' | concept: 'kiss person'
6246 | expected:'C' | got:'C' | concept: 'kiss person'
6247 | expected:'B' | got:'B' | concept: 'kiss person'
6248 | expected:'C' | got:'C' | concept: 'kiss horse'
6249 | expected:'B' | got:'B' | concept: 'kiss horse'
6250 | expected:'C' | got:'C' | concept: 'kiss horse'
6251 | expected:'B' | got:'B' | concept: 'kiss horse'
6252 | expected:'C' | got:'C' | concept: 'hug person'
6253 | expected:'C' | got:'C' | concept: 'hug person'
6254 | expected:'C' | got:'C' | concept: 'hug person'
6255 | expected:'D' | got:'D' | concept: 'hug person'
6256 | expected:'D' | got:'B' | concept: 'lie_on couch'
6257 | expected:'C' | got:'C' | concept: 'lie_on couch'
6258 | expected:'A' | got:'A' | concept: 'lie_on couch'
6259 | expected:'A' | got:'D' | concept: 'lie_on couch'
6260 | expected:'C' | got:'C' | concept: 'lie_on bench'
6261 | expected:'D' | got:'B' | concept: 'lie_on bench'
6262 | expected:'B' | got:'B' | concept: 'lie_on bench'
6263 | expected:'C' | got:'C' | concept: 'lie_on bench'
6264 | expected:'B' | got:'B' | concept: 'lie_on bed'
6265 | expected:'C' | got:'C' | concept: 'lie_on bed'
6266 | expected:'B' | got:'B' | concept: 'lie_on bed'
6267 | expected:'A' | got:'A' | concept: 'lie_on bed'
6268 | expected:'A' | got:'C' | concept: 'sit_on couch'
6269 | expected:'C' | got:'C' | concept: 'sit_on couch'
6270 | expected:'C' | got:'C' | concept: 'sit_on couch'
6271 | expected:'B' | got:'B' | concept: 'sit_on couch'
6272 | expected:'A' | got:'A' | concept: 'walk horse'
6273 | expected:'C' | got:'C' | concept: 'walk horse'
6274 | expected:'C' | got:'C' | concept: 'walk horse'
6275 | expected:'D' | got:'A' | concept: 'walk horse'
6276 | expected:'D' | got:'D' | concept: 'kiss horse'
6277 | expected:'D' | got:'D' | concept: 'kiss horse'
6278 | expected:'A' | got:'A' | concept: 'kiss horse'
6279 | expected:'C' | got:'C' | concept: 'kiss horse'
6280 | expected:'B' | got:'B' | concept: 'hug horse'
6281 | expected:'A' | got:'A' | concept: 'hug horse'
6282 | expected:'A' | got:'B' | concept: 'hug horse'
6283 | expected:'C' | got:'C' | concept: 'hug horse'
6284 | expected:'A' | got:'A' | concept: 'kiss person'
6285 | expected:'A' | got:'A' | concept: 'kiss person'
6286 | expected:'B' | got:'INVALID' | concept: 'kiss person'
6287 | expected:'D' | got:'D' | concept: 'kiss person'
6288 | expected:'B' | got:'B' | concept: 'hold banana'
6289 | expected:'B' | got:'B' | concept: 'hold banana'
6290 | expected:'A' | got:'A' | concept: 'hold banana'
6291 | expected:'C' | got:'C' | concept: 'hold banana'
6292 | expected:'C' | got:'C' | concept: 'hold skateboard'
6293 | expected:'D' | got:'D' | concept: 'hold skateboard'
6294 | expected:'C' | got:'C' | concept: 'hold skateboard'
6295 | expected:'C' | got:'C' | concept: 'hold skateboard'
6296 | expected:'D' | got:'A' | concept: 'hold orange'
6297 | expected:'A' | got:'A' | concept: 'hold orange'
6298 | expected:'B' | got:'B' | concept: 'hold orange'
6299 | expected:'B' | got:'B' | concept: 'hold orange'
6300 | expected:'A' | got:'A' | concept: 'hold dog'
6301 | expected:'A' | got:'A' | concept: 'hold dog'
6302 | expected:'D' | got:'D' | concept: 'hold dog'
6303 | expected:'D' | got:'D' | concept: 'hold dog'
6304 | expected:'A' | got:'A' | concept: 'hold skateboard'
6305 | expected:'D' | got:'D' | concept: 'hold skateboard'
6306 | expected:'B' | got:'B' | concept: 'hold skateboard'
6307 | expected:'B' | got:'B' | concept: 'hold skateboard'
6308 | expected:'A' | got:'A' | concept: 'hold cup'
6309 | expected:'D' | got:'D' | concept: 'hold cup'
6310 | expected:'A' | got:'A' | concept: 'hold cup'
6311 | expected:'C' | got:'C' | concept: 'hold cup'
6312 | expected:'A' | got:'A' | concept: 'hold banana'
6313 | expected:'B' | got:'B' | concept: 'hold banana'
6314 | expected:'D' | got:'D' | concept: 'hold banana'
6315 | expected:'B' | got:'B' | concept: 'hold banana'
6316 | expected:'D' | got:'D' | concept: 'hold tennis_racket'
6317 | expected:'B' | got:'B' | concept: 'hold tennis_racket'
6318 | expected:'B' | got:'B' | concept: 'hold tennis_racket'
6319 | expected:'A' | got:'A' | concept: 'hold tennis_racket'
6320 | expected:'C' | got:'C' | concept: 'hold remote'
6321 | expected:'B' | got:'B' | concept: 'hold remote'
6322 | expected:'D' | got:'D' | concept: 'hold remote'
6323 | expected:'A' | got:'A' | concept: 'hold remote'
6324 | expected:'C' | got:'C' | concept: 'hold toothbrush'
6325 | expected:'C' | got:'C' | concept: 'hold toothbrush'
6326 | expected:'C' | got:'C' | concept: 'hold toothbrush'
6327 | expected:'D' | got:'D' | concept: 'hold toothbrush'
6328 | expected:'A' | got:'C' | concept: 'point_at_camera remote'
6329 | expected:'D' | got:'B' | concept: 'point_at_camera remote'
6330 | expected:'C' | got:'C' | concept: 'point_at_camera remote'
6331 | expected:'C' | got:'D' | concept: 'point_at_camera remote'
6332 | expected:'C' | got:'C' | concept: 'hold tennis_racket'
6333 | expected:'A' | got:'A' | concept: 'hold tennis_racket'
6334 | expected:'C' | got:'C' | concept: 'hold tennis_racket'
6335 | expected:'D' | got:'D' | concept: 'hold tennis_racket'
6336 | expected:'A' | got:'A' | concept: 'ride horse'
6337 | expected:'B' | got:'B' | concept: 'ride horse'
6338 | expected:'B' | got:'B' | concept: 'ride horse'
6339 | expected:'D' | got:'D' | concept: 'ride horse'
6340 | expected:'D' | got:'D' | concept: 'ride elephant'
6341 | expected:'C' | got:'C' | concept: 'ride elephant'
6342 | expected:'B' | got:'B' | concept: 'ride elephant'
6343 | expected:'D' | got:'D' | concept: 'ride elephant'
6344 | expected:'D' | got:'D' | concept: 'ride bicycle'
6345 | expected:'D' | got:'D' | concept: 'ride bicycle'
6346 | expected:'D' | got:'D' | concept: 'ride bicycle'
6347 | expected:'A' | got:'A' | concept: 'ride bicycle'
6348 | expected:'B' | got:'B' | concept: 'ride motorcycle'
6349 | expected:'D' | got:'D' | concept: 'ride motorcycle'
6350 | expected:'A' | got:'A' | concept: 'ride motorcycle'
6351 | expected:'C' | got:'C' | concept: 'ride motorcycle'
6352 | expected:'C' | got:'C' | concept: 'cut cake'
6353 | expected:'A' | got:'A' | concept: 'cut cake'
6354 | expected:'D' | got:'D' | concept: 'cut cake'
6355 | expected:'C' | got:'C' | concept: 'cut cake'
6356 | expected:'D' | got:'C' | concept: 'hold cake'
6357 | expected:'C' | got:'A' | concept: 'hold cake'
6358 | expected:'A' | got:'D' | concept: 'hold cake'
6359 | expected:'C' | got:'C' | concept: 'hold cake'
6360 | expected:'B' | got:'B' | concept: 'cut pizza'
6361 | expected:'C' | got:'C' | concept: 'cut pizza'
6362 | expected:'C' | got:'C' | concept: 'cut pizza'
6363 | expected:'A' | got:'C' | concept: 'cut pizza'
6364 | expected:'C' | got:'C' | concept: 'eat pizza'
6365 | expected:'A' | got:'A' | concept: 'eat pizza'
6366 | expected:'D' | got:'A' | concept: 'eat pizza'
6367 | expected:'B' | got:'B' | concept: 'eat pizza'
6368 | expected:'D' | got:'D' | concept: 'kiss person'
6369 | expected:'A' | got:'C' | concept: 'kiss person'
6370 | expected:'D' | got:'D' | concept: 'kiss person'
6371 | expected:'C' | got:'C' | concept: 'kiss person'
6372 | expected:'A' | got:'A' | concept: 'greet person'
6373 | expected:'C' | got:'C' | concept: 'greet person'
6374 | expected:'C' | got:'C' | concept: 'greet person'
6375 | expected:'A' | got:'A' | concept: 'greet person'
6376 | expected:'D' | got:'D' | concept: 'hug horse'
6377 | expected:'C' | got:'C' | concept: 'hug horse'
6378 | expected:'D' | got:'D' | concept: 'hug horse'
6379 | expected:'D' | got:'D' | concept: 'hug horse'
6380 | expected:'D' | got:'D' | concept: 'hug person'
6381 | expected:'A' | got:'A' | concept: 'hug person'
6382 | expected:'A' | got:'A' | concept: 'hug person'
6383 | expected:'B' | got:'B' | concept: 'hug person'
6384 | expected:'B' | got:'B' | concept: 'hold remote'
6385 | expected:'A' | got:'A' | concept: 'hold remote'
6386 | expected:'D' | got:'D' | concept: 'hold remote'
6387 | expected:'B' | got:'B' | concept: 'hold remote'
6388 | expected:'D' | got:'D' | concept: 'swing tennis_racket'
6389 | expected:'A' | got:'A' | concept: 'swing tennis_racket'
6390 | expected:'C' | got:'C' | concept: 'swing tennis_racket'
6391 | expected:'D' | got:'D' | concept: 'swing tennis_racket'
6392 | expected:'A' | got:'A' | concept: 'hold kite'
6393 | expected:'C' | got:'C' | concept: 'hold kite'
6394 | expected:'D' | got:'D' | concept: 'hold kite'
6395 | expected:'A' | got:'A' | concept: 'hold kite'
6396 | expected:'D' | got:'B' | concept: 'hold tennis_racket'
6397 | expected:'A' | got:'A' | concept: 'hold tennis_racket'
6398 | expected:'B' | got:'A' | concept: 'hold tennis_racket'
6399 | expected:'B' | got:'C' | concept: 'hold tennis_racket'
6400 | expected:'C' | got:'A' | concept: 'sit_on truck'
6401 | expected:'C' | got:'C' | concept: 'sit_on truck'
6402 | expected:'D' | got:'D' | concept: 'sit_on truck'
6403 | expected:'C' | got:'C' | concept: 'sit_on truck'
6404 | expected:'B' | got:'B' | concept: 'repair truck'
6405 | expected:'A' | got:'A' | concept: 'repair truck'
6406 | expected:'C' | got:'A' | concept: 'repair truck'
6407 | expected:'D' | got:'A' | concept: 'repair truck'
6408 | expected:'B' | got:'A' | concept: 'load truck'
6409 | expected:'B' | got:'B' | concept: 'load truck'
6410 | expected:'A' | got:'A' | concept: 'load truck'
6411 | expected:'B' | got:'B' | concept: 'load truck'
6412 | expected:'C' | got:'C' | concept: 'sit_on couch'
6413 | expected:'D' | got:'D' | concept: 'sit_on couch'
6414 | expected:'A' | got:'A' | concept: 'sit_on couch'
6415 | expected:'A' | got:'A' | concept: 'sit_on couch'
6416 | expected:'D' | got:'D' | concept: 'hold apple'
6417 | expected:'A' | got:'A' | concept: 'hold apple'
6418 | expected:'C' | got:'C' | concept: 'hold apple'
6419 | expected:'A' | got:'A' | concept: 'hold apple'
6420 | expected:'D' | got:'D' | concept: 'hold tennis_racket'
6421 | expected:'D' | got:'D' | concept: 'hold tennis_racket'
6422 | expected:'B' | got:'B' | concept: 'hold tennis_racket'
6423 | expected:'C' | got:'C' | concept: 'hold tennis_racket'
6424 | expected:'D' | got:'D' | concept: 'hold dog'
6425 | expected:'B' | got:'B' | concept: 'hold dog'
6426 | expected:'A' | got:'A' | concept: 'hold dog'
6427 | expected:'A' | got:'A' | concept: 'hold dog'
6428 | expected:'D' | got:'D' | concept: 'hold kite'
6429 | expected:'A' | got:'A' | concept: 'hold kite'
6430 | expected:'B' | got:'B' | concept: 'hold kite'
6431 | expected:'A' | got:'A' | concept: 'hold kite'
6432 | expected:'C' | got:'D' | concept: 'toast wine_glass'
6433 | expected:'C' | got:'D' | concept: 'toast wine_glass'
6434 | expected:'A' | got:'C' | concept: 'toast wine_glass'
6435 | expected:'C' | got:'C' | concept: 'toast wine_glass'
6436 | expected:'B' | got:'B' | concept: 'hold orange'
6437 | expected:'A' | got:'A' | concept: 'hold orange'
6438 | expected:'D' | got:'A' | concept: 'hold orange'
6439 | expected:'C' | got:'C' | concept: 'hold orange'
6440 | expected:'C' | got:'A' | concept: 'hold wine_glass'
6441 | expected:'A' | got:'A' | concept: 'hold wine_glass'
6442 | expected:'C' | got:'C' | concept: 'hold wine_glass'
6443 | expected:'C' | got:'C' | concept: 'hold wine_glass'
6444 | expected:'A' | got:'D' | concept: 'hold toothbrush'
6445 | expected:'A' | got:'A' | concept: 'hold toothbrush'
6446 | expected:'C' | got:'C' | concept: 'hold toothbrush'
6447 | expected:'C' | got:'B' | concept: 'hold toothbrush'
6448 | expected:'D' | got:'D' | concept: 'ride motorcycle'
6449 | expected:'D' | got:'D' | concept: 'ride motorcycle'
6450 | expected:'A' | got:'C' | concept: 'ride motorcycle'
6451 | expected:'B' | got:'B' | concept: 'ride motorcycle'
6452 | expected:'B' | got:'B' | concept: 'sit_on motorcycle'
6453 | expected:'A' | got:'D' | concept: 'sit_on motorcycle'
6454 | expected:'D' | got:'D' | concept: 'sit_on motorcycle'
6455 | expected:'B' | got:'B' | concept: 'sit_on motorcycle'
6456 | expected:'D' | got:'C' | concept: 'sit_on couch'
6457 | expected:'D' | got:'D' | concept: 'sit_on couch'
6458 | expected:'C' | got:'C' | concept: 'sit_on couch'
6459 | expected:'A' | got:'A' | concept: 'sit_on couch'
6460 | expected:'B' | got:'C' | concept: 'straddle motorcycle'
6461 | expected:'D' | got:'D' | concept: 'straddle motorcycle'
6462 | expected:'B' | got:'D' | concept: 'straddle motorcycle'
6463 | expected:'B' | got:'D' | concept: 'straddle motorcycle'
6464 | expected:'D' | got:'D' | concept: 'turn motorcycle'
6465 | expected:'A' | got:'C' | concept: 'turn motorcycle'
6466 | expected:'C' | got:'C' | concept: 'turn motorcycle'
6467 | expected:'A' | got:'C' | concept: 'turn motorcycle'
6468 | expected:'D' | got:'D' | concept: 'jump motorcycle'
6469 | expected:'D' | got:'D' | concept: 'jump motorcycle'
6470 | expected:'A' | got:'C' | concept: 'jump motorcycle'
6471 | expected:'D' | got:'D' | concept: 'jump motorcycle'
6472 | expected:'C' | got:'A' | concept: 'straddle motorcycle'
6473 | expected:'D' | got:'D' | concept: 'straddle motorcycle'
6474 | expected:'D' | got:'D' | concept: 'straddle motorcycle'
6475 | expected:'B' | got:'B' | concept: 'straddle motorcycle'
6476 | expected:'C' | got:'C' | concept: 'jump snowboard'
6477 | expected:'C' | got:'C' | concept: 'jump snowboard'
6478 | expected:'A' | got:'A' | concept: 'jump snowboard'
6479 | expected:'D' | got:'A' | concept: 'jump snowboard'
6480 | expected:'D' | got:'D' | concept: 'ride elephant'
6481 | expected:'A' | got:'A' | concept: 'ride elephant'
6482 | expected:'C' | got:'C' | concept: 'ride elephant'
6483 | expected:'A' | got:'A' | concept: 'ride elephant'
6484 | expected:'A' | got:'A' | concept: 'ride bicycle'
6485 | expected:'A' | got:'A' | concept: 'ride bicycle'
6486 | expected:'B' | got:'B' | concept: 'ride bicycle'
6487 | expected:'B' | got:'B' | concept: 'ride bicycle'
6488 | expected:'D' | got:'D' | concept: 'kiss horse'
6489 | expected:'B' | got:'B' | concept: 'kiss horse'
6490 | expected:'D' | got:'D' | concept: 'kiss horse'
6491 | expected:'B' | got:'B' | concept: 'kiss horse'
6492 | expected:'D' | got:'D' | concept: 'ride horse'
6493 | expected:'C' | got:'C' | concept: 'ride horse'
6494 | expected:'C' | got:'C' | concept: 'ride horse'
6495 | expected:'A' | got:'A' | concept: 'ride horse'
6496 | expected:'D' | got:'D' | concept: 'straddle motorcycle'
6497 | expected:'B' | got:'B' | concept: 'straddle motorcycle'
6498 | expected:'D' | got:'D' | concept: 'straddle motorcycle'
6499 | expected:'D' | got:'A' | concept: 'straddle motorcycle'
6500 | expected:'B' | got:'B' | concept: 'ride motorcycle'
6501 | expected:'B' | got:'D' | concept: 'ride motorcycle'
6502 | expected:'D' | got:'D' | concept: 'ride motorcycle'
6503 | expected:'C' | got:'C' | concept: 'ride motorcycle'
6504 | expected:'D' | got:'D' | concept: 'jump motorcycle'
6505 | expected:'C' | got:'C' | concept: 'jump motorcycle'
6506 | expected:'C' | got:'C' | concept: 'jump motorcycle'
6507 | expected:'A' | got:'A' | concept: 'jump motorcycle'
6508 | expected:'D' | got:'D' | concept: 'wash motorcycle'
6509 | expected:'D' | got:'D' | concept: 'wash motorcycle'
6510 | expected:'D' | got:'D' | concept: 'wash motorcycle'
6511 | expected:'D' | got:'D' | concept: 'wash motorcycle'
6512 | expected:'D' | got:'D' | concept: 'ride motorcycle'
6513 | expected:'C' | got:'C' | concept: 'ride motorcycle'
6514 | expected:'A' | got:'A' | concept: 'ride motorcycle'
6515 | expected:'B' | got:'B' | concept: 'ride motorcycle'
6516 | expected:'B' | got:'B' | concept: 'ride horse'
6517 | expected:'B' | got:'B' | concept: 'ride horse'
6518 | expected:'A' | got:'A' | concept: 'ride horse'
6519 | expected:'B' | got:'B' | concept: 'ride horse'
6520 | expected:'A' | got:'A' | concept: 'ride skis'
6521 | expected:'B' | got:'B' | concept: 'ride skis'
6522 | expected:'A' | got:'A' | concept: 'ride skis'
6523 | expected:'A' | got:'A' | concept: 'ride skis'
6524 | expected:'C' | got:'C' | concept: 'ride skateboard'
6525 | expected:'D' | got:'D' | concept: 'ride skateboard'
6526 | expected:'A' | got:'A' | concept: 'ride skateboard'
6527 | expected:'D' | got:'D' | concept: 'ride skateboard'
6528 | expected:'A' | got:'A' | concept: 'jump snowboard'
6529 | expected:'A' | got:'D' | concept: 'jump snowboard'
6530 | expected:'A' | got:'A' | concept: 'jump snowboard'
6531 | expected:'D' | got:'D' | concept: 'jump snowboard'
6532 | expected:'D' | got:'D' | concept: 'jump skateboard'
6533 | expected:'D' | got:'D' | concept: 'jump skateboard'
6534 | expected:'D' | got:'D' | concept: 'jump skateboard'
6535 | expected:'D' | got:'D' | concept: 'jump skateboard'
6536 | expected:'D' | got:'A' | concept: 'hold skateboard'
6537 | expected:'C' | got:'C' | concept: 'hold skateboard'
6538 | expected:'C' | got:'C' | concept: 'hold skateboard'
6539 | expected:'B' | got:'D' | concept: 'hold skateboard'
6540 | expected:'B' | got:'D' | concept: 'ride skateboard'
6541 | expected:'C' | got:'D' | concept: 'ride skateboard'
6542 | expected:'D' | got:'C' | concept: 'ride skateboard'
6543 | expected:'C' | got:'C' | concept: 'ride skateboard'
6544 | expected:'D' | got:'C' | concept: 'drink_with cup'
6545 | expected:'C' | got:'C' | concept: 'drink_with cup'
6546 | expected:'B' | got:'B' | concept: 'drink_with cup'
6547 | expected:'C' | got:'C' | concept: 'drink_with cup'
6548 | expected:'D' | got:'D' | concept: 'hold remote'
6549 | expected:'A' | got:'A' | concept: 'hold remote'
6550 | expected:'B' | got:'B' | concept: 'hold remote'
6551 | expected:'D' | got:'D' | concept: 'hold remote'
6552 | expected:'A' | got:'C' | concept: 'hold cup'
6553 | expected:'D' | got:'D' | concept: 'hold cup'
6554 | expected:'B' | got:'C' | concept: 'hold cup'
6555 | expected:'A' | got:'C' | concept: 'hold cup'
6556 | expected:'A' | got:'A' | concept: 'hold dog'
6557 | expected:'B' | got:'B' | concept: 'hold dog'
6558 | expected:'C' | got:'C' | concept: 'hold dog'
6559 | expected:'B' | got:'B' | concept: 'hold dog'
6560 | expected:'B' | got:'B' | concept: 'sit_on motorcycle'
6561 | expected:'A' | got:'A' | concept: 'sit_on motorcycle'
6562 | expected:'D' | got:'D' | concept: 'sit_on motorcycle'
6563 | expected:'C' | got:'C' | concept: 'sit_on motorcycle'
6564 | expected:'A' | got:'A' | concept: 'sit_on chair'
6565 | expected:'C' | got:'C' | concept: 'sit_on chair'
6566 | expected:'B' | got:'D' | concept: 'sit_on chair'
6567 | expected:'A' | got:'D' | concept: 'sit_on chair'
6568 | expected:'B' | got:'B' | concept: 'sit_on bed'
6569 | expected:'B' | got:'B' | concept: 'sit_on bed'
6570 | expected:'A' | got:'A' | concept: 'sit_on bed'
6571 | expected:'A' | got:'D' | concept: 'sit_on bed'
6572 | expected:'A' | got:'D' | concept: 'lie_on_like chair'
6573 | expected:'B' | got:'B' | concept: 'lie_on_like chair'
6574 | expected:'C' | got:'D' | concept: 'lie_on_like chair'
6575 | expected:'B' | got:'A' | concept: 'lie_on_like chair'
6576 | expected:'A' | got:'B' | concept: 'hold cell_phone'
6577 | expected:'A' | got:'C' | concept: 'hold cell_phone'
6578 | expected:'C' | got:'C' | concept: 'hold cell_phone'
6579 | expected:'C' | got:'C' | concept: 'hold cell_phone'
6580 | expected:'D' | got:'A' | concept: 'read_like cell_phone'
6581 | expected:'D' | got:'B' | concept: 'read_like cell_phone'
6582 | expected:'D' | got:'A' | concept: 'read_like cell_phone'
6583 | expected:'B' | got:'C' | concept: 'read_like cell_phone'
6584 | expected:'C' | got:'C' | concept: 'talk_on_or_listen_to cell_phone'
6585 | expected:'C' | got:'C' | concept: 'talk_on_or_listen_to cell_phone'
6586 | expected:'D' | got:'D' | concept: 'talk_on_or_listen_to cell_phone'
6587 | expected:'A' | got:'A' | concept: 'talk_on_or_listen_to cell_phone'
6588 | expected:'C' | got:'C' | concept: 'hold wine_glass'
6589 | expected:'C' | got:'C' | concept: 'hold wine_glass'
6590 | expected:'C' | got:'C' | concept: 'hold wine_glass'
6591 | expected:'C' | got:'C' | concept: 'hold wine_glass'
6592 | expected:'C' | got:'C' | concept: 'point_at_camera remote'
6593 | expected:'D' | got:'C' | concept: 'point_at_camera remote'
6594 | expected:'A' | got:'A' | concept: 'point_at_camera remote'
6595 | expected:'C' | got:'C' | concept: 'point_at_camera remote'
6596 | expected:'C' | got:'C' | concept: 'hold apple'
6597 | expected:'B' | got:'B' | concept: 'hold apple'
6598 | expected:'D' | got:'A' | concept: 'hold apple'
6599 | expected:'B' | got:'B' | concept: 'hold apple'
6600 | expected:'A' | got:'B' | concept: 'hold wine_glass'
6601 | expected:'C' | got:'A' | concept: 'hold wine_glass'
6602 | expected:'C' | got:'C' | concept: 'hold wine_glass'
6603 | expected:'C' | got:'C' | concept: 'hold wine_glass'
6604 | expected:'A' | got:'A' | concept: 'hold remote'
6605 | expected:'A' | got:'A' | concept: 'hold remote'
6606 | expected:'C' | got:'C' | concept: 'hold remote'
6607 | expected:'A' | got:'A' | concept: 'hold remote'
6608 | expected:'D' | got:'B' | concept: 'hold toothbrush'
6609 | expected:'B' | got:'B' | concept: 'hold toothbrush'
6610 | expected:'D' | got:'B' | concept: 'hold toothbrush'
6611 | expected:'C' | got:'C' | concept: 'hold toothbrush'
6612 | expected:'A' | got:'A' | concept: 'hold cell_phone'
6613 | expected:'D' | got:'D' | concept: 'hold cell_phone'
6614 | expected:'B' | got:'B' | concept: 'hold cell_phone'
6615 | expected:'A' | got:'A' | concept: 'hold cell_phone'
6616 | expected:'D' | got:'D' | concept: 'fly kite'
6617 | expected:'D' | got:'D' | concept: 'fly kite'
6618 | expected:'B' | got:'B' | concept: 'fly kite'
6619 | expected:'A' | got:'A' | concept: 'fly kite'
6620 | expected:'C' | got:'B' | concept: 'hold kite'
6621 | expected:'B' | got:'D' | concept: 'hold kite'
6622 | expected:'B' | got:'C' | concept: 'hold kite'
6623 | expected:'D' | got:'D' | concept: 'hold kite'
6624 | expected:'B' | got:'B' | concept: 'hold apple'
6625 | expected:'C' | got:'C' | concept: 'hold apple'
6626 | expected:'B' | got:'B' | concept: 'hold apple'
6627 | expected:'C' | got:'C' | concept: 'hold apple'
6628 | expected:'B' | got:'B' | concept: 'hold book'
6629 | expected:'B' | got:'B' | concept: 'hold book'
6630 | expected:'C' | got:'C' | concept: 'hold book'
6631 | expected:'C' | got:'C' | concept: 'hold book'
6632 | expected:'D' | got:'A' | concept: 'hold handbag'
6633 | expected:'A' | got:'A' | concept: 'hold handbag'
6634 | expected:'B' | got:'B' | concept: 'hold handbag'
6635 | expected:'B' | got:'B' | concept: 'hold handbag'
6636 | expected:'D' | got:'A' | concept: 'hold cake'
6637 | expected:'C' | got:'A' | concept: 'hold cake'
6638 | expected:'A' | got:'A' | concept: 'hold cake'
6639 | expected:'D' | got:'A' | concept: 'hold cake'
6640 | expected:'B' | got:'D' | concept: 'hold cell_phone'
6641 | expected:'C' | got:'A' | concept: 'hold cell_phone'
6642 | expected:'B' | got:'B' | concept: 'hold cell_phone'
6643 | expected:'A' | got:'D' | concept: 'hold cell_phone'
6644 | expected:'B' | got:'B' | concept: 'talk_on_or_listen_to cell_phone'
6645 | expected:'C' | got:'C' | concept: 'talk_on_or_listen_to cell_phone'
6646 | expected:'B' | got:'B' | concept: 'talk_on_or_listen_to cell_phone'
6647 | expected:'B' | got:'B' | concept: 'talk_on_or_listen_to cell_phone'
6648 | expected:'D' | got:'A' | concept: 'hold apple'
6649 | expected:'D' | got:'A' | concept: 'hold apple'
6650 | expected:'C' | got:'C' | concept: 'hold apple'
6651 | expected:'A' | got:'A' | concept: 'hold apple'
6652 | expected:'C' | got:'D' | concept: 'read_like cell_phone'
6653 | expected:'C' | got:'B' | concept: 'read_like cell_phone'
6654 | expected:'C' | got:'D' | concept: 'read_like cell_phone'
6655 | expected:'A' | got:'C' | concept: 'read_like cell_phone'
6656 | expected:'A' | got:'A' | concept: 'type_on laptop'
6657 | expected:'C' | got:'C' | concept: 'type_on laptop'
6658 | expected:'C' | got:'C' | concept: 'type_on laptop'
6659 | expected:'A' | got:'B' | concept: 'type_on laptop'
6660 | expected:'D' | got:'A' | concept: 'clean keyboard'
6661 | expected:'A' | got:'A' | concept: 'clean keyboard'
6662 | expected:'D' | got:'A' | concept: 'clean keyboard'
6663 | expected:'C' | got:'C' | concept: 'clean keyboard'
6664 | expected:'A' | got:'A' | concept: 'clean oven'
6665 | expected:'C' | got:'C' | concept: 'clean oven'
6666 | expected:'B' | got:'B' | concept: 'clean oven'
6667 | expected:'A' | got:'A' | concept: 'clean oven'
6668 | expected:'D' | got:'D' | concept: 'type_on keyboard'
6669 | expected:'C' | got:'D' | concept: 'type_on keyboard'
6670 | expected:'D' | got:'D' | concept: 'type_on keyboard'
6671 | expected:'D' | got:'A' | concept: 'type_on keyboard'
6672 | expected:'C' | got:'C' | concept: 'kiss person'
6673 | expected:'A' | got:'A' | concept: 'kiss person'
6674 | expected:'D' | got:'D' | concept: 'kiss person'
6675 | expected:'C' | got:'C' | concept: 'kiss person'
6676 | expected:'C' | got:'C' | concept: 'greet person'
6677 | expected:'D' | got:'D' | concept: 'greet person'
6678 | expected:'D' | got:'C' | concept: 'greet person'
6679 | expected:'A' | got:'A' | concept: 'greet person'
6680 | expected:'C' | got:'A' | concept: 'hug person'
6681 | expected:'D' | got:'D' | concept: 'hug person'
6682 | expected:'A' | got:'A' | concept: 'hug person'
6683 | expected:'A' | got:'A' | concept: 'hug person'
6684 | expected:'A' | got:'A' | concept: 'kiss horse'
6685 | expected:'D' | got:'D' | concept: 'kiss horse'
6686 | expected:'C' | got:'C' | concept: 'kiss horse'
6687 | expected:'D' | got:'D' | concept: 'kiss horse'
6688 | expected:'C' | got:'C' | concept: 'ride motorcycle'
6689 | expected:'B' | got:'B' | concept: 'ride motorcycle'
6690 | expected:'B' | got:'B' | concept: 'ride motorcycle'
6691 | expected:'B' | got:'B' | concept: 'ride motorcycle'
6692 | expected:'D' | got:'A' | concept: 'push motorcycle'
6693 | expected:'C' | got:'C' | concept: 'push motorcycle'
6694 | expected:'A' | got:'A' | concept: 'push motorcycle'
6695 | expected:'A' | got:'C' | concept: 'push motorcycle'
6696 | expected:'C' | got:'C' | concept: 'inspect motorcycle'
6697 | expected:'D' | got:'A' | concept: 'inspect motorcycle'
6698 | expected:'C' | got:'C' | concept: 'inspect motorcycle'
6699 | expected:'A' | got:'A' | concept: 'inspect motorcycle'
6700 | expected:'D' | got:'C' | concept: 'straddle motorcycle'
6701 | expected:'C' | got:'C' | concept: 'straddle motorcycle'
6702 | expected:'B' | got:'D' | concept: 'straddle motorcycle'
6703 | expected:'B' | got:'B' | concept: 'straddle motorcycle'
6704 | expected:'A' | got:'A' | concept: 'hold cup'
6705 | expected:'B' | got:'B' | concept: 'hold cup'
6706 | expected:'A' | got:'A' | concept: 'hold cup'
6707 | expected:'B' | got:'B' | concept: 'hold cup'
6708 | expected:'C' | got:'C' | concept: 'hold remote'
6709 | expected:'C' | got:'C' | concept: 'hold remote'
6710 | expected:'A' | got:'A' | concept: 'hold remote'
6711 | expected:'A' | got:'A' | concept: 'hold remote'
6712 | expected:'A' | got:'A' | concept: 'hold apple'
6713 | expected:'A' | got:'A' | concept: 'hold apple'
6714 | expected:'A' | got:'A' | concept: 'hold apple'
6715 | expected:'D' | got:'A' | concept: 'hold apple'
6716 | expected:'D' | got:'D' | concept: 'hold cell_phone'
6717 | expected:'A' | got:'A' | concept: 'hold cell_phone'
6718 | expected:'A' | got:'A' | concept: 'hold cell_phone'
6719 | expected:'B' | got:'D' | concept: 'hold cell_phone'
6720 | expected:'B' | got:'B' | concept: 'repair bicycle'
6721 | expected:'A' | got:'A' | concept: 'repair bicycle'
6722 | expected:'B' | got:'B' | concept: 'repair bicycle'
6723 | expected:'D' | got:'A' | concept: 'repair bicycle'
6724 | expected:'C' | got:'C' | concept: 'repair truck'
6725 | expected:'D' | got:'D' | concept: 'repair truck'
6726 | expected:'D' | got:'D' | concept: 'repair truck'
6727 | expected:'C' | got:'C' | concept: 'repair truck'
6728 | expected:'D' | got:'D' | concept: 'load truck'
6729 | expected:'A' | got:'A' | concept: 'load truck'
6730 | expected:'C' | got:'C' | concept: 'load truck'
6731 | expected:'C' | got:'C' | concept: 'load truck'
6732 | expected:'B' | got:'B' | concept: 'sit_on truck'
6733 | expected:'C' | got:'INVALID' | concept: 'sit_on truck'
6734 | expected:'C' | got:'C' | concept: 'sit_on truck'
6735 | expected:'A' | got:'A' | concept: 'sit_on truck'
6736 | expected:'A' | got:'A' | concept: 'ride elephant'
6737 | expected:'B' | got:'B' | concept: 'ride elephant'
6738 | expected:'D' | got:'D' | concept: 'ride elephant'
6739 | expected:'A' | got:'A' | concept: 'ride elephant'
6740 | expected:'A' | got:'A' | concept: 'ride motorcycle'
6741 | expected:'C' | got:'C' | concept: 'ride motorcycle'
6742 | expected:'B' | got:'B' | concept: 'ride motorcycle'
6743 | expected:'C' | got:'C' | concept: 'ride motorcycle'
6744 | expected:'A' | got:'A' | concept: 'wash motorcycle'
6745 | expected:'D' | got:'D' | concept: 'wash motorcycle'
6746 | expected:'D' | got:'D' | concept: 'wash motorcycle'
6747 | expected:'D' | got:'D' | concept: 'wash motorcycle'
6748 | expected:'D' | got:'D' | concept: 'ride skis'
6749 | expected:'D' | got:'D' | concept: 'ride skis'
6750 | expected:'C' | got:'C' | concept: 'ride skis'
6751 | expected:'D' | got:'D' | concept: 'ride skis'
6752 | expected:'C' | got:'C' | concept: 'push motorcycle'
6753 | expected:'D' | got:'D' | concept: 'push motorcycle'
6754 | expected:'A' | got:'A' | concept: 'push motorcycle'
6755 | expected:'A' | got:'B' | concept: 'push motorcycle'
6756 | expected:'D' | got:'D' | concept: 'straddle motorcycle'
6757 | expected:'B' | got:'A' | concept: 'straddle motorcycle'
6758 | expected:'B' | got:'C' | concept: 'straddle motorcycle'
6759 | expected:'D' | got:'D' | concept: 'straddle motorcycle'
6760 | expected:'B' | got:'C' | concept: 'sit_on motorcycle'
6761 | expected:'A' | got:'A' | concept: 'sit_on motorcycle'
6762 | expected:'B' | got:'C' | concept: 'sit_on motorcycle'
6763 | expected:'D' | got:'D' | concept: 'sit_on motorcycle'
6764 | expected:'B' | got:'B' | concept: 'ride motorcycle'
6765 | expected:'D' | got:'D' | concept: 'ride motorcycle'
6766 | expected:'B' | got:'B' | concept: 'ride motorcycle'
6767 | expected:'A' | got:'A' | concept: 'ride motorcycle'
6768 | expected:'C' | got:'C' | concept: 'ride bicycle'
6769 | expected:'A' | got:'A' | concept: 'ride bicycle'
6770 | expected:'B' | got:'B' | concept: 'ride bicycle'
6771 | expected:'B' | got:'B' | concept: 'ride bicycle'
6772 | expected:'D' | got:'D' | concept: 'ride horse'
6773 | expected:'D' | got:'D' | concept: 'ride horse'
6774 | expected:'A' | got:'A' | concept: 'ride horse'
6775 | expected:'C' | got:'C' | concept: 'ride horse'
6776 | expected:'D' | got:'D' | concept: 'ride skateboard'
6777 | expected:'A' | got:'A' | concept: 'ride skateboard'
6778 | expected:'A' | got:'A' | concept: 'ride skateboard'
6779 | expected:'A' | got:'A' | concept: 'ride skateboard'
6780 | expected:'A' | got:'A' | concept: 'ride skis'
6781 | expected:'B' | got:'B' | concept: 'ride skis'
6782 | expected:'C' | got:'C' | concept: 'ride skis'
6783 | expected:'B' | got:'B' | concept: 'ride skis'
6784 | expected:'C' | got:'C' | concept: 'lie_on bed'
6785 | expected:'B' | got:'B' | concept: 'lie_on bed'
6786 | expected:'B' | got:'B' | concept: 'lie_on bed'
6787 | expected:'A' | got:'A' | concept: 'lie_on bed'
6788 | expected:'A' | got:'D' | concept: 'lie_on couch'
6789 | expected:'C' | got:'A' | concept: 'lie_on couch'
6790 | expected:'C' | got:'C' | concept: 'lie_on couch'
6791 | expected:'A' | got:'A' | concept: 'lie_on couch'
6792 | expected:'C' | got:'C' | concept: 'sit_on couch'
6793 | expected:'C' | got:'B' | concept: 'sit_on couch'
6794 | expected:'B' | got:'B' | concept: 'sit_on couch'
6795 | expected:'C' | got:'C' | concept: 'sit_on couch'
6796 | expected:'B' | got:'B' | concept: 'lie_on bench'
6797 | expected:'D' | got:'B' | concept: 'lie_on bench'
6798 | expected:'B' | got:'B' | concept: 'lie_on bench'
6799 | expected:'B' | got:'B' | concept: 'lie_on bench'
6800 | expected:'B' | got:'B' | concept: 'hold book'
6801 | expected:'C' | got:'C' | concept: 'hold book'
6802 | expected:'B' | got:'B' | concept: 'hold book'
6803 | expected:'D' | got:'D' | concept: 'hold book'
6804 | expected:'B' | got:'B' | concept: 'hold dog'
6805 | expected:'C' | got:'C' | concept: 'hold dog'
6806 | expected:'C' | got:'C' | concept: 'hold dog'
6807 | expected:'C' | got:'B' | concept: 'hold dog'
6808 | expected:'C' | got:'B' | concept: 'hold cake'
6809 | expected:'C' | got:'B' | concept: 'hold cake'
6810 | expected:'D' | got:'A' | concept: 'hold cake'
6811 | expected:'D' | got:'C' | concept: 'hold cake'
6812 | expected:'D' | got:'A' | concept: 'hold banana'
6813 | expected:'C' | got:'C' | concept: 'hold banana'
6814 | expected:'B' | got:'B' | concept: 'hold banana'
6815 | expected:'A' | got:'A' | concept: 'hold banana'
6816 | expected:'A' | got:'A' | concept: 'hold book'
6817 | expected:'D' | got:'D' | concept: 'hold book'
6818 | expected:'C' | got:'C' | concept: 'hold book'
6819 | expected:'A' | got:'A' | concept: 'hold book'
6820 | expected:'C' | got:'C' | concept: 'hold laptop'
6821 | expected:'B' | got:'C' | concept: 'hold laptop'
6822 | expected:'D' | got:'D' | concept: 'hold laptop'
6823 | expected:'B' | got:'B' | concept: 'hold laptop'
6824 | expected:'C' | got:'C' | concept: 'hold skateboard'
6825 | expected:'A' | got:'A' | concept: 'hold skateboard'
6826 | expected:'C' | got:'C' | concept: 'hold skateboard'
6827 | expected:'D' | got:'D' | concept: 'hold skateboard'
6828 | expected:'B' | got:'C' | concept: 'hold handbag'
6829 | expected:'C' | got:'C' | concept: 'hold handbag'
6830 | expected:'D' | got:'A' | concept: 'hold handbag'
6831 | expected:'C' | got:'C' | concept: 'hold handbag'
6832 | expected:'D' | got:'A' | concept: 'read laptop'
6833 | expected:'D' | got:'C' | concept: 'read laptop'
6834 | expected:'C' | got:'C' | concept: 'read laptop'
6835 | expected:'A' | got:'A' | concept: 'read laptop'
6836 | expected:'A' | got:'A' | concept: 'read book'
6837 | expected:'D' | got:'A' | concept: 'read book'
6838 | expected:'C' | got:'C' | concept: 'read book'
6839 | expected:'A' | got:'A' | concept: 'read book'
6840 | expected:'B' | got:'A' | concept: 'hold laptop'
6841 | expected:'A' | got:'A' | concept: 'hold laptop'
6842 | expected:'C' | got:'C' | concept: 'hold laptop'
6843 | expected:'A' | got:'A' | concept: 'hold laptop'
6844 | expected:'A' | got:'A' | concept: 'type_on laptop'
6845 | expected:'B' | got:'B' | concept: 'type_on laptop'
6846 | expected:'A' | got:'A' | concept: 'type_on laptop'
6847 | expected:'B' | got:'B' | concept: 'type_on laptop'
6848 | expected:'C' | got:'C' | concept: 'lick knife'
6849 | expected:'D' | got:'C' | concept: 'lick knife'
6850 | expected:'D' | got:'C' | concept: 'lick knife'
6851 | expected:'D' | got:'C' | concept: 'lick knife'
6852 | expected:'C' | got:'D' | concept: 'cut_with scissors'
6853 | expected:'C' | got:'B' | concept: 'cut_with scissors'
6854 | expected:'D' | got:'D' | concept: 'cut_with scissors'
6855 | expected:'B' | got:'C' | concept: 'cut_with scissors'
6856 | expected:'D' | got:'C' | concept: 'hold knife'
6857 | expected:'C' | got:'D' | concept: 'hold knife'
6858 | expected:'B' | got:'B' | concept: 'hold knife'
6859 | expected:'C' | got:'A' | concept: 'hold knife'
6860 | expected:'A' | got:'B' | concept: 'cut_with knife'
6861 | expected:'B' | got:'B' | concept: 'cut_with knife'
6862 | expected:'C' | got:'C' | concept: 'cut_with knife'
6863 | expected:'B' | got:'B' | concept: 'cut_with knife'
6864 | expected:'B' | got:'B' | concept: 'hold dog'
6865 | expected:'B' | got:'B' | concept: 'hold dog'
6866 | expected:'C' | got:'C' | concept: 'hold dog'
6867 | expected:'B' | got:'B' | concept: 'hold dog'
6868 | expected:'D' | got:'B' | concept: 'hold book'
6869 | expected:'A' | got:'A' | concept: 'hold book'
6870 | expected:'B' | got:'B' | concept: 'hold book'
6871 | expected:'C' | got:'C' | concept: 'hold book'
6872 | expected:'D' | got:'D' | concept: 'hold tennis_racket'
6873 | expected:'B' | got:'B' | concept: 'hold tennis_racket'
6874 | expected:'D' | got:'D' | concept: 'hold tennis_racket'
6875 | expected:'B' | got:'B' | concept: 'hold tennis_racket'
6876 | expected:'C' | got:'C' | concept: 'hold handbag'
6877 | expected:'B' | got:'B' | concept: 'hold handbag'
6878 | expected:'A' | got:'A' | concept: 'hold handbag'
6879 | expected:'C' | got:'C' | concept: 'hold handbag'
6880 | expected:'A' | got:'A' | concept: 'sit_on motorcycle'
6881 | expected:'D' | got:'D' | concept: 'sit_on motorcycle'
6882 | expected:'A' | got:'A' | concept: 'sit_on motorcycle'
6883 | expected:'D' | got:'D' | concept: 'sit_on motorcycle'
6884 | expected:'C' | got:'C' | concept: 'sit_on couch'
6885 | expected:'C' | got:'C' | concept: 'sit_on couch'
6886 | expected:'C' | got:'C' | concept: 'sit_on couch'
6887 | expected:'D' | got:'B' | concept: 'sit_on couch'
6888 | expected:'D' | got:'B' | concept: 'lie_on_like chair'
6889 | expected:'C' | got:'D' | concept: 'lie_on_like chair'
6890 | expected:'A' | got:'D' | concept: 'lie_on_like chair'
6891 | expected:'B' | got:'C' | concept: 'lie_on_like chair'
6892 | expected:'D' | got:'D' | concept: 'sit_on chair'
6893 | expected:'A' | got:'A' | concept: 'sit_on chair'
6894 | expected:'A' | got:'C' | concept: 'sit_on chair'
6895 | expected:'B' | got:'B' | concept: 'sit_on chair'
6896 | expected:'C' | got:'C' | concept: 'hold toothbrush'
6897 | expected:'C' | got:'C' | concept: 'hold toothbrush'
6898 | expected:'B' | got:'D' | concept: 'hold toothbrush'
6899 | expected:'B' | got:'B' | concept: 'hold toothbrush'
6900 | expected:'B' | got:'B' | concept: 'brush_with toothbrush'
6901 | expected:'A' | got:'C' | concept: 'brush_with toothbrush'
6902 | expected:'B' | got:'C' | concept: 'brush_with toothbrush'
6903 | expected:'A' | got:'B' | concept: 'brush_with toothbrush'
6904 | expected:'B' | got:'C' | concept: 'hold cake'
6905 | expected:'B' | got:'B' | concept: 'hold cake'
6906 | expected:'A' | got:'A' | concept: 'hold cake'
6907 | expected:'A' | got:'A' | concept: 'hold cake'
6908 | expected:'D' | got:'D' | concept: 'hold wine_glass'
6909 | expected:'D' | got:'D' | concept: 'hold wine_glass'
6910 | expected:'A' | got:'A' | concept: 'hold wine_glass'
6911 | expected:'C' | got:'C' | concept: 'hold wine_glass'
6912 | expected:'D' | got:'D' | concept: 'hold book'
6913 | expected:'C' | got:'C' | concept: 'hold book'
6914 | expected:'D' | got:'B' | concept: 'hold book'
6915 | expected:'C' | got:'C' | concept: 'hold book'
6916 | expected:'D' | got:'A' | concept: 'hold handbag'
6917 | expected:'B' | got:'A' | concept: 'hold handbag'
6918 | expected:'D' | got:'C' | concept: 'hold handbag'
6919 | expected:'A' | got:'A' | concept: 'hold handbag'
6920 | expected:'B' | got:'B' | concept: 'hold cell_phone'
6921 | expected:'B' | got:'B' | concept: 'hold cell_phone'
6922 | expected:'A' | got:'A' | concept: 'hold cell_phone'
6923 | expected:'B' | got:'B' | concept: 'hold cell_phone'
6924 | expected:'A' | got:'C' | concept: 'hold toothbrush'
6925 | expected:'B' | got:'A' | concept: 'hold toothbrush'
6926 | expected:'B' | got:'C' | concept: 'hold toothbrush'
6927 | expected:'D' | got:'D' | concept: 'hold toothbrush'
6928 | expected:'C' | got:'C' | concept: 'hold knife'
6929 | expected:'B' | got:'B' | concept: 'hold knife'
6930 | expected:'A' | got:'A' | concept: 'hold knife'
6931 | expected:'B' | got:'B' | concept: 'hold knife'
6932 | expected:'A' | got:'A' | concept: 'peel_or_cut apple'
6933 | expected:'B' | got:'B' | concept: 'peel_or_cut apple'
6934 | expected:'B' | got:'B' | concept: 'peel_or_cut apple'
6935 | expected:'A' | got:'A' | concept: 'peel_or_cut apple'
6936 | expected:'C' | got:'C' | concept: 'hold handbag'
6937 | expected:'A' | got:'A' | concept: 'hold handbag'
6938 | expected:'D' | got:'A' | concept: 'hold handbag'
6939 | expected:'D' | got:'A' | concept: 'hold handbag'
6940 | expected:'B' | got:'B' | concept: 'hold apple'
6941 | expected:'B' | got:'B' | concept: 'hold apple'
6942 | expected:'A' | got:'A' | concept: 'hold apple'
6943 | expected:'C' | got:'C' | concept: 'hold apple'
6944 | expected:'D' | got:'D' | concept: 'hold sports_ball'
6945 | expected:'A' | got:'INVALID' | concept: 'hold sports_ball'
6946 | expected:'C' | got:'A' | concept: 'hold sports_ball'
6947 | expected:'C' | got:'C' | concept: 'hold sports_ball'
6948 | expected:'A' | got:'A' | concept: 'hold banana'
6949 | expected:'D' | got:'A' | concept: 'hold banana'
6950 | expected:'C' | got:'C' | concept: 'hold banana'
6951 | expected:'B' | got:'B' | concept: 'hold banana'
6952 | expected:'D' | got:'A' | concept: 'hold cake'
6953 | expected:'B' | got:'A' | concept: 'hold cake'
6954 | expected:'B' | got:'C' | concept: 'hold cake'
6955 | expected:'D' | got:'A' | concept: 'hold cake'
6956 | expected:'A' | got:'A' | concept: 'hold knife'
6957 | expected:'D' | got:'D' | concept: 'hold knife'
6958 | expected:'A' | got:'C' | concept: 'hold knife'
6959 | expected:'C' | got:'C' | concept: 'hold knife'
6960 | expected:'C' | got:'B' | concept: 'clean keyboard'
6961 | expected:'A' | got:'A' | concept: 'clean keyboard'
6962 | expected:'C' | got:'A' | concept: 'clean keyboard'
6963 | expected:'B' | got:'B' | concept: 'clean keyboard'
6964 | expected:'A' | got:'A' | concept: 'type_on laptop'
6965 | expected:'D' | got:'D' | concept: 'type_on laptop'
6966 | expected:'A' | got:'A' | concept: 'type_on laptop'
6967 | expected:'B' | got:'C' | concept: 'type_on laptop'
6968 | expected:'A' | got:'A' | concept: 'type_on keyboard'
6969 | expected:'A' | got:'D' | concept: 'type_on keyboard'
6970 | expected:'D' | got:'B' | concept: 'type_on keyboard'
6971 | expected:'C' | got:'C' | concept: 'type_on keyboard'
6972 | expected:'A' | got:'B' | concept: 'read laptop'
6973 | expected:'C' | got:'D' | concept: 'read laptop'
6974 | expected:'C' | got:'A' | concept: 'read laptop'
6975 | expected:'C' | got:'D' | concept: 'read laptop'
6976 | expected:'D' | got:'D' | concept: 'hold handbag'
6977 | expected:'C' | got:'C' | concept: 'hold handbag'
6978 | expected:'B' | got:'B' | concept: 'hold handbag'
6979 | expected:'C' | got:'C' | concept: 'hold handbag'
6980 | expected:'B' | got:'B' | concept: 'hold sports_ball'
6981 | expected:'A' | got:'INVALID' | concept: 'hold sports_ball'
6982 | expected:'B' | got:'C' | concept: 'hold sports_ball'
6983 | expected:'C' | got:'D' | concept: 'hold sports_ball'
6984 | expected:'B' | got:'A' | concept: 'hold cake'
6985 | expected:'B' | got:'A' | concept: 'hold cake'
6986 | expected:'D' | got:'D' | concept: 'hold cake'
6987 | expected:'C' | got:'C' | concept: 'hold cake'
6988 | expected:'C' | got:'C' | concept: 'kick sports_ball'
6989 | expected:'A' | got:'A' | concept: 'kick sports_ball'
6990 | expected:'D' | got:'D' | concept: 'kick sports_ball'
6991 | expected:'A' | got:'A' | concept: 'kick sports_ball'
6992 | expected:'C' | got:'C' | concept: 'carry suitcase'
6993 | expected:'A' | got:'C' | concept: 'carry suitcase'
6994 | expected:'A' | got:'C' | concept: 'carry suitcase'
6995 | expected:'A' | got:'A' | concept: 'carry suitcase'
6996 | expected:'A' | got:'A' | concept: 'ride surfboard'
6997 | expected:'B' | got:'B' | concept: 'ride surfboard'
6998 | expected:'A' | got:'A' | concept: 'ride surfboard'
6999 | expected:'C' | got:'C' | concept: 'ride surfboard'
7000 | expected:'B' | got:'B' | concept: 'carry surfboard'
7001 | expected:'B' | got:'B' | concept: 'carry surfboard'
7002 | expected:'C' | got:'C' | concept: 'carry surfboard'
7003 | expected:'D' | got:'D' | concept: 'carry surfboard'
7004 | expected:'C' | got:'D' | concept: 'drag suitcase'
7005 | expected:'D' | got:'D' | concept: 'drag suitcase'
7006 | expected:'C' | got:'C' | concept: 'drag suitcase'
7007 | expected:'C' | got:'C' | concept: 'drag suitcase'
7008 | expected:'A' | got:'A' | concept: 'jump skateboard'
7009 | expected:'D' | got:'D' | concept: 'jump skateboard'
7010 | expected:'D' | got:'D' | concept: 'jump skateboard'
7011 | expected:'C' | got:'C' | concept: 'jump skateboard'
7012 | expected:'A' | got:'A' | concept: 'kiss horse'
7013 | expected:'B' | got:'B' | concept: 'kiss horse'
7014 | expected:'C' | got:'C' | concept: 'kiss horse'
7015 | expected:'C' | got:'C' | concept: 'kiss horse'
7016 | expected:'A' | got:'A' | concept: 'hug horse'
7017 | expected:'A' | got:'D' | concept: 'hug horse'
7018 | expected:'D' | got:'D' | concept: 'hug horse'
7019 | expected:'D' | got:'D' | concept: 'hug horse'
7020 | expected:'A' | got:'A' | concept: 'jump horse'
7021 | expected:'A' | got:'A' | concept: 'jump horse'
7022 | expected:'A' | got:'A' | concept: 'jump horse'
7023 | expected:'C' | got:'C' | concept: 'jump horse'
7024 | expected:'D' | got:'A' | concept: 'hold banana'
7025 | expected:'C' | got:'C' | concept: 'hold banana'
7026 | expected:'B' | got:'B' | concept: 'hold banana'
7027 | expected:'B' | got:'B' | concept: 'hold banana'
7028 | expected:'A' | got:'A' | concept: 'hold cup'
7029 | expected:'A' | got:'A' | concept: 'hold cup'
7030 | expected:'B' | got:'D' | concept: 'hold cup'
7031 | expected:'B' | got:'B' | concept: 'hold cup'
7032 | expected:'C' | got:'C' | concept: 'hold dog'
7033 | expected:'B' | got:'B' | concept: 'hold dog'
7034 | expected:'D' | got:'D' | concept: 'hold dog'
7035 | expected:'B' | got:'B' | concept: 'hold dog'
7036 | expected:'C' | got:'C' | concept: 'hold wine_glass'
7037 | expected:'A' | got:'A' | concept: 'hold wine_glass'
7038 | expected:'D' | got:'A' | concept: 'hold wine_glass'
7039 | expected:'C' | got:'C' | concept: 'hold wine_glass'
7040 | expected:'A' | got:'C' | concept: 'turn motorcycle'
7041 | expected:'B' | got:'D' | concept: 'turn motorcycle'
7042 | expected:'D' | got:'D' | concept: 'turn motorcycle'
7043 | expected:'A' | got:'A' | concept: 'turn motorcycle'
7044 | expected:'C' | got:'C' | concept: 'wash motorcycle'
7045 | expected:'B' | got:'B' | concept: 'wash motorcycle'
7046 | expected:'C' | got:'C' | concept: 'wash motorcycle'
7047 | expected:'B' | got:'B' | concept: 'wash motorcycle'
7048 | expected:'C' | got:'C' | concept: 'straddle motorcycle'
7049 | expected:'D' | got:'D' | concept: 'straddle motorcycle'
7050 | expected:'D' | got:'B' | concept: 'straddle motorcycle'
7051 | expected:'A' | got:'A' | concept: 'straddle motorcycle'
7052 | expected:'A' | got:'D' | concept: 'sit_on motorcycle'
7053 | expected:'C' | got:'C' | concept: 'sit_on motorcycle'
7054 | expected:'C' | got:'A' | concept: 'sit_on motorcycle'
7055 | expected:'A' | got:'A' | concept: 'sit_on motorcycle'
7056 | expected:'C' | got:'C' | concept: 'jump motorcycle'
7057 | expected:'D' | got:'D' | concept: 'jump motorcycle'
7058 | expected:'C' | got:'C' | concept: 'jump motorcycle'
7059 | expected:'A' | got:'A' | concept: 'jump motorcycle'
7060 | expected:'D' | got:'B' | concept: 'inspect motorcycle'
7061 | expected:'D' | got:'D' | concept: 'inspect motorcycle'
7062 | expected:'A' | got:'A' | concept: 'inspect motorcycle'
7063 | expected:'C' | got:'C' | concept: 'inspect motorcycle'
7064 | expected:'D' | got:'D' | concept: 'straddle motorcycle'
7065 | expected:'C' | got:'C' | concept: 'straddle motorcycle'
7066 | expected:'B' | got:'B' | concept: 'straddle motorcycle'
7067 | expected:'A' | got:'A' | concept: 'straddle motorcycle'
7068 | expected:'B' | got:'B' | concept: 'jump snowboard'
7069 | expected:'A' | got:'A' | concept: 'jump snowboard'
7070 | expected:'B' | got:'B' | concept: 'jump snowboard'
7071 | expected:'A' | got:'A' | concept: 'jump snowboard'
7072 | expected:'C' | got:'D' | concept: 'jump motorcycle'
7073 | expected:'B' | got:'B' | concept: 'jump motorcycle'
7074 | expected:'A' | got:'A' | concept: 'jump motorcycle'
7075 | expected:'A' | got:'A' | concept: 'jump motorcycle'
7076 | expected:'A' | got:'C' | concept: 'turn motorcycle'
7077 | expected:'B' | got:'B' | concept: 'turn motorcycle'
7078 | expected:'B' | got:'B' | concept: 'turn motorcycle'
7079 | expected:'A' | got:'D' | concept: 'turn motorcycle'
7080 | expected:'A' | got:'A' | concept: 'inspect motorcycle'
7081 | expected:'D' | got:'D' | concept: 'inspect motorcycle'
7082 | expected:'D' | got:'D' | concept: 'inspect motorcycle'
7083 | expected:'C' | got:'C' | concept: 'inspect motorcycle'
7084 | expected:'D' | got:'D' | concept: 'wash motorcycle'
7085 | expected:'C' | got:'C' | concept: 'wash motorcycle'
7086 | expected:'B' | got:'B' | concept: 'wash motorcycle'
7087 | expected:'D' | got:'D' | concept: 'wash motorcycle'
7088 | expected:'C' | got:'C' | concept: 'hold book'
7089 | expected:'D' | got:'D' | concept: 'hold book'
7090 | expected:'B' | got:'B' | concept: 'hold book'
7091 | expected:'A' | got:'A' | concept: 'hold book'
7092 | expected:'A' | got:'A' | concept: 'hold cell_phone'
7093 | expected:'B' | got:'B' | concept: 'hold cell_phone'
7094 | expected:'B' | got:'B' | concept: 'hold cell_phone'
7095 | expected:'C' | got:'C' | concept: 'hold cell_phone'
7096 | expected:'A' | got:'A' | concept: 'hold knife'
7097 | expected:'D' | got:'D' | concept: 'hold knife'
7098 | expected:'B' | got:'B' | concept: 'hold knife'
7099 | expected:'C' | got:'C' | concept: 'hold knife'
7100 | expected:'A' | got:'A' | concept: 'hold dog'
7101 | expected:'C' | got:'C' | concept: 'hold dog'
7102 | expected:'A' | got:'A' | concept: 'hold dog'
7103 | expected:'C' | got:'C' | concept: 'hold dog'
7104 | expected:'C' | got:'C' | concept: 'lick knife'
7105 | expected:'A' | got:'D' | concept: 'lick knife'
7106 | expected:'B' | got:'B' | concept: 'lick knife'
7107 | expected:'D' | got:'D' | concept: 'lick knife'
7108 | expected:'B' | got:'C' | concept: 'wield knife'
7109 | expected:'C' | got:'C' | concept: 'wield knife'
7110 | expected:'A' | got:'C' | concept: 'wield knife'
7111 | expected:'B' | got:'B' | concept: 'wield knife'
7112 | expected:'C' | got:'C' | concept: 'hold knife'
7113 | expected:'D' | got:'A' | concept: 'hold knife'
7114 | expected:'C' | got:'C' | concept: 'hold knife'
7115 | expected:'B' | got:'B' | concept: 'hold knife'
7116 | expected:'B' | got:'B' | concept: 'cut_with knife'
7117 | expected:'C' | got:'C' | concept: 'cut_with knife'
7118 | expected:'D' | got:'C' | concept: 'cut_with knife'
7119 | expected:'C' | got:'C' | concept: 'cut_with knife'
7120 | expected:'A' | got:'A' | concept: 'eat sandwich'
7121 | expected:'B' | got:'B' | concept: 'eat sandwich'
7122 | expected:'A' | got:'A' | concept: 'eat sandwich'
7123 | expected:'B' | got:'B' | concept: 'eat sandwich'
7124 | expected:'C' | got:'C' | concept: 'control tv'
7125 | expected:'D' | got:'D' | concept: 'control tv'
7126 | expected:'A' | got:'A' | concept: 'control tv'
7127 | expected:'D' | got:'D' | concept: 'control tv'
7128 | expected:'A' | got:'A' | concept: 'kiss dog'
7129 | expected:'C' | got:'C' | concept: 'kiss dog'
7130 | expected:'C' | got:'C' | concept: 'kiss dog'
7131 | expected:'C' | got:'C' | concept: 'kiss dog'
7132 | expected:'A' | got:'A' | concept: 'watch tv'
7133 | expected:'D' | got:'A' | concept: 'watch tv'
7134 | expected:'B' | got:'A' | concept: 'watch tv'
7135 | expected:'D' | got:'D' | concept: 'watch tv'
7136 | expected:'B' | got:'B' | concept: 'hold cell_phone'
7137 | expected:'A' | got:'A' | concept: 'hold cell_phone'
7138 | expected:'D' | got:'D' | concept: 'hold cell_phone'
7139 | expected:'C' | got:'C' | concept: 'hold cell_phone'
7140 | expected:'C' | got:'B' | concept: 'hold wine_glass'
7141 | expected:'A' | got:'A' | concept: 'hold wine_glass'
7142 | expected:'C' | got:'D' | concept: 'hold wine_glass'
7143 | expected:'A' | got:'D' | concept: 'hold wine_glass'
7144 | expected:'A' | got:'A' | concept: 'toast wine_glass'
7145 | expected:'D' | got:'D' | concept: 'toast wine_glass'
7146 | expected:'B' | got:'B' | concept: 'toast wine_glass'
7147 | expected:'B' | got:'B' | concept: 'toast wine_glass'
7148 | expected:'B' | got:'A' | concept: 'hold cake'
7149 | expected:'B' | got:'B' | concept: 'hold cake'
7150 | expected:'D' | got:'B' | concept: 'hold cake'
7151 | expected:'D' | got:'C' | concept: 'hold cake'
7152 | expected:'D' | got:'D' | concept: 'straddle motorcycle'
7153 | expected:'D' | got:'D' | concept: 'straddle motorcycle'
7154 | expected:'C' | got:'C' | concept: 'straddle motorcycle'
7155 | expected:'D' | got:'C' | concept: 'straddle motorcycle'
7156 | expected:'C' | got:'C' | concept: 'wash motorcycle'
7157 | expected:'C' | got:'C' | concept: 'wash motorcycle'
7158 | expected:'A' | got:'A' | concept: 'wash motorcycle'
7159 | expected:'C' | got:'C' | concept: 'wash motorcycle'
7160 | expected:'D' | got:'C' | concept: 'sit_on motorcycle'
7161 | expected:'A' | got:'A' | concept: 'sit_on motorcycle'
7162 | expected:'B' | got:'B' | concept: 'sit_on motorcycle'
7163 | expected:'C' | got:'C' | concept: 'sit_on motorcycle'
7164 | expected:'C' | got:'B' | concept: 'jump motorcycle'
7165 | expected:'C' | got:'C' | concept: 'jump motorcycle'
7166 | expected:'D' | got:'D' | concept: 'jump motorcycle'
7167 | expected:'A' | got:'A' | concept: 'jump motorcycle'
7168 | expected:'A' | got:'A' | concept: 'hold wine_glass'
7169 | expected:'A' | got:'A' | concept: 'hold wine_glass'
7170 | expected:'C' | got:'C' | concept: 'hold wine_glass'
7171 | expected:'B' | got:'B' | concept: 'hold wine_glass'
7172 | expected:'D' | got:'B' | concept: 'hold cake'
7173 | expected:'D' | got:'B' | concept: 'hold cake'
7174 | expected:'A' | got:'A' | concept: 'hold cake'
7175 | expected:'C' | got:'A' | concept: 'hold cake'
7176 | expected:'D' | got:'D' | concept: 'hold cell_phone'
7177 | expected:'D' | got:'D' | concept: 'hold cell_phone'
7178 | expected:'B' | got:'B' | concept: 'hold cell_phone'
7179 | expected:'B' | got:'B' | concept: 'hold cell_phone'
7180 | expected:'B' | got:'B' | concept: 'hold book'
7181 | expected:'C' | got:'C' | concept: 'hold book'
7182 | expected:'D' | got:'B' | concept: 'hold book'
7183 | expected:'B' | got:'B' | concept: 'hold book'
7184 | expected:'D' | got:'D' | concept: 'hold dog'
7185 | expected:'C' | got:'C' | concept: 'hold dog'
7186 | expected:'A' | got:'B' | concept: 'hold dog'
7187 | expected:'A' | got:'A' | concept: 'hold dog'
7188 | expected:'D' | got:'D' | concept: 'kiss dog'
7189 | expected:'B' | got:'B' | concept: 'kiss dog'
7190 | expected:'A' | got:'A' | concept: 'kiss dog'
7191 | expected:'D' | got:'D' | concept: 'kiss dog'
7192 | expected:'D' | got:'D' | concept: 'walk dog'
7193 | expected:'A' | got:'A' | concept: 'walk dog'
7194 | expected:'D' | got:'D' | concept: 'walk dog'
7195 | expected:'A' | got:'A' | concept: 'walk dog'
7196 | expected:'C' | got:'C' | concept: 'pet dog'
7197 | expected:'D' | got:'D' | concept: 'pet dog'
7198 | expected:'C' | got:'C' | concept: 'pet dog'
7199 | expected:'A' | got:'C' | concept: 'pet dog'
7200 | expected:'C' | got:'C' | concept: 'repair bicycle'
7201 | expected:'A' | got:'A' | concept: 'repair bicycle'
7202 | expected:'A' | got:'A' | concept: 'repair bicycle'
7203 | expected:'D' | got:'D' | concept: 'repair bicycle'
7204 | expected:'C' | got:'C' | concept: 'ride skateboard'
7205 | expected:'C' | got:'C' | concept: 'ride skateboard'
7206 | expected:'C' | got:'C' | concept: 'ride skateboard'
7207 | expected:'D' | got:'D' | concept: 'ride skateboard'
7208 | expected:'C' | got:'C' | concept: 'ride skis'
7209 | expected:'B' | got:'B' | concept: 'ride skis'
7210 | expected:'C' | got:'C' | concept: 'ride skis'
7211 | expected:'B' | got:'B' | concept: 'ride skis'
7212 | expected:'B' | got:'B' | concept: 'ride bicycle'
7213 | expected:'B' | got:'C' | concept: 'ride bicycle'
7214 | expected:'A' | got:'A' | concept: 'ride bicycle'
7215 | expected:'B' | got:'B' | concept: 'ride bicycle'
7216 | expected:'B' | got:'B' | concept: 'hold remote'
7217 | expected:'D' | got:'D' | concept: 'hold remote'
7218 | expected:'D' | got:'D' | concept: 'hold remote'
7219 | expected:'D' | got:'D' | concept: 'hold remote'
7220 | expected:'D' | got:'D' | concept: 'hold dog'
7221 | expected:'D' | got:'D' | concept: 'hold dog'
7222 | expected:'B' | got:'B' | concept: 'hold dog'
7223 | expected:'A' | got:'A' | concept: 'hold dog'
7224 | expected:'D' | got:'D' | concept: 'hold apple'
7225 | expected:'D' | got:'D' | concept: 'hold apple'
7226 | expected:'A' | got:'A' | concept: 'hold apple'
7227 | expected:'B' | got:'B' | concept: 'hold apple'
7228 | expected:'B' | got:'B' | concept: 'hold sports_ball'
7229 | expected:'D' | got:'A' | concept: 'hold sports_ball'
7230 | expected:'A' | got:'D' | concept: 'hold sports_ball'
7231 | expected:'B' | got:'B' | concept: 'hold sports_ball'
7232 | expected:'C' | got:'C' | concept: 'hold book'
7233 | expected:'D' | got:'B' | concept: 'hold book'
7234 | expected:'B' | got:'B' | concept: 'hold book'
7235 | expected:'D' | got:'B' | concept: 'hold book'
7236 | expected:'B' | got:'C' | concept: 'hold orange'
7237 | expected:'D' | got:'A' | concept: 'hold orange'
7238 | expected:'A' | got:'A' | concept: 'hold orange'
7239 | expected:'A' | got:'D' | concept: 'hold orange'
7240 | expected:'B' | got:'B' | concept: 'squeeze orange'
7241 | expected:'B' | got:'B' | concept: 'squeeze orange'
7242 | expected:'B' | got:'B' | concept: 'squeeze orange'
7243 | expected:'D' | got:'D' | concept: 'squeeze orange'
7244 | expected:'C' | got:'C' | concept: 'hold cup'
7245 | expected:'D' | got:'C' | concept: 'hold cup'
7246 | expected:'C' | got:'C' | concept: 'hold cup'
7247 | expected:'D' | got:'C' | concept: 'hold cup'
7248 | expected:'A' | got:'A' | concept: 'hold sports_ball'
7249 | expected:'D' | got:'D' | concept: 'hold sports_ball'
7250 | expected:'D' | got:'D' | concept: 'hold sports_ball'
7251 | expected:'C' | got:'C' | concept: 'hold sports_ball'
7252 | expected:'C' | got:'C' | concept: 'kick sports_ball'
7253 | expected:'A' | got:'A' | concept: 'kick sports_ball'
7254 | expected:'D' | got:'D' | concept: 'kick sports_ball'
7255 | expected:'C' | got:'C' | concept: 'kick sports_ball'
7256 | expected:'B' | got:'B' | concept: 'hold tennis_racket'
7257 | expected:'D' | got:'D' | concept: 'hold tennis_racket'
7258 | expected:'D' | got:'D' | concept: 'hold tennis_racket'
7259 | expected:'A' | got:'A' | concept: 'hold tennis_racket'
7260 | expected:'C' | got:'C' | concept: 'hold apple'
7261 | expected:'B' | got:'B' | concept: 'hold apple'
7262 | expected:'A' | got:'A' | concept: 'hold apple'
7263 | expected:'C' | got:'C' | concept: 'hold apple'
7264 | expected:'D' | got:'D' | concept: 'clean refrigerator'
7265 | expected:'A' | got:'A' | concept: 'clean refrigerator'
7266 | expected:'A' | got:'A' | concept: 'clean refrigerator'
7267 | expected:'C' | got:'C' | concept: 'clean refrigerator'
7268 | expected:'B' | got:'A' | concept: 'clean microwave'
7269 | expected:'C' | got:'C' | concept: 'clean microwave'
7270 | expected:'B' | got:'B' | concept: 'clean microwave'
7271 | expected:'B' | got:'B' | concept: 'clean microwave'
7272 | expected:'A' | got:'A' | concept: 'clean oven'
7273 | expected:'B' | got:'A' | concept: 'clean oven'
7274 | expected:'B' | got:'B' | concept: 'clean oven'
7275 | expected:'D' | got:'A' | concept: 'clean oven'
7276 | expected:'A' | got:'C' | concept: 'open microwave'
7277 | expected:'A' | got:'A' | concept: 'open microwave'
7278 | expected:'D' | got:'A' | concept: 'open microwave'
7279 | expected:'B' | got:'B' | concept: 'open microwave'
7280 | expected:'A' | got:'A' | concept: 'clean refrigerator'
7281 | expected:'C' | got:'C' | concept: 'clean refrigerator'
7282 | expected:'B' | got:'B' | concept: 'clean refrigerator'
7283 | expected:'C' | got:'C' | concept: 'clean refrigerator'
7284 | expected:'A' | got:'A' | concept: 'clean oven'
7285 | expected:'C' | got:'C' | concept: 'clean oven'
7286 | expected:'C' | got:'C' | concept: 'clean oven'
7287 | expected:'C' | got:'C' | concept: 'clean oven'
7288 | expected:'D' | got:'A' | concept: 'clean microwave'
7289 | expected:'A' | got:'B' | concept: 'clean microwave'
7290 | expected:'A' | got:'A' | concept: 'clean microwave'
7291 | expected:'C' | got:'C' | concept: 'clean microwave'
7292 | expected:'C' | got:'C' | concept: 'open microwave'
7293 | expected:'D' | got:'A' | concept: 'open microwave'
7294 | expected:'A' | got:'A' | concept: 'open microwave'
7295 | expected:'A' | got:'A' | concept: 'open microwave'
7296 | expected:'B' | got:'B' | concept: 'kiss dog'
7297 | expected:'C' | got:'B' | concept: 'kiss dog'
7298 | expected:'D' | got:'D' | concept: 'kiss dog'
7299 | expected:'D' | got:'D' | concept: 'kiss dog'
7300 | expected:'C' | got:'C' | concept: 'greet person'
7301 | expected:'C' | got:'C' | concept: 'greet person'
7302 | expected:'D' | got:'D' | concept: 'greet person'
7303 | expected:'C' | got:'C' | concept: 'greet person'
7304 | expected:'B' | got:'B' | concept: 'kiss person'
7305 | expected:'B' | got:'B' | concept: 'kiss person'
7306 | expected:'C' | got:'C' | concept: 'kiss person'
7307 | expected:'D' | got:'D' | concept: 'kiss person'
7308 | expected:'A' | got:'A' | concept: 'kiss horse'
7309 | expected:'D' | got:'D' | concept: 'kiss horse'
7310 | expected:'B' | got:'B' | concept: 'kiss horse'
7311 | expected:'D' | got:'D' | concept: 'kiss horse'
7312 | expected:'B' | got:'B' | concept: 'hold dog'
7313 | expected:'A' | got:'A' | concept: 'hold dog'
7314 | expected:'D' | got:'D' | concept: 'hold dog'
7315 | expected:'B' | got:'B' | concept: 'hold dog'
7316 | expected:'C' | got:'C' | concept: 'hold cup'
7317 | expected:'D' | got:'D' | concept: 'hold cup'
7318 | expected:'B' | got:'C' | concept: 'hold cup'
7319 | expected:'D' | got:'D' | concept: 'hold cup'
7320 | expected:'A' | got:'C' | concept: 'drink_with cup'
7321 | expected:'B' | got:'B' | concept: 'drink_with cup'
7322 | expected:'A' | got:'A' | concept: 'drink_with cup'
7323 | expected:'C' | got:'C' | concept: 'drink_with cup'
7324 | expected:'A' | got:'A' | concept: 'hold banana'
7325 | expected:'A' | got:'A' | concept: 'hold banana'
7326 | expected:'B' | got:'B' | concept: 'hold banana'
7327 | expected:'D' | got:'A' | concept: 'hold banana'
7328 | expected:'A' | got:'A' | concept: 'ride skateboard'
7329 | expected:'A' | got:'A' | concept: 'ride skateboard'
7330 | expected:'D' | got:'D' | concept: 'ride skateboard'
7331 | expected:'A' | got:'A' | concept: 'ride skateboard'
7332 | expected:'A' | got:'A' | concept: 'kiss horse'
7333 | expected:'D' | got:'D' | concept: 'kiss horse'
7334 | expected:'A' | got:'C' | concept: 'kiss horse'
7335 | expected:'B' | got:'B' | concept: 'kiss horse'
7336 | expected:'C' | got:'C' | concept: 'ride elephant'
7337 | expected:'D' | got:'D' | concept: 'ride elephant'
7338 | expected:'D' | got:'D' | concept: 'ride elephant'
7339 | expected:'A' | got:'A' | concept: 'ride elephant'
7340 | expected:'D' | got:'D' | concept: 'ride horse'
7341 | expected:'D' | got:'D' | concept: 'ride horse'
7342 | expected:'D' | got:'D' | concept: 'ride horse'
7343 | expected:'C' | got:'C' | concept: 'ride horse'
7344 | expected:'A' | got:'A' | concept: 'read book'
7345 | expected:'C' | got:'A' | concept: 'read book'
7346 | expected:'B' | got:'B' | concept: 'read book'
7347 | expected:'B' | got:'B' | concept: 'read book'
7348 | expected:'A' | got:'A' | concept: 'read laptop'
7349 | expected:'B' | got:'B' | concept: 'read laptop'
7350 | expected:'A' | got:'A' | concept: 'read laptop'
7351 | expected:'D' | got:'A' | concept: 'read laptop'
7352 | expected:'D' | got:'D' | concept: 'hold book'
7353 | expected:'C' | got:'C' | concept: 'hold book'
7354 | expected:'C' | got:'A' | concept: 'hold book'
7355 | expected:'D' | got:'D' | concept: 'hold book'
7356 | expected:'A' | got:'A' | concept: 'hold banana'
7357 | expected:'A' | got:'A' | concept: 'hold banana'
7358 | expected:'C' | got:'C' | concept: 'hold banana'
7359 | expected:'D' | got:'A' | concept: 'hold banana'
7360 | expected:'C' | got:'C' | concept: 'greet person'
7361 | expected:'D' | got:'D' | concept: 'greet person'
7362 | expected:'D' | got:'D' | concept: 'greet person'
7363 | expected:'D' | got:'D' | concept: 'greet person'
7364 | expected:'B' | got:'B' | concept: 'hug person'
7365 | expected:'C' | got:'C' | concept: 'hug person'
7366 | expected:'C' | got:'C' | concept: 'hug person'
7367 | expected:'C' | got:'C' | concept: 'hug person'
7368 | expected:'D' | got:'B' | concept: 'kiss horse'
7369 | expected:'C' | got:'C' | concept: 'kiss horse'
7370 | expected:'B' | got:'B' | concept: 'kiss horse'
7371 | expected:'D' | got:'A' | concept: 'kiss horse'
7372 | expected:'D' | got:'D' | concept: 'kiss person'
7373 | expected:'B' | got:'B' | concept: 'kiss person'
7374 | expected:'C' | got:'C' | concept: 'kiss person'
7375 | expected:'A' | got:'A' | concept: 'kiss person'
7376 | expected:'A' | got:'A' | concept: 'jump motorcycle'
7377 | expected:'A' | got:'A' | concept: 'jump motorcycle'
7378 | expected:'D' | got:'D' | concept: 'jump motorcycle'
7379 | expected:'D' | got:'D' | concept: 'jump motorcycle'
7380 | expected:'C' | got:'C' | concept: 'sit_on motorcycle'
7381 | expected:'D' | got:'D' | concept: 'sit_on motorcycle'
7382 | expected:'B' | got:'B' | concept: 'sit_on motorcycle'
7383 | expected:'A' | got:'C' | concept: 'sit_on motorcycle'
7384 | expected:'D' | got:'D' | concept: 'inspect motorcycle'
7385 | expected:'D' | got:'D' | concept: 'inspect motorcycle'
7386 | expected:'A' | got:'A' | concept: 'inspect motorcycle'
7387 | expected:'D' | got:'D' | concept: 'inspect motorcycle'
7388 | expected:'B' | got:'B' | concept: 'ride motorcycle'
7389 | expected:'A' | got:'A' | concept: 'ride motorcycle'
7390 | expected:'C' | got:'C' | concept: 'ride motorcycle'
7391 | expected:'D' | got:'D' | concept: 'ride motorcycle'
7392 | expected:'A' | got:'A' | concept: 'eat apple'
7393 | expected:'D' | got:'D' | concept: 'eat apple'
7394 | expected:'C' | got:'C' | concept: 'eat apple'
7395 | expected:'C' | got:'D' | concept: 'eat apple'
7396 | expected:'D' | got:'D' | concept: 'eat banana'
7397 | expected:'C' | got:'C' | concept: 'eat banana'
7398 | expected:'D' | got:'D' | concept: 'eat banana'
7399 | expected:'B' | got:'B' | concept: 'eat banana'
7400 | expected:'A' | got:'A' | concept: 'eat donut'
7401 | expected:'A' | got:'A' | concept: 'eat donut'
7402 | expected:'B' | got:'B' | concept: 'eat donut'
7403 | expected:'B' | got:'B' | concept: 'eat donut'
7404 | expected:'B' | got:'D' | concept: 'eat sandwich'
7405 | expected:'C' | got:'C' | concept: 'eat sandwich'
7406 | expected:'A' | got:'A' | concept: 'eat sandwich'
7407 | expected:'D' | got:'D' | concept: 'eat sandwich'
7408 | expected:'B' | got:'D' | concept: 'hold apple'
7409 | expected:'D' | got:'C' | concept: 'hold apple'
7410 | expected:'B' | got:'B' | concept: 'hold apple'
7411 | expected:'C' | got:'C' | concept: 'hold apple'
7412 | expected:'D' | got:'C' | concept: 'eat apple'
7413 | expected:'A' | got:'A' | concept: 'eat apple'
7414 | expected:'D' | got:'B' | concept: 'eat apple'
7415 | expected:'C' | got:'C' | concept: 'eat apple'
7416 | expected:'B' | got:'B' | concept: 'peel_or_cut apple'
7417 | expected:'D' | got:'A' | concept: 'peel_or_cut apple'
7418 | expected:'C' | got:'C' | concept: 'peel_or_cut apple'
7419 | expected:'D' | got:'A' | concept: 'peel_or_cut apple'
7420 | expected:'C' | got:'C' | concept: 'hold_and_about_to_eat apple'
7421 | expected:'B' | got:'B' | concept: 'hold_and_about_to_eat apple'
7422 | expected:'A' | got:'A' | concept: 'hold_and_about_to_eat apple'
7423 | expected:'C' | got:'C' | concept: 'hold_and_about_to_eat apple'
7424 | expected:'D' | got:'D' | concept: 'stand_on boat'
7425 | expected:'D' | got:'D' | concept: 'stand_on boat'
7426 | expected:'C' | got:'C' | concept: 'stand_on boat'
7427 | expected:'C' | got:'C' | concept: 'stand_on boat'
7428 | expected:'D' | got:'D' | concept: 'read book'
7429 | expected:'A' | got:'A' | concept: 'read book'
7430 | expected:'A' | got:'A' | concept: 'read book'
7431 | expected:'C' | got:'C' | concept: 'read book'
7432 | expected:'C' | got:'C' | concept: 'clean microwave'
7433 | expected:'D' | got:'A' | concept: 'clean microwave'
7434 | expected:'B' | got:'B' | concept: 'clean microwave'
7435 | expected:'C' | got:'C' | concept: 'clean microwave'
7436 | expected:'B' | got:'A' | concept: 'row boat'
7437 | expected:'B' | got:'B' | concept: 'row boat'
7438 | expected:'C' | got:'C' | concept: 'row boat'
7439 | expected:'A' | got:'A' | concept: 'row boat'
7440 | expected:'A' | got:'A' | concept: 'hold apple'
7441 | expected:'C' | got:'C' | concept: 'hold apple'
7442 | expected:'C' | got:'C' | concept: 'hold apple'
7443 | expected:'A' | got:'A' | concept: 'hold apple'
7444 | expected:'D' | got:'A' | concept: 'hold wine_glass'
7445 | expected:'C' | got:'C' | concept: 'hold wine_glass'
7446 | expected:'B' | got:'B' | concept: 'hold wine_glass'
7447 | expected:'D' | got:'D' | concept: 'hold wine_glass'
7448 | expected:'B' | got:'B' | concept: 'hold cell_phone'
7449 | expected:'D' | got:'D' | concept: 'hold cell_phone'
7450 | expected:'C' | got:'C' | concept: 'hold cell_phone'
7451 | expected:'B' | got:'B' | concept: 'hold cell_phone'
7452 | expected:'C' | got:'C' | concept: 'hold remote'
7453 | expected:'B' | got:'B' | concept: 'hold remote'
7454 | expected:'B' | got:'B' | concept: 'hold remote'
7455 | expected:'A' | got:'A' | concept: 'hold remote'
7456 | expected:'D' | got:'D' | concept: 'kiss horse'
7457 | expected:'A' | got:'A' | concept: 'kiss horse'
7458 | expected:'C' | got:'C' | concept: 'kiss horse'
7459 | expected:'C' | got:'C' | concept: 'kiss horse'
7460 | expected:'A' | got:'A' | concept: 'jump horse'
7461 | expected:'A' | got:'A' | concept: 'jump horse'
7462 | expected:'B' | got:'B' | concept: 'jump horse'
7463 | expected:'C' | got:'C' | concept: 'jump horse'
7464 | expected:'B' | got:'B' | concept: 'jump skateboard'
7465 | expected:'A' | got:'A' | concept: 'jump skateboard'
7466 | expected:'A' | got:'A' | concept: 'jump skateboard'
7467 | expected:'B' | got:'B' | concept: 'jump skateboard'
7468 | expected:'A' | got:'A' | concept: 'jump motorcycle'
7469 | expected:'C' | got:'C' | concept: 'jump motorcycle'
7470 | expected:'B' | got:'B' | concept: 'jump motorcycle'
7471 | expected:'C' | got:'C' | concept: 'jump motorcycle'
7472 | expected:'B' | got:'B' | concept: 'hug horse'
7473 | expected:'D' | got:'D' | concept: 'hug horse'
7474 | expected:'C' | got:'C' | concept: 'hug horse'
7475 | expected:'D' | got:'D' | concept: 'hug horse'
7476 | expected:'A' | got:'A' | concept: 'greet person'
7477 | expected:'C' | got:'C' | concept: 'greet person'
7478 | expected:'D' | got:'D' | concept: 'greet person'
7479 | expected:'A' | got:'A' | concept: 'greet person'
7480 | expected:'D' | got:'D' | concept: 'kiss person'
7481 | expected:'D' | got:'D' | concept: 'kiss person'
7482 | expected:'C' | got:'C' | concept: 'kiss person'
7483 | expected:'A' | got:'A' | concept: 'kiss person'
7484 | expected:'C' | got:'C' | concept: 'hug person'
7485 | expected:'B' | got:'B' | concept: 'hug person'
7486 | expected:'C' | got:'C' | concept: 'hug person'
7487 | expected:'A' | got:'A' | concept: 'hug person'
7488 | expected:'B' | got:'B' | concept: 'hold cell_phone'
7489 | expected:'D' | got:'D' | concept: 'hold cell_phone'
7490 | expected:'B' | got:'INVALID' | concept: 'hold cell_phone'
7491 | expected:'D' | got:'D' | concept: 'hold cell_phone'
7492 | expected:'D' | got:'D' | concept: 'hold knife'
7493 | expected:'C' | got:'C' | concept: 'hold knife'
7494 | expected:'B' | got:'B' | concept: 'hold knife'
7495 | expected:'A' | got:'A' | concept: 'hold knife'
7496 | expected:'C' | got:'C' | concept: 'hold cup'
7497 | expected:'A' | got:'A' | concept: 'hold cup'
7498 | expected:'B' | got:'C' | concept: 'hold cup'
7499 | expected:'D' | got:'D' | concept: 'hold cup'
7500 | expected:'B' | got:'B' | concept: 'hold dog'
7501 | expected:'A' | got:'A' | concept: 'hold dog'
7502 | expected:'D' | got:'D' | concept: 'hold dog'
7503 | expected:'D' | got:'B' | concept: 'hold dog'
7504 | expected:'D' | got:'D' | concept: 'kiss dog'
7505 | expected:'D' | got:'D' | concept: 'kiss dog'
7506 | expected:'D' | got:'D' | concept: 'kiss dog'
7507 | expected:'C' | got:'C' | concept: 'kiss dog'
7508 | expected:'A' | got:'A' | concept: 'jump horse'
7509 | expected:'A' | got:'A' | concept: 'jump horse'
7510 | expected:'B' | got:'A' | concept: 'jump horse'
7511 | expected:'B' | got:'B' | concept: 'jump horse'
7512 | expected:'B' | got:'B' | concept: 'ride horse'
7513 | expected:'B' | got:'B' | concept: 'ride horse'
7514 | expected:'D' | got:'D' | concept: 'ride horse'
7515 | expected:'A' | got:'A' | concept: 'ride horse'
7516 | expected:'D' | got:'D' | concept: 'kiss horse'
7517 | expected:'D' | got:'D' | concept: 'kiss horse'
7518 | expected:'A' | got:'A' | concept: 'kiss horse'
7519 | expected:'C' | got:'C' | concept: 'kiss horse'
7520 | expected:'A' | got:'C' | concept: 'hold cup'
7521 | expected:'D' | got:'D' | concept: 'hold cup'
7522 | expected:'A' | got:'A' | concept: 'hold cup'
7523 | expected:'C' | got:'C' | concept: 'hold cup'
7524 | expected:'B' | got:'B' | concept: 'hold sports_ball'
7525 | expected:'D' | got:'D' | concept: 'hold sports_ball'
7526 | expected:'D' | got:'D' | concept: 'hold sports_ball'
7527 | expected:'A' | got:'A' | concept: 'hold sports_ball'
7528 | expected:'A' | got:'A' | concept: 'hold cell_phone'
7529 | expected:'D' | got:'D' | concept: 'hold cell_phone'
7530 | expected:'B' | got:'B' | concept: 'hold cell_phone'
7531 | expected:'D' | got:'D' | concept: 'hold cell_phone'
7532 | expected:'B' | got:'B' | concept: 'hold tennis_racket'
7533 | expected:'B' | got:'B' | concept: 'hold tennis_racket'
7534 | expected:'A' | got:'A' | concept: 'hold tennis_racket'
7535 | expected:'C' | got:'D' | concept: 'hold tennis_racket'
7536 | expected:'C' | got:'C' | concept: 'wield knife'
7537 | expected:'D' | got:'D' | concept: 'wield knife'
7538 | expected:'A' | got:'C' | concept: 'wield knife'
7539 | expected:'B' | got:'D' | concept: 'wield knife'
7540 | expected:'A' | got:'C' | concept: 'cut_with knife'
7541 | expected:'A' | got:'D' | concept: 'cut_with knife'
7542 | expected:'B' | got:'B' | concept: 'cut_with knife'
7543 | expected:'D' | got:'D' | concept: 'cut_with knife'
7544 | expected:'D' | got:'D' | concept: 'hold knife'
7545 | expected:'D' | got:'D' | concept: 'hold knife'
7546 | expected:'A' | got:'A' | concept: 'hold knife'
7547 | expected:'D' | got:'D' | concept: 'hold knife'
7548 | expected:'B' | got:'B' | concept: 'hold cup'
7549 | expected:'A' | got:'A' | concept: 'hold cup'
7550 | expected:'A' | got:'A' | concept: 'hold cup'
7551 | expected:'A' | got:'A' | concept: 'hold cup'
7552 | expected:'B' | got:'B' | concept: 'kiss horse'
7553 | expected:'B' | got:'B' | concept: 'kiss horse'
7554 | expected:'C' | got:'C' | concept: 'kiss horse'
7555 | expected:'D' | got:'D' | concept: 'kiss horse'
7556 | expected:'D' | got:'D' | concept: 'hug horse'
7557 | expected:'D' | got:'D' | concept: 'hug horse'
7558 | expected:'A' | got:'A' | concept: 'hug horse'
7559 | expected:'D' | got:'D' | concept: 'hug horse'
7560 | expected:'D' | got:'D' | concept: 'hug person'
7561 | expected:'D' | got:'D' | concept: 'hug person'
7562 | expected:'C' | got:'C' | concept: 'hug person'
7563 | expected:'D' | got:'D' | concept: 'hug person'
7564 | expected:'D' | got:'D' | concept: 'jump horse'
7565 | expected:'A' | got:'A' | concept: 'jump horse'
7566 | expected:'D' | got:'D' | concept: 'jump horse'
7567 | expected:'A' | got:'A' | concept: 'jump horse'
7568 | expected:'D' | got:'C' | concept: 'sit_on_with_multiple_person bench'
7569 | expected:'D' | got:'D' | concept: 'sit_on_with_multiple_person bench'
7570 | expected:'D' | got:'D' | concept: 'sit_on_with_multiple_person bench'
7571 | expected:'B' | got:'B' | concept: 'sit_on_with_multiple_person bench'
7572 | expected:'D' | got:'D' | concept: 'sit_on bench'
7573 | expected:'D' | got:'C' | concept: 'sit_on bench'
7574 | expected:'C' | got:'C' | concept: 'sit_on bench'
7575 | expected:'D' | got:'D' | concept: 'sit_on bench'
7576 | expected:'C' | got:'C' | concept: 'lie_on bed'
7577 | expected:'D' | got:'B' | concept: 'lie_on bed'
7578 | expected:'B' | got:'B' | concept: 'lie_on bed'
7579 | expected:'B' | got:'B' | concept: 'lie_on bed'
7580 | expected:'B' | got:'B' | concept: 'lie_on bench'
7581 | expected:'D' | got:'B' | concept: 'lie_on bench'
7582 | expected:'C' | got:'C' | concept: 'lie_on bench'
7583 | expected:'B' | got:'B' | concept: 'lie_on bench'
7584 | expected:'D' | got:'A' | concept: 'hold banana'
7585 | expected:'B' | got:'B' | concept: 'hold banana'
7586 | expected:'A' | got:'A' | concept: 'hold banana'
7587 | expected:'D' | got:'D' | concept: 'hold banana'
7588 | expected:'C' | got:'C' | concept: 'drink_with cup'
7589 | expected:'D' | got:'D' | concept: 'drink_with cup'
7590 | expected:'D' | got:'D' | concept: 'drink_with cup'
7591 | expected:'C' | got:'C' | concept: 'drink_with cup'
7592 | expected:'B' | got:'A' | concept: 'hold cup'
7593 | expected:'B' | got:'A' | concept: 'hold cup'
7594 | expected:'A' | got:'B' | concept: 'hold cup'
7595 | expected:'D' | got:'C' | concept: 'hold cup'
7596 | expected:'D' | got:'D' | concept: 'hold tennis_racket'
7597 | expected:'D' | got:'D' | concept: 'hold tennis_racket'
7598 | expected:'C' | got:'C' | concept: 'hold tennis_racket'
7599 | expected:'B' | got:'B' | concept: 'hold tennis_racket'
7600 | expected:'D' | got:'D' | concept: 'greet person'
7601 | expected:'A' | got:'C' | concept: 'greet person'
7602 | expected:'D' | got:'D' | concept: 'greet person'
7603 | expected:'A' | got:'A' | concept: 'greet person'
7604 | expected:'C' | got:'C' | concept: 'hug person'
7605 | expected:'B' | got:'B' | concept: 'hug person'
7606 | expected:'A' | got:'A' | concept: 'hug person'
7607 | expected:'C' | got:'C' | concept: 'hug person'
7608 | expected:'C' | got:'C' | concept: 'hug horse'
7609 | expected:'D' | got:'D' | concept: 'hug horse'
7610 | expected:'C' | got:'C' | concept: 'hug horse'
7611 | expected:'B' | got:'B' | concept: 'hug horse'
7612 | expected:'D' | got:'D' | concept: 'kiss person'
7613 | expected:'D' | got:'D' | concept: 'kiss person'
7614 | expected:'B' | got:'B' | concept: 'kiss person'
7615 | expected:'C' | got:'C' | concept: 'kiss person'
7616 | expected:'C' | got:'C' | concept: 'release bird'
7617 | expected:'C' | got:'C' | concept: 'release bird'
7618 | expected:'B' | got:'B' | concept: 'release bird'
7619 | expected:'B' | got:'B' | concept: 'release bird'
7620 | expected:'B' | got:'B' | concept: 'read book'
7621 | expected:'A' | got:'A' | concept: 'read book'
7622 | expected:'B' | got:'B' | concept: 'read book'
7623 | expected:'D' | got:'A' | concept: 'read book'
7624 | expected:'C' | got:'C' | concept: 'point_at_camera remote'
7625 | expected:'A' | got:'A' | concept: 'point_at_camera remote'
7626 | expected:'A' | got:'A' | concept: 'point_at_camera remote'
7627 | expected:'B' | got:'B' | concept: 'point_at_camera remote'
7628 | expected:'C' | got:'C' | concept: 'hold knife'
7629 | expected:'D' | got:'D' | concept: 'hold knife'
7630 | expected:'C' | got:'D' | concept: 'hold knife'
7631 | expected:'A' | got:'A' | concept: 'hold knife'
7632 | expected:'B' | got:'B' | concept: 'hug person'
7633 | expected:'B' | got:'B' | concept: 'hug person'
7634 | expected:'B' | got:'B' | concept: 'hug person'
7635 | expected:'B' | got:'B' | concept: 'hug person'
7636 | expected:'D' | got:'D' | concept: 'ride horse'
7637 | expected:'C' | got:'C' | concept: 'ride horse'
7638 | expected:'C' | got:'C' | concept: 'ride horse'
7639 | expected:'C' | got:'C' | concept: 'ride horse'
7640 | expected:'D' | got:'D' | concept: 'hug horse'
7641 | expected:'C' | got:'C' | concept: 'hug horse'
7642 | expected:'A' | got:'B' | concept: 'hug horse'
7643 | expected:'A' | got:'C' | concept: 'hug horse'
7644 | expected:'C' | got:'C' | concept: 'kiss horse'
7645 | expected:'C' | got:'C' | concept: 'kiss horse'
7646 | expected:'A' | got:'A' | concept: 'kiss horse'
7647 | expected:'D' | got:'D' | concept: 'kiss horse'
7648 | expected:'B' | got:'B' | concept: 'kick sports_ball'
7649 | expected:'A' | got:'A' | concept: 'kick sports_ball'
7650 | expected:'D' | got:'D' | concept: 'kick sports_ball'
7651 | expected:'B' | got:'B' | concept: 'kick sports_ball'
7652 | expected:'B' | got:'B' | concept: 'hold knife'
7653 | expected:'C' | got:'C' | concept: 'hold knife'
7654 | expected:'C' | got:'C' | concept: 'hold knife'
7655 | expected:'C' | got:'A' | concept: 'hold knife'
7656 | expected:'D' | got:'D' | concept: 'hold sports_ball'
7657 | expected:'D' | got:'A' | concept: 'hold sports_ball'
7658 | expected:'B' | got:'INVALID' | concept: 'hold sports_ball'
7659 | expected:'A' | got:'A' | concept: 'hold sports_ball'
7660 | expected:'B' | got:'B' | concept: 'hold tennis_racket'
7661 | expected:'B' | got:'B' | concept: 'hold tennis_racket'
7662 | expected:'D' | got:'D' | concept: 'hold tennis_racket'
7663 | expected:'B' | got:'B' | concept: 'hold tennis_racket'
7664 | expected:'C' | got:'C' | concept: 'ride bicycle'
7665 | expected:'B' | got:'B' | concept: 'ride bicycle'
7666 | expected:'A' | got:'A' | concept: 'ride bicycle'
7667 | expected:'B' | got:'B' | concept: 'ride bicycle'
7668 | expected:'D' | got:'D' | concept: 'ride horse'
7669 | expected:'A' | got:'A' | concept: 'ride horse'
7670 | expected:'D' | got:'D' | concept: 'ride horse'
7671 | expected:'D' | got:'D' | concept: 'ride horse'
7672 | expected:'B' | got:'B' | concept: 'ride motorcycle'
7673 | expected:'C' | got:'C' | concept: 'ride motorcycle'
7674 | expected:'A' | got:'A' | concept: 'ride motorcycle'
7675 | expected:'B' | got:'B' | concept: 'ride motorcycle'
7676 | expected:'D' | got:'D' | concept: 'ride skis'
7677 | expected:'A' | got:'A' | concept: 'ride skis'
7678 | expected:'C' | got:'C' | concept: 'ride skis'
7679 | expected:'A' | got:'A' | concept: 'ride skis'
7680 | expected:'A' | got:'A' | concept: 'eat donut'
7681 | expected:'C' | got:'C' | concept: 'eat donut'
7682 | expected:'B' | got:'B' | concept: 'eat donut'
7683 | expected:'B' | got:'B' | concept: 'eat donut'
7684 | expected:'D' | got:'D' | concept: 'eat sandwich'
7685 | expected:'C' | got:'C' | concept: 'eat sandwich'
7686 | expected:'C' | got:'C' | concept: 'eat sandwich'
7687 | expected:'B' | got:'B' | concept: 'eat sandwich'
7688 | expected:'D' | got:'D' | concept: 'eat pizza'
7689 | expected:'C' | got:'C' | concept: 'eat pizza'
7690 | expected:'C' | got:'C' | concept: 'eat pizza'
7691 | expected:'D' | got:'D' | concept: 'eat pizza'
7692 | expected:'A' | got:'A' | concept: 'eat banana'
7693 | expected:'B' | got:'B' | concept: 'eat banana'
7694 | expected:'D' | got:'D' | concept: 'eat banana'
7695 | expected:'C' | got:'C' | concept: 'eat banana'
7696 | expected:'D' | got:'D' | concept: 'hold handbag'
7697 | expected:'A' | got:'A' | concept: 'hold handbag'
7698 | expected:'B' | got:'B' | concept: 'hold handbag'
7699 | expected:'D' | got:'D' | concept: 'hold handbag'
7700 | expected:'D' | got:'D' | concept: 'hold knife'
7701 | expected:'C' | got:'C' | concept: 'hold knife'
7702 | expected:'B' | got:'B' | concept: 'hold knife'
7703 | expected:'D' | got:'D' | concept: 'hold knife'
7704 | expected:'A' | got:'A' | concept: 'hold tennis_racket'
7705 | expected:'D' | got:'D' | concept: 'hold tennis_racket'
7706 | expected:'A' | got:'A' | concept: 'hold tennis_racket'
7707 | expected:'A' | got:'A' | concept: 'hold tennis_racket'
7708 | expected:'A' | got:'A' | concept: 'hold cup'
7709 | expected:'A' | got:'A' | concept: 'hold cup'
7710 | expected:'C' | got:'C' | concept: 'hold cup'
7711 | expected:'C' | got:'C' | concept: 'hold cup'
7712 | expected:'D' | got:'D' | concept: 'eat apple'
7713 | expected:'C' | got:'D' | concept: 'eat apple'
7714 | expected:'C' | got:'D' | concept: 'eat apple'
7715 | expected:'A' | got:'A' | concept: 'eat apple'
7716 | expected:'C' | got:'C' | concept: 'hold_and_about_to_eat apple'
7717 | expected:'D' | got:'D' | concept: 'hold_and_about_to_eat apple'
7718 | expected:'B' | got:'B' | concept: 'hold_and_about_to_eat apple'
7719 | expected:'D' | got:'D' | concept: 'hold_and_about_to_eat apple'
7720 | expected:'D' | got:'C' | concept: 'hold apple'
7721 | expected:'D' | got:'C' | concept: 'hold apple'
7722 | expected:'A' | got:'C' | concept: 'hold apple'
7723 | expected:'B' | got:'A' | concept: 'hold apple'
7724 | expected:'C' | got:'C' | concept: 'peel_or_cut apple'
7725 | expected:'B' | got:'B' | concept: 'peel_or_cut apple'
7726 | expected:'A' | got:'A' | concept: 'peel_or_cut apple'
7727 | expected:'A' | got:'A' | concept: 'peel_or_cut apple'
7728 | expected:'A' | got:'A' | concept: 'jump skateboard'
7729 | expected:'C' | got:'C' | concept: 'jump skateboard'
7730 | expected:'B' | got:'B' | concept: 'jump skateboard'
7731 | expected:'B' | got:'B' | concept: 'jump skateboard'
7732 | expected:'A' | got:'A' | concept: 'jump snowboard'
7733 | expected:'C' | got:'C' | concept: 'jump snowboard'
7734 | expected:'A' | got:'A' | concept: 'jump snowboard'
7735 | expected:'B' | got:'B' | concept: 'jump snowboard'
7736 | expected:'A' | got:'A' | concept: 'jump horse'
7737 | expected:'B' | got:'B' | concept: 'jump horse'
7738 | expected:'D' | got:'D' | concept: 'jump horse'
7739 | expected:'C' | got:'C' | concept: 'jump horse'
7740 | expected:'A' | got:'A' | concept: 'jump motorcycle'
7741 | expected:'C' | got:'C' | concept: 'jump motorcycle'
7742 | expected:'C' | got:'C' | concept: 'jump motorcycle'
7743 | expected:'C' | got:'C' | concept: 'jump motorcycle'
7744 | expected:'C' | got:'C' | concept: 'jump skateboard'
7745 | expected:'A' | got:'A' | concept: 'jump skateboard'
7746 | expected:'A' | got:'A' | concept: 'jump skateboard'
7747 | expected:'B' | got:'A' | concept: 'jump skateboard'
7748 | expected:'D' | got:'B' | concept: 'grind skateboard'
7749 | expected:'C' | got:'C' | concept: 'grind skateboard'
7750 | expected:'A' | got:'B' | concept: 'grind skateboard'
7751 | expected:'B' | got:'B' | concept: 'grind skateboard'
7752 | expected:'D' | got:'D' | concept: 'hold skateboard'
7753 | expected:'C' | got:'C' | concept: 'hold skateboard'
7754 | expected:'C' | got:'C' | concept: 'hold skateboard'
7755 | expected:'C' | got:'C' | concept: 'hold skateboard'
7756 | expected:'C' | got:'D' | concept: 'ride skateboard'
7757 | expected:'A' | got:'A' | concept: 'ride skateboard'
7758 | expected:'B' | got:'B' | concept: 'ride skateboard'
7759 | expected:'A' | got:'A' | concept: 'ride skateboard'
7760 | expected:'A' | got:'B' | concept: 'eat apple'
7761 | expected:'B' | got:'C' | concept: 'eat apple'
7762 | expected:'D' | got:'C' | concept: 'eat apple'
7763 | expected:'D' | got:'A' | concept: 'eat apple'
7764 | expected:'D' | got:'D' | concept: 'hold_and_about_to_eat apple'
7765 | expected:'A' | got:'A' | concept: 'hold_and_about_to_eat apple'
7766 | expected:'B' | got:'B' | concept: 'hold_and_about_to_eat apple'
7767 | expected:'B' | got:'A' | concept: 'hold_and_about_to_eat apple'
7768 | expected:'A' | got:'D' | concept: 'hold apple'
7769 | expected:'D' | got:'B' | concept: 'hold apple'
7770 | expected:'D' | got:'A' | concept: 'hold apple'
7771 | expected:'A' | got:'C' | concept: 'hold apple'
7772 | expected:'C' | got:'D' | concept: 'peel_or_cut apple'
7773 | expected:'C' | got:'C' | concept: 'peel_or_cut apple'
7774 | expected:'C' | got:'C' | concept: 'peel_or_cut apple'
7775 | expected:'D' | got:'A' | concept: 'peel_or_cut apple'
7776 | expected:'C' | got:'A' | concept: 'hold apple'
7777 | expected:'B' | got:'B' | concept: 'hold apple'
7778 | expected:'B' | got:'D' | concept: 'hold apple'
7779 | expected:'B' | got:'B' | concept: 'hold apple'
7780 | expected:'D' | got:'D' | concept: 'hold remote'
7781 | expected:'C' | got:'C' | concept: 'hold remote'
7782 | expected:'B' | got:'B' | concept: 'hold remote'
7783 | expected:'A' | got:'A' | concept: 'hold remote'
7784 | expected:'A' | got:'C' | concept: 'point_at_camera remote'
7785 | expected:'D' | got:'A' | concept: 'point_at_camera remote'
7786 | expected:'C' | got:'D' | concept: 'point_at_camera remote'
7787 | expected:'C' | got:'C' | concept: 'point_at_camera remote'
7788 | expected:'C' | got:'C' | concept: 'hold handbag'
7789 | expected:'A' | got:'A' | concept: 'hold handbag'
7790 | expected:'D' | got:'A' | concept: 'hold handbag'
7791 | expected:'C' | got:'C' | concept: 'hold handbag'
7792 | expected:'C' | got:'C' | concept: 'drink_with cup'
7793 | expected:'D' | got:'D' | concept: 'drink_with cup'
7794 | expected:'C' | got:'C' | concept: 'drink_with cup'
7795 | expected:'D' | got:'C' | concept: 'drink_with cup'
7796 | expected:'A' | got:'A' | concept: 'hold cup'
7797 | expected:'D' | got:'C' | concept: 'hold cup'
7798 | expected:'A' | got:'C' | concept: 'hold cup'
7799 | expected:'A' | got:'C' | concept: 'hold cup'
7800 | expected:'B' | got:'B' | concept: 'hold dog'
7801 | expected:'C' | got:'C' | concept: 'hold dog'
7802 | expected:'A' | got:'A' | concept: 'hold dog'
7803 | expected:'C' | got:'C' | concept: 'hold dog'
7804 | expected:'B' | got:'B' | concept: 'hold wine_glass'
7805 | expected:'B' | got:'B' | concept: 'hold wine_glass'
7806 | expected:'A' | got:'C' | concept: 'hold wine_glass'
7807 | expected:'A' | got:'A' | concept: 'hold wine_glass'
7808 | expected:'A' | got:'A' | concept: 'hold tennis_racket'
7809 | expected:'A' | got:'A' | concept: 'hold tennis_racket'
7810 | expected:'A' | got:'A' | concept: 'hold tennis_racket'
7811 | expected:'A' | got:'A' | concept: 'hold tennis_racket'
7812 | expected:'A' | got:'B' | concept: 'hold wine_glass'
7813 | expected:'D' | got:'B' | concept: 'hold wine_glass'
7814 | expected:'B' | got:'B' | concept: 'hold wine_glass'
7815 | expected:'A' | got:'A' | concept: 'hold wine_glass'
7816 | expected:'A' | got:'A' | concept: 'hold orange'
7817 | expected:'B' | got:'B' | concept: 'hold orange'
7818 | expected:'C' | got:'C' | concept: 'hold orange'
7819 | expected:'B' | got:'B' | concept: 'hold orange'
7820 | expected:'A' | got:'C' | concept: 'toast wine_glass'
7821 | expected:'A' | got:'A' | concept: 'toast wine_glass'
7822 | expected:'C' | got:'C' | concept: 'toast wine_glass'
7823 | expected:'B' | got:'B' | concept: 'toast wine_glass'
7824 | expected:'C' | got:'C' | concept: 'ride horse'
7825 | expected:'C' | got:'C' | concept: 'ride horse'
7826 | expected:'B' | got:'B' | concept: 'ride horse'
7827 | expected:'A' | got:'A' | concept: 'ride horse'
7828 | expected:'B' | got:'B' | concept: 'ride elephant'
7829 | expected:'D' | got:'D' | concept: 'ride elephant'
7830 | expected:'D' | got:'D' | concept: 'ride elephant'
7831 | expected:'C' | got:'C' | concept: 'ride elephant'
7832 | expected:'C' | got:'C' | concept: 'ride skis'
7833 | expected:'D' | got:'D' | concept: 'ride skis'
7834 | expected:'A' | got:'A' | concept: 'ride skis'
7835 | expected:'A' | got:'A' | concept: 'ride skis'
7836 | expected:'B' | got:'B' | concept: 'ride bicycle'
7837 | expected:'C' | got:'C' | concept: 'ride bicycle'
7838 | expected:'D' | got:'D' | concept: 'ride bicycle'
7839 | expected:'B' | got:'B' | concept: 'ride bicycle'
7840 | expected:'D' | got:'A' | concept: 'hold apple'
7841 | expected:'A' | got:'A' | concept: 'hold apple'
7842 | expected:'C' | got:'A' | concept: 'hold apple'
7843 | expected:'B' | got:'D' | concept: 'hold apple'
7844 | expected:'B' | got:'D' | concept: 'eat apple'
7845 | expected:'A' | got:'D' | concept: 'eat apple'
7846 | expected:'B' | got:'D' | concept: 'eat apple'
7847 | expected:'A' | got:'D' | concept: 'eat apple'
7848 | expected:'D' | got:'D' | concept: 'hold_and_about_to_eat apple'
7849 | expected:'D' | got:'D' | concept: 'hold_and_about_to_eat apple'
7850 | expected:'B' | got:'B' | concept: 'hold_and_about_to_eat apple'
7851 | expected:'B' | got:'B' | concept: 'hold_and_about_to_eat apple'
7852 | expected:'B' | got:'D' | concept: 'peel_or_cut apple'
7853 | expected:'A' | got:'A' | concept: 'peel_or_cut apple'
7854 | expected:'B' | got:'B' | concept: 'peel_or_cut apple'
7855 | expected:'B' | got:'B' | concept: 'peel_or_cut apple'
7856 | expected:'B' | got:'A' | concept: 'read laptop'
7857 | expected:'D' | got:'C' | concept: 'read laptop'
7858 | expected:'C' | got:'D' | concept: 'read laptop'
7859 | expected:'B' | got:'A' | concept: 'read laptop'
7860 | expected:'D' | got:'A' | concept: 'read book'
7861 | expected:'C' | got:'C' | concept: 'read book'
7862 | expected:'B' | got:'B' | concept: 'read book'
7863 | expected:'A' | got:'A' | concept: 'read book'
7864 | expected:'C' | got:'C' | concept: 'type_on laptop'
7865 | expected:'B' | got:'B' | concept: 'type_on laptop'
7866 | expected:'D' | got:'A' | concept: 'type_on laptop'
7867 | expected:'A' | got:'A' | concept: 'type_on laptop'
7868 | expected:'A' | got:'A' | concept: 'type_on keyboard'
7869 | expected:'B' | got:'B' | concept: 'type_on keyboard'
7870 | expected:'A' | got:'A' | concept: 'type_on keyboard'
7871 | expected:'A' | got:'A' | concept: 'type_on keyboard'
7872 | expected:'C' | got:'C' | concept: 'jump horse'
7873 | expected:'A' | got:'D' | concept: 'jump horse'
7874 | expected:'D' | got:'D' | concept: 'jump horse'
7875 | expected:'C' | got:'C' | concept: 'jump horse'
7876 | expected:'A' | got:'A' | concept: 'jump skateboard'
7877 | expected:'A' | got:'A' | concept: 'jump skateboard'
7878 | expected:'C' | got:'C' | concept: 'jump skateboard'
7879 | expected:'C' | got:'C' | concept: 'jump skateboard'
7880 | expected:'D' | got:'D' | concept: 'hold skateboard'
7881 | expected:'B' | got:'B' | concept: 'hold skateboard'
7882 | expected:'C' | got:'C' | concept: 'hold skateboard'
7883 | expected:'B' | got:'B' | concept: 'hold skateboard'
7884 | expected:'A' | got:'C' | concept: 'grind skateboard'
7885 | expected:'C' | got:'C' | concept: 'grind skateboard'
7886 | expected:'A' | got:'A' | concept: 'grind skateboard'
7887 | expected:'A' | got:'D' | concept: 'grind skateboard'
7888 | expected:'D' | got:'A' | concept: 'inspect motorcycle'
7889 | expected:'C' | got:'C' | concept: 'inspect motorcycle'
7890 | expected:'D' | got:'D' | concept: 'inspect motorcycle'
7891 | expected:'D' | got:'D' | concept: 'inspect motorcycle'
7892 | expected:'B' | got:'C' | concept: 'wash motorcycle'
7893 | expected:'D' | got:'D' | concept: 'wash motorcycle'
7894 | expected:'B' | got:'B' | concept: 'wash motorcycle'
7895 | expected:'C' | got:'C' | concept: 'wash motorcycle'
7896 | expected:'D' | got:'D' | concept: 'ride motorcycle'
7897 | expected:'A' | got:'A' | concept: 'ride motorcycle'
7898 | expected:'D' | got:'D' | concept: 'ride motorcycle'
7899 | expected:'A' | got:'A' | concept: 'ride motorcycle'
7900 | expected:'B' | got:'B' | concept: 'straddle motorcycle'
7901 | expected:'A' | got:'B' | concept: 'straddle motorcycle'
7902 | expected:'C' | got:'C' | concept: 'straddle motorcycle'
7903 | expected:'C' | got:'B' | concept: 'straddle motorcycle'
7904 | expected:'D' | got:'D' | concept: 'hold skateboard'
7905 | expected:'B' | got:'B' | concept: 'hold skateboard'
7906 | expected:'A' | got:'A' | concept: 'hold skateboard'
7907 | expected:'C' | got:'C' | concept: 'hold skateboard'
7908 | expected:'C' | got:'C' | concept: 'hold dog'
7909 | expected:'A' | got:'A' | concept: 'hold dog'
7910 | expected:'B' | got:'B' | concept: 'hold dog'
7911 | expected:'C' | got:'C' | concept: 'hold dog'
7912 | expected:'A' | got:'INVALID' | concept: 'hold sports_ball'
7913 | expected:'D' | got:'D' | concept: 'hold sports_ball'
7914 | expected:'B' | got:'D' | concept: 'hold sports_ball'
7915 | expected:'D' | got:'D' | concept: 'hold sports_ball'
7916 | expected:'B' | got:'B' | concept: 'hold book'
7917 | expected:'C' | got:'C' | concept: 'hold book'
7918 | expected:'C' | got:'C' | concept: 'hold book'
7919 | expected:'D' | got:'D' | concept: 'hold book'
7920 | expected:'B' | got:'A' | concept: 'hold book'
7921 | expected:'D' | got:'D' | concept: 'hold book'
7922 | expected:'B' | got:'A' | concept: 'hold book'
7923 | expected:'D' | got:'D' | concept: 'hold book'
7924 | expected:'B' | got:'B' | concept: 'type_on laptop'
7925 | expected:'A' | got:'A' | concept: 'type_on laptop'
7926 | expected:'D' | got:'D' | concept: 'type_on laptop'
7927 | expected:'B' | got:'B' | concept: 'type_on laptop'
7928 | expected:'D' | got:'A' | concept: 'read book'
7929 | expected:'C' | got:'A' | concept: 'read book'
7930 | expected:'B' | got:'B' | concept: 'read book'
7931 | expected:'B' | got:'B' | concept: 'read book'
7932 | expected:'D' | got:'B' | concept: 'read laptop'
7933 | expected:'B' | got:'A' | concept: 'read laptop'
7934 | expected:'A' | got:'A' | concept: 'read laptop'
7935 | expected:'D' | got:'A' | concept: 'read laptop'
7936 | expected:'D' | got:'D' | concept: 'hold sports_ball'
7937 | expected:'D' | got:'A' | concept: 'hold sports_ball'
7938 | expected:'A' | got:'A' | concept: 'hold sports_ball'
7939 | expected:'C' | got:'C' | concept: 'hold sports_ball'
7940 | expected:'B' | got:'B' | concept: 'hold apple'
7941 | expected:'B' | got:'C' | concept: 'hold apple'
7942 | expected:'C' | got:'C' | concept: 'hold apple'
7943 | expected:'D' | got:'A' | concept: 'hold apple'
7944 | expected:'A' | got:'A' | concept: 'hold wine_glass'
7945 | expected:'C' | got:'C' | concept: 'hold wine_glass'
7946 | expected:'B' | got:'B' | concept: 'hold wine_glass'
7947 | expected:'B' | got:'B' | concept: 'hold wine_glass'
7948 | expected:'A' | got:'A' | concept: 'peel_or_cut apple'
7949 | expected:'D' | got:'D' | concept: 'peel_or_cut apple'
7950 | expected:'B' | got:'B' | concept: 'peel_or_cut apple'
7951 | expected:'A' | got:'B' | concept: 'peel_or_cut apple'
7952 | expected:'C' | got:'C' | concept: 'wear tie'
7953 | expected:'C' | got:'C' | concept: 'wear tie'
7954 | expected:'A' | got:'C' | concept: 'wear tie'
7955 | expected:'A' | got:'C' | concept: 'wear tie'
7956 | expected:'C' | got:'C' | concept: 'wear backpack'
7957 | expected:'C' | got:'C' | concept: 'wear backpack'
7958 | expected:'D' | got:'D' | concept: 'wear backpack'
7959 | expected:'C' | got:'B' | concept: 'wear backpack'
7960 | expected:'D' | got:'A' | concept: 'adjust_or_tie tie'
7961 | expected:'C' | got:'C' | concept: 'adjust_or_tie tie'
7962 | expected:'B' | got:'B' | concept: 'adjust_or_tie tie'
7963 | expected:'B' | got:'B' | concept: 'adjust_or_tie tie'
7964 | expected:'B' | got:'B' | concept: 'jump horse'
7965 | expected:'B' | got:'B' | concept: 'jump horse'
7966 | expected:'A' | got:'A' | concept: 'jump horse'
7967 | expected:'B' | got:'B' | concept: 'jump horse'
7968 | expected:'A' | got:'A' | concept: 'jump motorcycle'
7969 | expected:'A' | got:'D' | concept: 'jump motorcycle'
7970 | expected:'B' | got:'C' | concept: 'jump motorcycle'
7971 | expected:'C' | got:'C' | concept: 'jump motorcycle'
7972 | expected:'C' | got:'C' | concept: 'ride motorcycle'
7973 | expected:'B' | got:'C' | concept: 'ride motorcycle'
7974 | expected:'B' | got:'C' | concept: 'ride motorcycle'
7975 | expected:'A' | got:'A' | concept: 'ride motorcycle'
7976 | expected:'B' | got:'D' | concept: 'straddle motorcycle'
7977 | expected:'C' | got:'C' | concept: 'straddle motorcycle'
7978 | expected:'A' | got:'A' | concept: 'straddle motorcycle'
7979 | expected:'B' | got:'B' | concept: 'straddle motorcycle'
7980 | expected:'D' | got:'D' | concept: 'turn motorcycle'
7981 | expected:'B' | got:'C' | concept: 'turn motorcycle'
7982 | expected:'A' | got:'D' | concept: 'turn motorcycle'
7983 | expected:'A' | got:'D' | concept: 'turn motorcycle'
7984 | expected:'D' | got:'C' | concept: 'jump skateboard'
7985 | expected:'D' | got:'D' | concept: 'jump skateboard'
7986 | expected:'C' | got:'C' | concept: 'jump skateboard'
7987 | expected:'D' | got:'D' | concept: 'jump skateboard'
7988 | expected:'C' | got:'C' | concept: 'hold skateboard'
7989 | expected:'B' | got:'B' | concept: 'hold skateboard'
7990 | expected:'D' | got:'D' | concept: 'hold skateboard'
7991 | expected:'A' | got:'B' | concept: 'hold skateboard'
7992 | expected:'C' | got:'C' | concept: 'grind skateboard'
7993 | expected:'B' | got:'B' | concept: 'grind skateboard'
7994 | expected:'B' | got:'B' | concept: 'grind skateboard'
7995 | expected:'C' | got:'C' | concept: 'grind skateboard'
7996 | expected:'B' | got:'A' | concept: 'ride skateboard'
7997 | expected:'C' | got:'A' | concept: 'ride skateboard'
7998 | expected:'B' | got:'D' | concept: 'ride skateboard'
7999 | expected:'A' | got:'A' | concept: 'ride skateboard'
---------------------------------------
Summary:
  Total: 8000
  Correct: 6290
  Incorrect: 1683
  Invalid/Parse Error: 27
  Processing Error: 0
  Accuracy (Correct / [Correct + Incorrect]): 78.89%
---------------------------------------

